c - 使用 cuda Throw::max_element 查找数组中的最大元素有时返回不正确-6ren

c - 使用 cuda Throw::max_element 查找数组中的最大元素有时返回不正确

转载作者：行者123 更新时间：2023-11-30 19:18:02

25

4

我有一个 2^20 元素数组正在设备上填充；这些数字每次都应该相同。然后，我将该数组移至主机，然后搜索数组中的最大元素，此技术适用于 2^10 元素数组，但一旦我开始获得大于该值的值，我开始得到随机答案，不确定推力是否为弄乱或设备计算。

max_element 应该返回的答案是 0.094479，通常程序第一次运行时代码会输出正确的答案，然后答案会每隔几次随机显示

GPU是运行5.0的tesla k20，也在780GTX上进行了测试；两次都是同样的问题

//Host Code
int main( void ) {
    float h_c[TOTAL];
    float *d_c;

    cudaMalloc((void**)&d_c, sizeof(float)*TOTAL);

    cudaEvent_t start, stop;
    cudaEventCreate(&start);
    cudaEventCreate(&stop);
    cudaEventRecord(start);

    //Number of threads
    kernel<<<BLOCKS,THREADS>>>(d_c);

    cudaEventRecord(stop);
    cudaEventSynchronize(stop);
    float mil = 0;
    cudaEventElapsedTime(&mil, start, stop);

    cudaMemcpy(h_c, d_c, sizeof(float)*TOTAL, cudaMemcpyDeviceToHost);

    for(int y = 0; y < TOTAL; y++){
        printf(" %d: Host C: %f \n",y, h_c[y]);
    }
    float *result = thrust::max_element(h_c, h_c + TOTAL);
    printf("Max is: %f \n", *result);
    printf("Time:  %f \n", mil/1000);
    printf("THREADS:  %d \n", THREADS);
    printf("BLOCKS:  %d \n", BLOCKS);
    printf("TOTAL:  %d \n", TOTAL);
    cudaFree(d_c);
    cudaDeviceReset() ;
    return 0;
}

设备代码

#include <thrust/extrema.h>
#include <math.h>
#include <stdio.h>

#define ARRAYSIZE 15
#define THREADS 1024
#define BLOCKS 32
#define TOTAL THREADS * BLOCKS 

__global__ void kernel(float *cc){

//Get thread for summing all elements 
int threadId = threadIdx.x + blockDim.x * blockIdx.x;

int decimalNumber,quotient;
//Size of the array
//const int size = 10;
//Holds the binary number in an array
int binaryNumber[ARRAYSIZE];
int i = 0;


int a[ARRAYSIZE] = {1192, 1315, 1462, 1484, 1476, 1443, 1508, 1489, 1470, 1573, 1633, 1539, 1600, 1707, 1701};//, 1682, 1688, 1681, 1694, 1728};
int b[ARRAYSIZE] = {1162, 1337, 1282, 1491, 1508, 1517, 1488, 1513, 1539, 1576, 1626 ,1634, 1573,    1786, 1741};//, 1782, 1755, 1669, 1700, 1826};

//Holds Product from the dot product
int c[ARRAYSIZE];
//Arrays to hold integers to be summed 
int aSumArr[ARRAYSIZE];
int bSumArr[ARRAYSIZE];

for(int i = 0; i < ARRAYSIZE; i++){
    c[i] = 0;
    aSumArr[i] = 0;
    bSumArr[i] = 0;
}

//Holds the value for the dot product
int dotSum = 0;
//Holds sum of valid array positions for array a
int aSum = 0;
//Holds sum of valid array positions for array b
int bSum = 0;

//Holds the Value of the arcCos of the dot product / sqrt(array a) * sqrt(array b)
float finalValue = 0;
//printf("ThreadID: %d \n", threadId);
//ALL 1's 1048575 = Threads
decimalNumber = threadId;
//printf("decimal number:  %d \n", decimalNumber); 

quotient = decimalNumber;
//Loop to convert decimal into binary and store in array
while(quotient!=0){

    binaryNumber[i++]= quotient % 2;

    quotient = quotient / 2;

}

//Test if conversion from decimal to binary is complete and correct
//printf("Equivalent binary value of decimal number %d: \n",decimalNumber);

//for(int in = size-1; in >= 0;in--){
  //printf("Index: %d | binary number:  %d ----  a:%d || b: %d\n",in,binaryNumber[in],a[in],b[in]);
//}
//printf(" \n ");

//Loop through binaryNumber array
for(int x = ARRAYSIZE-1 ; x >= 0; x--){
    //If index is == 1 Perform calculation
    if(binaryNumber[x] == 1){
        //Multiply numbers at good index
        c[x] = a[x] * b[x];
        //Fill sum arrays at correct index
        aSumArr[x] = a[x];
        bSumArr[x] = b[x];

        //Checks if the loop is executing correctly
        //sumArray[x] = 1;
        //printf("Multiplied - %d * %d = %f\n", a[x], b[x], c[x]);
        //printf("--This should not be run --\n");
    }else{
//          printf("SKIPPED - %d * %d = %f\n", a[x], b[x], c[x]);
    }


}

//Sums up the product array to complete dot product
for(int j = 0; j < ARRAYSIZE; ++j){
    dotSum += c[j];
    //printf("aSumArr %d \n", aSumArr[j]);
    //printf("bSumArr %d \n", bSumArr[j]);
    aSum += powf( aSumArr[j], 2 );
    bSum += powf( bSumArr[j], 2 );
//      printf("aSum: %d +  aSumArr %d \n", aSum, aSumArr[j]);
//      printf("bSum: %d +  bSumArr %d \n", bSum, bSumArr[j]);
}


//printf("\n");
//Print out the dot prudct
//printf("Dot product is: %d \n", dotSum);
//printf("aSum is: %d \n", aSum);
//printf("bSum is: %d \n", bSum);

float sqSum1 = sqrtf(aSum);
float sqSum2 = sqrtf(bSum);
// printf("sqSum1: %f \n", sqSum1);
// printf("sqSum2: %f \n", sqSum2);
float sqSum = sqSum1 * sqSum2;
// printf("sqSum %f \n", sqSum);     
float div = dotSum / sqSum ;
// printf("div: %f \n", div);
finalValue = acosf( div ) ;

//Stores the threads final value in array cc, in the respected index
if(finalValue == finalValue){
    cc[threadId] = finalValue;
}else{
    cc[threadId] = -2;
}
//printf("final value is: %f for number %d \n", finalValue, threadId);
}

最佳答案

这似乎是使用了不正确初始化/未初始化变量的情况。

添加以下行后:

for(int i = 0; i < ARRAYSIZE; i++){
    c[i] = 0;
    aSumArr[i] = 0;
    bSumArr[i] = 0;
    binaryNumber[i] = 0; // add this line
}

我无法再重现该问题。

关于c - 使用 cuda Throw::max_element 查找数组中的最大元素有时返回不正确，我们在Stack Overflow上找到一个类似的问题： https://stackoverflow.com/questions/27238084/

25

4

0

文章推荐： javascript - Trigger使用通配符部署云函数失败

文章推荐： c# - 使用转换后的 VB 到 C# 代码

文章推荐： c# - 从 C# 方法返回方法

文章推荐： c# - 在 EnvDTE 中调试时捕获 VS 局部变量

c# - 什么会导致 throw 重置调用堆栈(我使用的是 "throw"，而不是 "throw ex")
我一直认为“throw”和“throw ex”的区别was that throw alone wasn't resetting the stacktrace of the exception. 不幸的
ios - 从 '(_) throws -> ()'类型的 throw 函数无效转换为 '(Response) -> Void'类型的非 throw 函数
我需要处理这样的api错误代码，并为某些状态代码抛出错误。但是遵循代码显示了以上错误。我怎样才能做到这一点？ func login(data: [String: Any], completion: @
javascript - `throw ' foo '`, ` throw Error ('foo' )`, ` throw new Error ('foo' )` 有什么区别？
我见过在 JavaScript 中抛出错误的 3 种不同方式: throw 'message'; throw Error('message'); throw new Error('message');
java - 异常处理中的 Throws 和 Throw
这个问题在这里已经有了答案: Exception handling : throw, throws and Throwable (8 个答案) 关闭 10 年前。谁能简单介绍一下Java异常处理中
ios - 错误 : Invalid conversion from throwing function of type '(_) throws -> ()' to non-throwing function type '(DataSnapshot) -> Void'
这是我的代码: func loadData() { ref.child(currentUserID!).observe(.childAdded) { (snapshot) in
flutter - Dart throw 和重新 throw 有什么区别？
可能很明显，但是我仍然无法理解throw和rethrow之间的区别，什么时候应该使用它们中的任何一个？最佳答案根据Effective Dart: If you decide to rethrow
Scala 函数式编程 : Should I use 'throw' or 'throw new' ?
这个问题在这里已经有了答案: "new" keyword in Scala (3 个答案) 关闭 5 年前。在 Scala 中进行一些函数式编程，并且来自 Java 背景，我倾向于像这样抛出异常:
java - 如何避免使用多个 throw 语句并仅使用一个带有所需错误消息的通用 throw 语句
我有一个验证输入字符串的代码，如果输入字符串与所需的格式不匹配，我需要抛出 IllegalArgumentException，有多个字段，每个字段都有一组不同的验证条件，因此对于当前我正在执行的每个字
java - 我应该在使用 throw 的同时使用 throws 吗？
我的方法有一个抛出 NullPointerException 的返回类型。 public class Student { public String studentOne() {
c# - "throw"和 "throw ex"之间有区别吗？
有些帖子询问这两者之间的区别。 (为什么我要提这个...) 但我的问题在某种程度上有所不同，我在另一个错误神级处理方法中调用了“throw ex”。 public class Program {
java - 异常处理 : throw, throws 和 Throwable
谁能解释一下 throw、throws 和 Throwable 之间的区别以及何时使用哪个？最佳答案 throws :在编写方法时使用，声明有问题的方法抛出了指定的(检查的)异常。与检查的异常相反
c++ - "throw MyException()"和 "throw (MyException())"之间有区别吗？
我想知道编写异常收件箱和发件箱是否会改变特定程序的行为，例如抛出 MyException(); 和抛出(我的异常())；我的代码: #include #include using names
c# - 为什么C#有一个单独的重新抛出语句( throw; )而不是重载 throw ex ？
抛出异常时，保留堆栈跟踪是最常见的期望行为，在 Java 中，这可以通过 throw ex; 获得，但在 C# 中，throw; 必须使用。 (另请注意，许多 C# 程序员经常错误地使用 throw
java - Java 中 throw 和 throws 的区别？
这个问题在这里已经有了答案: Exception handling : throw, throws and Throwable (8 个答案) 关闭 8 年前。谁能举个例子说清楚Java异常处理中
java - throws Throwable 和 throws Exception 有什么区别
这两个有什么区别吗？最佳答案异常是针对程序逻辑中的错误。 JVM 使用错误来表示环境有问题，例如 OutOfMemoryError 或 IncompatibleClassChangeError。
node.js - Mongoose {严格: throw} doesn't throw error
我试图到处寻找这个问题的答案，但似乎我运气不好。我有一个非常简单的 Mongoose 模型 var userObject = { profile: { username: {
java - "throw(e)"和 "throw e"之间的区别？
我遇到了这个重新抛出的异常，我很惊讶它甚至可以编译。 } catch(SomeException e) { ... throw(e); } 这个throw()和平时用的有什么区别吗？.
c++ - throw 和 throw 与捕获异常的 arg 有什么区别？
想象两段相似的代码: try { [...] } catch (myErr &err) { err.append("More info added to error..."); throw
java - Java 中方法签名中的 Throw 和 Throw 语句之间的区别
我试图弄清楚Java中方法签名中的抛出和抛出语句之间的区别。方法签名中的抛出如下: public void aMethod() throws IOException{ FileReader f
javascript - `throw new Error` 和 `throw Error` 之间的区别？
这个问题在这里已经有了答案: throw Error('msg') vs throw new Error('msg') (2 个回答) 24 天前关闭。没有 new 时抛出错误有什么缺点吗？关键词？

首页

博学

6Ren·AI

商城

c - 使用 cuda Throw::max_element 查找数组中的最大元素有时返回不正确