c++ - 在 Debug模式下，所有程序运行良好，但在 Release模式下，我的 cudaMalloc 操作出现错误-6ren

c++ - 在 Debug模式下，所有程序运行良好，但在 Release模式下，我的 cudaMalloc 操作出现错误

转载作者：行者123 更新时间：2023-11-30 20:03:28

在debug模式下程序运行良好，但在Release模式下memcpy操作出现错误

 CellBot *hCellList;
        CellBot *dCellList;
        // Size in bytes of the whole cell array; used for the host buffer, the
        // device buffer and both copies below.
        size_t CellSize = WorldConst.numberOfCells * sizeof(CellBot);
        // NOTE(review): the malloc call is written inside the assert() argument.
        // When assert() is disabled (NDEBUG defined, the usual Release setting)
        // the argument is not evaluated, so hCellList is never assigned.
        assert(!((hCellList = (CellBot *)malloc(CellSize)) == NULL));
        gpuAssert(cudaMalloc((void**)&dCellList, CellSize));


        // Stage the cells in the host buffer, then upload that buffer to the device.
        ::memcpy(hCellList, CellList.data(), CellSize);
        gpuAssert(cudaMemcpy(dCellList, hCellList, CellSize, cudaMemcpyHostToDevice));

我对此毫无头绪。我一直在 Debug 模式下开发，直到决定构建 Release 版本时才出现这个错误。程序停在这行代码上:

::memcpy(hCellList, CellList.data(), CellSize);

OgreCu_0.01.exe 中的 0x00007FFB9820C447 (vcruntime140.dll) 抛出异常:0xC0000005:访问冲突写入位置 0x0000000000000000。

Visual Studio 在 memcpy.asm 中标出了出错的那一行（即下面用 ** 括起来的那一行）:

 CopyUp:
        cmp     r8, 128
        jbe     XmmCopySmall

        bt      __favor, __FAVOR_ENFSTRG ; check for ENFSTRG (enhanced fast strings)
        jnc     XmmCopyUp               ; If Enhanced Fast String not available, use XMM

        ; use Enhanced Fast Strings
        ; but first align the destination dst to 16 byte alignment
        mov     rax, r11                ; return original destination pointer
        mov     r11, rdi                ; save rdi in r11
        mov     rdi, rcx                ; move destination pointer to rdi
        mov     rcx, r8                 ; move length to rcx
        mov     r8, rsi                 ; save rsi in r8
        mov     rsi, r10                ; move source pointer to rsi
        **rep     movsb                   ; copy source to destination buffer**
        mov     rsi, r8                 ; restore rsi
        mov     rdi, r11                ; restore rdi
        ret

我把 ::memcpy(hCellList, CellList.data(), CellSize); 改成了:

// Element-by-element replacement for the memcpy call: copies
// WorldConst.numberOfCells entries from CellList into hCellList.
// It writes through the same hCellList pointer as the memcpy version.
for (int e = 0; e < WorldConst.numberOfCells; e++)
    {
        hCellList[e] = CellList[e];
    }

结果在 hCellList[e] = CellList[e]; 这一行出现了同样的错误。

CellBot的结构

// Per-cell record.
// Arrays of CellBot are sized with sizeof(CellBot) and copied as raw bytes
// (memcpy on the host, cudaMemcpy to the device), so the members are kept in
// their original declaration order.
// NOTE(review): the meaning of each field is only suggested by its name - confirm with the simulation code.
struct CellBot
{
    // Integer identifiers.
    int mainId, subId;

    // Vec3-valued members.
    Vec3 coord, speed, nspeed, velocity, nvelocity;

    // Scalar radii.
    float radiusView, radiusAttraction, radiusRepulsion;

    // Scalar force terms.
    float forceAttraction, forceRepulsion;

    // Remaining scalar properties.
    float radius, mass, frictionBounce;

    // Integer tags.
    int colorId, groupId;

};

Vec3:

// Three-component vector template callable from host and device code.
//
// The components are the public members x, y, z (declared together at the end
// of the class). VEC3_VALIDATE() is a macro defined outside this snippet; every
// member that writes the components invokes it after the write.
// NOTE(review): presumably VEC3_VALIDATE() is a debug sanity check of x/y/z - confirm against its definition.
template <typename T=float>
class XVector3
{
public:

    typedef T value_type;

    // Zero vector.
    __host__ __device__ inline XVector3() : x(0.0f), y(0.0f), z(0.0f) {}
    // All three components set to the same scalar.
    __host__ __device__ inline XVector3(T a) : x(a), y(a), z(a) {}
    // Components read from p[0], p[1], p[2].
    __host__ __device__ inline XVector3(const T* p) : x(p[0]), y(p[1]), z(p[2]) {}
    // Explicit components; validated once they are stored.
    __host__ __device__ inline XVector3(T x_, T y_, T z_) : x(x_), y(y_), z(z_)
    {
        VEC3_VALIDATE();
    }

    // Implicit conversions that return the address of the x member.
    __host__ __device__ inline operator T* () { return &x; }
    __host__ __device__ inline operator const T* () const { return &x; }

    // Overwrites all three components. Validation runs after the assignment so
    // that it sees the new values, as in the constructor and the compound
    // operators (previously it ran before the assignment).
    __host__ __device__ inline void Set(T x_, T y_, T z_) { x = x_; y = y_; z = z_; VEC3_VALIDATE(); }

    // Binary operators: copy *this, apply the matching compound assignment and
    // return the copy. The compound assignment already calls VEC3_VALIDATE(),
    // so the unreachable call that used to follow each return was dropped.
    __host__ __device__ inline XVector3<T> operator * (T scale) const { XVector3<T> r(*this); r *= scale; return r; }
    __host__ __device__ inline XVector3<T> operator / (T scale) const { XVector3<T> r(*this); r /= scale; return r; }
    __host__ __device__ inline XVector3<T> operator + (const XVector3<T>& v) const { XVector3<T> r(*this); r += v; return r; }
    __host__ __device__ inline XVector3<T> operator - (const XVector3<T>& v) const { XVector3<T> r(*this); r -= v; return r; }
    __host__ __device__ inline XVector3<T> operator /(const XVector3<T>& v) const { XVector3<T> r(*this); r /= v; return r; }
    __host__ __device__ inline XVector3<T> operator *(const XVector3<T>& v) const { XVector3<T> r(*this); r *= v; return r; }

    // Compound assignments: update the components in place, validate, return *this.
    __host__ __device__ inline XVector3<T>& operator *=(T scale) {x *= scale; y *= scale; z*= scale; VEC3_VALIDATE(); return *this;}
    // Scalar division multiplies by the reciprocal, computed once.
    __host__ __device__ inline XVector3<T>& operator /=(T scale) {T s(1.0f/scale); x *= s; y *= s; z *= s; VEC3_VALIDATE(); return *this;}
    __host__ __device__ inline XVector3<T>& operator +=(const XVector3<T>& v) {x += v.x; y += v.y; z += v.z; VEC3_VALIDATE(); return *this;}
    __host__ __device__ inline XVector3<T>& operator -=(const XVector3<T>& v) {x -= v.x; y -= v.y; z -= v.z; VEC3_VALIDATE(); return *this;}
    __host__ __device__ inline XVector3<T>& operator /=(const XVector3<T>& v) {x /= v.x; y /= v.y; z /= v.z; VEC3_VALIDATE(); return *this; }
    __host__ __device__ inline XVector3<T>& operator *=(const XVector3<T>& v) {x *= v.x; y *= v.y; z *= v.z; VEC3_VALIDATE(); return *this; }

    // True when at least one component differs.
    __host__ __device__ inline bool operator != (const XVector3<T>& v) const { return (x != v.x || y != v.y || z != v.z); }

    // negate
    __host__ __device__ inline XVector3<T> operator -() const { VEC3_VALIDATE(); return XVector3<T>(-x, -y, -z); }

    // Runs VEC3_VALIDATE() on the current components.
    __host__ __device__ void Validate()
    {
        VEC3_VALIDATE();
    }

    T x,y,z;
};

// Single-precision aliases; both names refer to the same XVector3<float> type.
typedef XVector3<float> Vec3;
typedef XVector3<float> Vector3;

// Scalar-on-the-left product: yields a copy of rhs scaled by lhs.
// Delegates to the member operator *(T), which copies the vector and applies *=.
template <typename T>
__host__ __device__ XVector3<T> operator *(T lhs, const XVector3<T>& rhs)
{
    return rhs * lhs;
}

// Component-wise equality: true only when x, y and z all compare equal.
// Components are tested in x, y, z order and the first mismatch ends the comparison.
template <typename T>
__host__ __device__ bool operator==(const XVector3<T>& lhs, const XVector3<T>& rhs)
{
    if (!(lhs.x == rhs.x))
    {
        return false;
    }
    if (!(lhs.y == rhs.y))
    {
        return false;
    }
    return lhs.z == rhs.z;
}

最佳答案

你的问题很难看懂。下次请写出更完整的错误消息，并说明你想要做什么!

不过我的猜测是，您遇到了以下问题:assert 语句有运行开销，因此通常只在 Debug 模式下才会编译进代码。在 Release 模式下（定义了 NDEBUG 时），assert 宏会展开为空，括号内的表达式根本不会被求值。

但是，在您的代码中，您在 assert 内使用了 malloc。因此，在调试版本中，您可以获得所需的内存，而在发布版本中，您什么也得不到，并且程序崩溃。该行是:

assert(!((hCellList = (CellBot *)malloc(CellSize)) == NULL));

你应该做的是:

hCellList = (CellBot *)malloc(CellSize);
assert(!(hCellList == NULL));

关于c++ - 在 Debug模式下，所有程序运行良好，但在 Release模式下，我的 cudaMalloc 操作出现错误，我们在Stack Overflow上找到一个类似的问题： https://stackoverflow.com/questions/51560592/

文章推荐： c - uint16_t 与 printf 的值差异

文章推荐： c - 为什么C跳到下一个printf而不是等待scanf？

文章推荐： javascript - 限制在 Node.js 中的循环中产生的并发子进程数

文章推荐： c# - DllImport 用于一组导入函数

c# - Debug.Assert/Debug.Fail 是否自动条件编译#if "DEBUG"
Debug.Assert/Debug.Fail 是否自动条件编译#if "DEBUG"？或者它是否更像是没有附加调试器(即使在发行版中)它什么也做不了？如果是这样，将它们留在您的代码中是否会对性能产生
debugging - react 导航 : how to debug
我有一个应用程序，我配置了多个路由，一切正常，直到我配置的最新路由不起作用(显示错误的屏幕)。我的问题是如何进行调试？没有打印错误日志，我无法找到如何获取有关正在发生的事情的更多日志。我也不知道从哪
debugging - Intellij Debugging 获取旧版本项目文件
我正在 Intellij 中调试代码。我使用 maven 来构建项目，并且在本地 .m2 存储库中有该项目的各种版本。当我开始调试时，Intellij 继续从项目的前一个快照中选择旧版本的代码。如何让
debugging - TCL开发: debug environment
我喜欢在业余时间进行一些 TiVo 黑客事件 - TiVo 使用 Linux 变体和 TCL 。我想在我的 Windows 笔记本电脑上编写 TCL 脚本，测试它们，然后将它们通过 FTP 传输到我的
debugging - DOS DEBUG 跟踪命令无法按我的预期工作
我有 ASM 代码，它使用循环语法打印 abc 。这是我的代码 ;abc.com .model small .code org 100h start: mov ah, 02h mov
c# - 条件 ("Debug") + #if DEBUG
我在 Debugging .net 2.0 Applications 中看到了以下代码 [Conditional("DEBUG")] void AssertTableExists() { #i
c# - #if DEBUG 与条件 ("DEBUG")
在大型项目中哪个更好用，为什么: #if DEBUG public void SetPrivateValue(int value) { ... } #endif 或 [System.D
debugging - 戈格兰 : debugging is grayed out
我似乎无法让调试器运行。调试运行图标变灰，菜单选项丢失。这只是main的情况，我可以很好地调试单元测试。类似的问题提到了项目结构，但我看不出有什么不对: $GOPATH/src/foo.bar.c
debugging - 浏览器链接总是要求 "Do you want to stop debugging"
只是想知道我的浏览器一直询问我是否想在每次点击浏览器链接刷新时停止调试非常烦人，因为这会减慢开发时间。有没有其他人遇到过这个？干杯最佳答案更新的答案，现在找到根本原因经过两年看到这个错误时断
debugging - Cmake 忽略 CMAKE_BUILD_TYPE=Debug
我正在尝试包含调试/发布相关编译器标志，例如: set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -std=gnu++0x -Wall -DUSE_BOOST") set
debugging - debug.phonegap.com 无法识别远程设备
当我尝试使用 debug.phonegap.com 调试我的phonegap 应用程序时遇到问题。我把这个视频放在 HTML 文档的头部在启动应用程序之前，我从 build.phonegap.
debugging - 我可以在核心转储文件中使用 "Reverse Debugging"吗？
GDB 7.0以后，支持反向调试。生成核心转储时，我可以使用反向调试命令吗？我怎样才能做到这一点？最佳答案你不能。核心文件是某个时间点程序状态的快照。要在该状态下向后移动，您需要程序状态的较早
C 调试，#if DEBUG 与 if (DEBUG)
首先:如果之前有人问过这个问题，我很抱歉。我是一个熟练的谷歌用户，但这确实让我难住了，我找不到任何东西。我目前正在编写一个小型库，我想对其进行调试。我还希望能够完全关闭调试，并且编译后的代码不应包含
debugging - 如何在 Tomcat 中将日志级别设置为 DEBUG？
我想在 tomcat 中将级别日志记录设置为 DEBUG，但在控制台中仍然只有 INFO 和 WARN 输出。谁能告诉我哪里出了问题？我的 C:\tomcat\logging.properties:
c# - Defines.Debug 与 #if DEBUG
我已经开始像这样使用定义类了: internal sealed class Defines { /// /// This constant is set to true iff th
ios - #ifdef DEBUG 与 #if DEBUG
在使用编译器指令时，我不清楚以下两个代码片段中哪一个是正确/首选的，以及为什么。似乎我见过的大多数开发人员和开源项目都使用第一种，但我也看到第二种也经常使用。 #ifdef DEBUG [self d
android - 在 [src/nullnull/debug, src/debug/nullnull, src/nullnull, src/debug, src/nullnullDebug] 中找不到 google-services.json
我遇到错误，无法完成构建。我搜索了 Stackoverflow 和 Github。我已经尝试了很多方法，但我无法修复。请帮忙。 (1) 在 [src/nullnull/debug, src/debug
debugging - 使用 TFS 进行部署使 DEBUG 指令保持打开状态
我刚刚意识到，使用 TFS 部署时，DEBUG 处理器指令仍然有效，有没有办法更改 TFS/Azure 网站或构建定义中的设置，而不是在本地解决方案配置？我仍然希望本地解决方案保持调试状态，只有部署
debugging - 花括号 : debug assertion faild 上的崩溃
我有一段代码在 VS2008，C++ 中以 Debug模式运行。问题是，当我逐行调试代码时，在代码的一个非常奇怪的地方，它崩溃并说: debug assertion faild. Expressio
debugging - Xamarin.Forms - Debug.WriteLine() - 输出去哪里？
我有一个简单的 Xamarin.Forms 项目，我在 Visual Studio 中运行，使用 iphone 模拟器。我在 App.cs 中有以下代码: protected override voi

行者123

个人简介

我是一名优秀的程序员,十分优秀！

作者热门文章

滴滴打车优惠券免费领取

全站热门文章

首页

博学

6Ren·AI

商城

c++ - 在 Debug模式下，所有程序运行良好，但在 Release模式下，我的 cudaMalloc 操作出现错误