Question

我的问题是，我无法修改内核中的值。

这是不起作用的代码：

1st：内核：

__kernel void GetCellIndex(__global Particle* particles) {
    int globalID = get_global_id(0);
    particles[globalID].position.x = globalID;
};

2nd：内核中使用的结构：

typedef struct _Particle
{
    float3 position;
}Particle;

第3名：从CPU推送到GPU：

(Particle*) particles = (Particle*)malloc(sizeof(Particle)*200);
for (int i = 0; i < 200; i++)
{
    particles[i].position.x = 5f;
}

cl_mem cl_Particles = clCreateBuffer(context, CL_MEM_READ_WRITE |
    CL_MEM_COPY_HOST_PTR, sizeof(Particle)*maxParticle, &particles[0], NULL);



//init of kernel etc.



err = clSetKernelArg(kernel, 0, sizeof(cl_mem), (void *)&cl_Particles);
if (err != 0) {
    std::cout << "Error: setKernelArg 0 does not work!" << std::endl;
    system("Pause");
}

第四：运行内核：

size_t localItem = 1;
err = clEnqueueNDRangeKernel(queue, kernel, 1, 0, &(size_t)200+1, &localItem, 0, NULL, NULL);
if (err != 0) {
    std::cout << "Error: EnqueueNDRange does not work!" << std::endl;
}

err = clFlush(queue);
if (err != 0) {
    std::cout << "Error: Flush does not work: " << err << std::endl;
}

err = clFinish(queue);
if (err != 0) {
    std::cout << "Error: Finish does not work: " << err << std::endl;
}

第五：GPU上使用的结构：

typedef struct _Particle
{
    cl_float3 position;
}Particle;

6th：最后读取缓冲区：

clEnqueueReadBuffer(queue, cl_Particles, CL_TRUE, 0, 200 * sizeof(Particle), particles, 0, NULL, NULL);

执行此步骤后，我的内核不会影响clEnqueueReadBuffer中返回的值...

有谁知道为什么？这是什么问题

Answer 1

解决了问题：

将malloc行更改为

particles = new Particles[200];

还将数据分开写入缓冲区（使用clEnqueueWriteBuffer(...)）

其余应该像上面的代码一样工作

OpenCL - 无法修改值

1 个答案: