/**
 * Block-wide exclusive prefix sum over an array of boolean flags.
 *
 * Each flag is converted to 0/1, the values are scanned in a shared-memory
 * scratch buffer with an up-sweep (reduce) phase followed by a down-sweep
 * phase, and the exclusive sums are written to g_odata:
 * g_odata[i] = number of true flags in g_idata[0 .. i-1].
 *
 * This is a block-level collective: EVERY thread of the block must call it
 * with the same arguments, because it contains __syncthreads() barriers.
 *
 * Preconditions:
 *   - n is a power of two (the tree indexing below relies on it);
 *   - n <= Config::bfr*Config::bfr (capacity of the scratch buffer);
 *   - the block has at least n/2 threads (each thread owns two elements).
 *
 * @param g_idata  n input flags, readable by every thread of the block
 * @param g_odata  n output slots receiving the exclusive prefix sums
 * @param n        number of elements to scan
 */
__device__ void prefixSumJoin(const bool *g_idata, int *g_odata, int n)
{
    // Statically sized scratch buffer in shared memory (one per block).
    __shared__ int temp[Config::bfr*Config::bfr];

    const int thid = threadIdx.y*blockDim.x + threadIdx.x;
    const int lo = 2*thid;      // first element owned by this thread
    const int hi = 2*thid + 1;  // second element owned by this thread
    int offset = 1;

    // Make the caller's writes to g_idata visible to the whole block before
    // any thread reads flags that were produced by a different thread.
    __syncthreads();

    // Load input into shared memory. Threads beyond n/2 own no elements and
    // must not touch the buffers (they would index out of bounds).
    if (lo < n) { temp[lo] = (g_idata[lo] ? 1 : 0); }
    if (hi < n) { temp[hi] = (g_idata[hi] ? 1 : 0); }

    // Up-sweep: build partial sums in place up the tree.
    for (int d = n>>1; d > 0; d >>= 1)
    {
        // Each level reads cells written by other threads on the previous
        // level (or by the load above), so a barrier is required here.
        __syncthreads();
        if (thid < d)
        {
            int ai = offset*(2*thid+1)-1; // <-- breakpoint B
            int bi = offset*(2*thid+2)-1;
            temp[bi] += temp[ai];
        }
        offset *= 2;
    }

    // Clear the last element (the root of the tree) to start the exclusive
    // scan. Thread 0 was the last writer of that cell, so no barrier is
    // needed before this store.
    if (thid == 0 && n > 0) { temp[n - 1] = 0; }

    // Down-sweep: traverse down the tree and build the scan.
    for (int d = 1; d < n; d *= 2)
    {
        offset >>= 1;
        // Same cross-thread dependency as in the up-sweep.
        __syncthreads();
        if (thid < d)
        {
            int ai = offset*(2*thid+1)-1;
            int bi = offset*(2*thid+2)-1;
            int t = temp[ai];
            temp[ai] = temp[bi];
            temp[bi] += t;
        }
    }

    // The last down-sweep level must be complete before results are copied.
    __syncthreads();

    // Write results to the output buffer.
    if (lo < n) { g_odata[lo] = temp[lo]; }
    if (hi < n) { g_odata[hi] = temp[hi]; }

    // After this barrier every thread of the block may read any g_odata[i].
    __syncthreads();
}
/**
 * Marks, per thread, whether its record pair is selected, then runs a
 * block-wide prefix sum over those marks to obtain each selected record's
 * output offset.
 *
 * Launch layout: a 2D block of Config::bfr x Config::bfr threads, so that
 * tid indexes the Config::bfr*Config::bfr shared arrays one-to-one.
 * Elided parts of the original ("...") are kept as placeholders.
 */
__global__ void selectKernel3(...)
{
    int tidx = threadIdx.x;
    int tidy = threadIdx.y;
    int bidx = blockIdx.x;
    int bidy = blockIdx.y;
    int tid = tidy*blockDim.x + tidx;  // flat thread index within the block
    int bid = bidy*gridDim.x+bidx;     // flat block index within the grid
    int noOfRows1 = ...;
    int noOfRows2 = ...;

    // One flag and one offset slot per thread of the block.
    __shared__ bool isRecordSelected[Config::bfr*Config::bfr];
    __shared__ int selectedRecordsOffset[Config::bfr*Config::bfr];
    isRecordSelected[tid] = false;
    selectedRecordsOffset[tid] = 0;

    if(tidx<noOfRows1 && tidy<noOfRows2)
    {
        if(... == ...)
        {
            isRecordSelected[tid] = true;
        }
    }

    // The scan reads flags written by OTHER threads, so every thread's flag
    // must be stored before any thread starts scanning.
    __syncthreads();

    // Block-wide collective: called unconditionally by every thread.
    prefixSumJoin(isRecordSelected,selectedRecordsOffset,Config::bfr*Config::bfr); // <-- breakpoint A

    // Warps of one block advance independently between barriers; without
    // this one a warp could reach the code below while other warps are
    // still inside the scan and selectedRecordsOffset is incomplete.
    __syncthreads();

    some_instruction;// <-- breakpoint C
}
// Host-side launch configuration for selectKernel3.
// Grid: 13 x 5 blocks.
dim3 dimGrid(13, 5);
// Block: Config::bfr x Config::bfr threads, i.e. one thread per element of
// the Config::bfr*Config::bfr shared arrays declared inside the kernel.
dim3 dimBlock(Config::bfr, Config::bfr);
// NOTE(review): no error check is visible after the launch in this excerpt;
// confirm that cudaGetLastError() is inspected by the surrounding code.
selectKernel3<<<dimGrid, dimBlock>>>(...)
//other file
// Compile-time configuration referenced by both the host launch code and the
// device code in this excerpt.
// NOTE(review): only a fragment of the class is visible here; the body
// delimiters and access specifiers are not shown.
class Config
// bfr is used as both block dimensions and, squared, as the size of the
// shared-memory arrays and the scan length.
static const int bfr = 16; // blocking factor = number of rows per block
好的,现在我设置了3个断点:A、B、C。它们应该按 A、B、C 的顺序命中。问题是实际的命中顺序是:A,B × x 次,C,然后又是 B。因此在到达 C 时,selectedRecordsOffset 还没有准备好,从而导致错误。也就是说,B 被命中了若干次(但不是全部)之后,C 就被命中了,代码继续向后执行,然后才回到循环的剩余部分再次命中 B。x 随输入不同而不同(对于某些输入,断点的命中顺序没有发生任何颠倒,C 是最后一个被命中的)。
此外,如果查看触发断点的线程编号,命中 A 和 C 的是 threadIdx.y = 0 的线程,而命中 B 的是 threadIdx.y = 10 的线程。如果它们属于同一个块,为什么有些线程会忽略同步?代码中并没有把同步放在条件分支里。
如果需要更多说明,请提问。如果您对如何解决这个问题有任何建议,在此先行致谢。亚当