Skip to content

Commit e7f3193

Browse files
authored
add syncthread (PaddlePaddle#53)
1 parent 7263442 commit e7f3193

File tree

1 file changed

+4 -1 lines changed

1 file changed

+4
-1
lines changed

paddle/fluid/framework/data_feed.cu

Lines changed: 4 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -206,6 +206,8 @@ __global__ void GraphFillFeatureKernel(uint64_t *id_tensor, int *fill_ins_num,
206206
}
207207
}
208208

209+
__syncthreads();
210+
209211
if (threadIdx.x == 0) {
210212
global_num = atomicAdd(fill_ins_num, local_num);
211213
}
@@ -245,6 +247,8 @@ __global__ void GraphFillIdKernel(uint64_t *id_tensor, int *fill_ins_num,
245247
}
246248
}
247249

250+
__syncthreads();
251+
248252
if (threadIdx.x == 0) {
249253
global_num = atomicAdd(fill_ins_num, local_num);
250254
}
@@ -340,7 +344,6 @@ int GraphDataGenerator::FillInsBuf() {
340344
int h_pair_num;
341345
cudaMemcpyAsync(&h_pair_num, d_pair_num, sizeof(int), cudaMemcpyDeviceToHost,
342346
stream_);
343-
344347
if (!FLAGS_enable_opt_get_features && slot_num_ > 0) {
345348
uint64_t *feature_buf = reinterpret_cast<uint64_t *>(d_feature_buf_->ptr());
346349
uint64_t *feature = reinterpret_cast<uint64_t *>(d_feature_->ptr());

0 commit comments

Comments
 (0)