Skip to content

Commit 3a59596

Browse files
authored
Merge pull request #424 from denghuilu/master
Fix off-by-one loop bound in the max_nbor_size computation
2 parents 0da10cd + 520c308 commit 3a59596

File tree

2 files changed: 2 additions (+2) and 2 deletions (-2).

2 files changed

+2
-2
lines changed

source/op/descrpt_se_a_multi_device.cc

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -261,7 +261,7 @@ class DescrptSeAOp : public OpKernel {
261 | 261 |   cudaErrcheck(cudaMemcpy(jlist, jlist_host, sizeof(int) * mesh_host[3], cudaMemcpyHostToDevice));
262 | 262 |
263 | 263 |   max_nbor_size = 0;
264 |     | - for(int ii = 0; ii < mesh_host[2]; ii++) {
    | 264 | + for(int ii = 0; ii < mesh_host[2] - 1; ii++) {
265 | 265 |   max_nbor_size = (jrange_host[ii + 1] - jrange_host[ii]) > max_nbor_size ? (jrange_host[ii + 1] - jrange_host[ii]) : max_nbor_size;
266 | 266 |   }
267 | 267 |   assert(max_nbor_size <= GPU_MAX_NBOR_SIZE);

source/op/descrpt_se_r_multi_device.cc

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -250,7 +250,7 @@ class DescrptSeROp : public OpKernel {
250 | 250 |   cudaErrcheck(cudaMemcpy(jlist, jlist_host, sizeof(int) * mesh_host[3], cudaMemcpyHostToDevice));
251 | 251 |
252 | 252 |   max_nbor_size = 0;
253 |     | - for(int ii = 0; ii < mesh_host[2]; ii++) {
    | 253 | + for(int ii = 0; ii < mesh_host[2] - 1; ii++) {
254 | 254 |   max_nbor_size = (jrange_host[ii + 1] - jrange_host[ii]) > max_nbor_size ? (jrange_host[ii + 1] - jrange_host[ii]) : max_nbor_size;
255 | 255 |   }
256 | 256 |   assert(max_nbor_size <= GPU_MAX_NBOR_SIZE);

0 commit comments

Comments
 (0)