Skip to content

Commit

Permalink
fix tabulate_fusion_se_a_fifth_order_polynomial for rocm
Browse files: browse the repository at this point in the history
Signed-off-by: Jinzhe Zeng <[email protected]>
  • Loading branch information
njzjz committed Sep 19, 2023
1 parent 245964c commit 15f5729
Showing 1 changed file with 10 additions and 4 deletions.
14 changes: 10 additions & 4 deletions source/lib/src/gpu/tabulate.cu
Original file line number Diff line number Diff line change
Expand Up @@ -748,10 +748,16 @@ void tabulate_fusion_se_a_gpu(FPTYPE* out,
 DPErrcheck(gpuGetLastError());
 DPErrcheck(gpuDeviceSynchronize());
 tabulate_fusion_se_a_fifth_order_polynomial<FPTYPE, MM, KK>
-<<<nloc, last_layer_size>>>(out, table, em_x, em, two_embed,
-table_info[0], table_info[1], table_info[2],
-table_info[3], table_info[4], nnei,
-last_layer_size, is_sorted);
+#if GOOGLE_CUDA
+<<<nloc, last_layer_size>>>
+#elif TENSORFLOW_USE_ROCM
+<<<nloc, last_layer_size, sizeof(FPTYPE) * MM * last_layer_size>>>
+#else
+#error "should not touch here"
+#endif
+(out, table, em_x, em, two_embed, table_info[0], table_info[1],
+table_info[2], table_info[3], table_info[4], nnei, last_layer_size,
+is_sorted);
 DPErrcheck(gpuGetLastError());
 DPErrcheck(gpuDeviceSynchronize());
 }
Expand Down

0 comments on commit 15f5729

Please sign in to comment.