diff --git a/math_test.cu b/math_test.cu index 8d50786..1be4e27 100644 --- a/math_test.cu +++ b/math_test.cu @@ -185,6 +185,8 @@ __global__ void gemm_kernel(int N, T_weight* A, T_data* B, T_data* C, int lda=M, else { gemm_kernel_inner(weights, n, B, C, ldc); } + + __syncthreads(); } }