fix bug: call atomicAdd instead of atomicAddHalf in the #else branch of VecQuant4TransposeMatMulHalfKernel

2023-03-23 23:37:39 +08:00 · 2023-03-23 23:37:39 +08:00 · 4906961bf1
parent 94851cec68
commit 4906961bf1
1 changed file with 1 addition and 1 deletion
--- a/GPTQ-for-LLaMa/quant_cuda_kernel.cu
+++ b/GPTQ-for-LLaMa/quant_cuda_kernel.cu
@@ -631,7 +631,7 @@ __global__ void VecQuant4TransposeMatMulHalfKernel(
 #if __CUDA_ARCH__ < 700 && __CUDA_ARCH__ > 600
  atomicAddHalf(&mul2[n_cols * height * 8 + n_rows], res);
 #else
-  atomicAddHalf(&mul2[n_cols * height * 8 + n_rows], res);
+  atomicAdd(&mul2[n_cols * height * 8 + n_rows], res);
 #endif
 #endif
 }