We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent c37fb4c, commit 26a8406 (Copy full SHA for 26a8406)
ggml/src/ggml-cuda/mmv.cu
@@ -57,7 +57,7 @@ static __global__ void mul_mat_vec(
     if (block_size > WARP_SIZE) {
         buf_iw[tid/WARP_SIZE] = sumf;
         __syncthreads();
-        if (tid > WARP_SIZE) {
+        if (tid >= WARP_SIZE) {
             return;
         }
         sumf = buf_iw[tid];
0 commit comments