mirror of
https://github.com/ggerganov/whisper.cpp.git
synced 2025-06-05 08:50:41 +00:00
cuda : fix bounds check for src0 rows in MMVQ kernel
This commit is contained in:
parent
20c542c713
commit
9df6298a91
@@ -75,7 +75,7 @@ static __global__ void mul_mat_vec_q(
|
|||||||
tmp[j][i] = warp_reduce_sum(tmp[j][i]);
|
tmp[j][i] = warp_reduce_sum(tmp[j][i]);
|
||||||
}
|
}
|
||||||
|
|
||||||
if (threadIdx.x < rows_per_cuda_block) {
|
if (threadIdx.x < rows_per_cuda_block && row0 + threadIdx.x < nrows_dst) {
|
||||||
dst[j*nrows_dst + row0 + threadIdx.x] = tmp[j][threadIdx.x];
|
dst[j*nrows_dst + row0 + threadIdx.x] = tmp[j][threadIdx.x];
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
Loading…
x
Reference in New Issue
Block a user