Compare commits

..

2 Commits

Author SHA1 Message Date
13c5446759 Update ggml-cuda/mmvq.cu
Co-authored-by: Johannes Gäßler <johannesg@5d6.de>
2024-06-11 17:37:32 +03:00
9df6298a91 cuda : fix bounds check for src0 rows in MMVQ kernel 2024-06-11 11:30:12 +03:00
2 changed files with 2 additions and 2 deletions

View File

@@ -459,7 +459,7 @@ jobs:
path: build/bin/${{ matrix.build }}
windows-cublas:
-runs-on: windows-2019
+runs-on: windows-latest
strategy:
matrix:

View File

@@ -75,7 +75,7 @@ static __global__ void mul_mat_vec_q(
tmp[j][i] = warp_reduce_sum(tmp[j][i]);
}
-if (threadIdx.x < rows_per_cuda_block) {
+if (threadIdx.x < rows_per_cuda_block && (rows_per_cuda_block == 1 || row0 + threadIdx.x < nrows_dst)) {
dst[j*nrows_dst + row0 + threadIdx.x] = tmp[j][threadIdx.x];
}
}