Mirror of https://github.com/ggerganov/whisper.cpp.git (synced 2025-06-15 05:18:07 +00:00)
cuda : fix device sync on buffer clear (llama/14033)
This commit is contained in:
Committed by: Georgi Gerganov
Parent: 26282282fa
Commit: e16a84cd95
@@ -615,9 +615,8 @@ static void ggml_backend_cuda_buffer_clear(ggml_backend_buffer_t buffer, uint8_t
     ggml_backend_cuda_buffer_context * ctx = (ggml_backend_cuda_buffer_context *)buffer->context;
 
     ggml_cuda_set_device(ctx->device);
-    CUDA_CHECK(cudaDeviceSynchronize());
-    CUDA_CHECK(cudaMemset(ctx->dev_ptr, value, buffer->size));
-    CUDA_CHECK(cudaDeviceSynchronize());
+    CUDA_CHECK(cudaMemsetAsync(ctx->dev_ptr, value, buffer->size, cudaStreamPerThread));
+    CUDA_CHECK(cudaStreamSynchronize(cudaStreamPerThread));
 }
 
 static const ggml_backend_buffer_i ggml_backend_cuda_buffer_interface = {
|
Reference in New Issue
Block a user