increase cuda_cpy block size (ggml/996)

Co-authored-by: bssrdf <bssrdf@gmail.com>
This commit is contained in:
bssrdf 2024-10-23 14:34:00 -04:00 committed by Georgi Gerganov
parent a3231b2f2e
commit 10eb603a3c

View File

@@ -1,6 +1,6 @@
#include "common.cuh" #include "common.cuh"
#define CUDA_CPY_BLOCK_SIZE 32 #define CUDA_CPY_BLOCK_SIZE 64
void ggml_cuda_cpy(ggml_backend_cuda_context & ctx, const ggml_tensor * src0, ggml_tensor * src1); void ggml_cuda_cpy(ggml_backend_cuda_context & ctx, const ggml_tensor * src0, ggml_tensor * src1);