increase cuda_cpy block size (ggml/996)

Co-authored-by: bssrdf <bssrdf@gmail.com>
2025-01-11 19:21:46 +00:00 · 2024-10-23 14:34:00 -04:00 · 2024-10-23 14:34:00 -04:00 · 8c60a8a462
commit 8c60a8a462
parent 9e4a2563ea
1 changed file with 1 addition and 1 deletion
--- a/ggml/src/ggml-cuda/cpy.cuh
+++ b/ggml/src/ggml-cuda/cpy.cuh
@@ -1,6 +1,6 @@
 #include "common.cuh"

-#define CUDA_CPY_BLOCK_SIZE 32
+#define CUDA_CPY_BLOCK_SIZE 64

 void ggml_cuda_cpy(ggml_backend_cuda_context & ctx, const ggml_tensor * src0, ggml_tensor * src1);