Increase CUDA copy block size (CUDA_CPY_BLOCK_SIZE) from 32 to 64 (ggml/996)

Co-authored-by: bssrdf <bssrdf@gmail.com>
2025-11-03 09:22:01 +00:00 · 2024-10-23 14:34:00 -04:00
parent 9e4a2563ea
commit 8c60a8a462
1 changed file with 1 addition and 1 deletion
--- a/ggml/src/ggml-cuda/cpy.cuh
+++ b/ggml/src/ggml-cuda/cpy.cuh
@@ -1,6 +1,6 @@
 #include "common.cuh"

-#define CUDA_CPY_BLOCK_SIZE 32
+#define CUDA_CPY_BLOCK_SIZE 64

 void ggml_cuda_cpy(ggml_backend_cuda_context & ctx, const ggml_tensor * src0, ggml_tensor * src1);