cuda : add softcap fusion (#14907)

2025-11-17 11:37:10 +00:00 · 2025-07-29 14:22:03 +02:00
parent bbd0f91779
commit 138b288b59
4 changed files with 118 additions and 6 deletions
--- a/ggml/src/ggml-cuda/softcap.cuh
+++ b/ggml/src/ggml-cuda/softcap.cuh
@@ -0,0 +1,5 @@
+#include "common.cuh"
+
+#define CUDA_SOFTCAP_BLOCK_SIZE 256 // NOTE(review): presumably threads per block for the softcap kernel launch; usage is not visible in this header - confirm
+
+void ggml_cuda_op_softcap(ggml_backend_cuda_context & ctx, ggml_tensor * dst, ggml_tensor * src); // declaration only; NOTE(review): presumably runs the fused softcap op reading src and writing dst - confirm against the definition