cuda : add softcap fusion (#14907)

This commit is contained in:
Sigbjørn Skjæret
2025-07-29 14:22:03 +02:00
committed by GitHub
parent bbd0f91779
commit 138b288b59
4 changed files with 118 additions and 6 deletions

View File

@@ -0,0 +1,5 @@
#include "common.cuh"
// Block-size constant for the softcap CUDA op (value: 256).
// NOTE(review): presumably the number of threads per block used when launching
// the softcap kernel; the launch site is not visible in this header, so confirm
// against the implementation file.
#define CUDA_SOFTCAP_BLOCK_SIZE 256
// Host-side entry point for the CUDA softcap op. Only the declaration lives
// here; the definition is in another translation unit.
//
// Parameters:
//   ctx - CUDA backend context, passed by non-const reference.
//   dst - destination tensor.
//   src - source tensor.
//
// NOTE(review): the exact computation, the supported tensor types/layouts, and
// which stream of `ctx` is used are not visible from this header; confirm
// against the implementation before relying on any of them.
void ggml_cuda_op_softcap(ggml_backend_cuda_context & ctx, ggml_tensor * dst, ggml_tensor * src);