CUDA: add mean operation (#14313)

* CUDA: add mean operation

* add back sum_rows_f32_cuda

* Review: early exit if col!=0
This commit is contained in:
Aman Gupta
2025-06-22 12:39:54 +08:00
committed by GitHub
parent aa0ef5c578
commit aa064b2eb7
7 changed files with 54 additions and 19 deletions

View File

@@ -1,5 +1,4 @@
#include "common.cuh"
// Host-callable declaration; the definition is not part of this header.
//   x      - read-only float input buffer
//   dst    - float output buffer
//   ncols  - column count of the input
//   nrows  - row count of the input
//   stream - CUDA stream handed to the implementation
// NOTE(review): judging by the name, this presumably writes one sum per row of an
// nrows x ncols matrix into dst, with work enqueued on `stream` - confirm against
// the definition, including whether x/dst must be device pointers and whether
// rows are expected to be contiguous.
void sum_rows_f32_cuda(const float * x, float * dst, const int ncols, const int nrows, cudaStream_t stream);
// Declaration of the sum-rows op entry point for the CUDA backend; the definition
// is not part of this header.
//   ctx - backend CUDA context, passed by non-const reference
//   dst - tensor passed by non-const pointer
// NOTE(review): presumably the input operand(s) are reached through `dst` and the
// result is written into it - verify against the definition.
void ggml_cuda_op_sum_rows(ggml_backend_cuda_context & ctx, ggml_tensor * dst);