From 982c82f1e64c1de24c16c78f04b0a3fbea234cc2 Mon Sep 17 00:00:00 2001
From: Georgi Gerganov
Date: Tue, 25 Mar 2025 14:36:22 +0200
Subject: [PATCH] metal : fix comments [no ci]

---
 ggml/src/ggml-metal/ggml-metal-impl.h | 2 +-
 ggml/src/ggml-metal/ggml-metal.m | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/ggml/src/ggml-metal/ggml-metal-impl.h b/ggml/src/ggml-metal/ggml-metal-impl.h
index 8e8428d381..ca5a00b032 100644
--- a/ggml/src/ggml-metal/ggml-metal-impl.h
+++ b/ggml/src/ggml-metal/ggml-metal-impl.h
@@ -3,7 +3,7 @@
 // kernel parameters for mat-vec threadgroups
 //
-// N_R0: number of src0 rows to process per threadgroup
+// N_R0: number of src0 rows to process per simdgroup
 // N_SG: number of simdgroups per threadgroup
 //
 // TODO: for optimal performance, become function of the device and work size
diff --git a/ggml/src/ggml-metal/ggml-metal.m b/ggml/src/ggml-metal/ggml-metal.m
index 49b6314395..846f822ea1 100644
--- a/ggml/src/ggml-metal/ggml-metal.m
+++ b/ggml/src/ggml-metal/ggml-metal.m
@@ -2883,7 +2883,7 @@ static void ggml_metal_encode_node(
 id pipeline = nil;
 int nsg = 0; // number of simdgroups
-int nr0 = 0; // number of src0 rows per threadgroup
+int nr0 = 0; // number of src0 rows per simdgroup
 int nr1 = 1; // number of src1 rows per threadgroup
 size_t smem = 0; // shared memory