metal : fix batch size for MUL_MAT_ID

This commit is contained in:
Georgi Gerganov
2025-09-08 21:01:25 +03:00
parent c5637cf39c
commit bdff7729b1

View File

@@ -6743,8 +6743,9 @@ static bool ggml_backend_metal_device_supports_buft(ggml_backend_dev_t dev, ggml
 static int64_t get_op_batch_size(const struct ggml_tensor * op) {
     switch (op->op) {
         case GGML_OP_MUL_MAT:
-        case GGML_OP_MUL_MAT_ID:
             return op->ne[1];
+        case GGML_OP_MUL_MAT_ID:
+            return op->ne[2];
         default:
             return ggml_nrows(op);
     }