metal : fix batch size for MUL_MAT_ID

This commit is contained in:
Georgi Gerganov 2025-09-08 21:01:25 +03:00
parent c5637cf39c
commit bdff7729b1
No known key found for this signature in database
GPG Key ID: 449E073F9DC10735
1 changed file with 2 additions and 1 deletion

View File

@@ -6743,8 +6743,9 @@ static bool ggml_backend_metal_device_supports_buft(ggml_backend_dev_t dev, ggml
 static int64_t get_op_batch_size(const struct ggml_tensor * op) {
     switch (op->op) {
         case GGML_OP_MUL_MAT:
-        case GGML_OP_MUL_MAT_ID:
             return op->ne[1];
+        case GGML_OP_MUL_MAT_ID:
+            return op->ne[2];
         default:
             return ggml_nrows(op);
     }