Skip to content

Commit ea92828

Browse files
committed
wip
1 parent 3a59971 commit ea92828

File tree

2 files changed

+1
-3
lines changed

2 files changed

+1
-3
lines changed

ggml/src/ggml-metal/ggml-metal-device.m

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -717,8 +717,7 @@ bool ggml_metal_device_supports_op(ggml_metal_device_t dev, const struct ggml_te
717 717   return true;
718 718   case GGML_OP_MUL_MAT:
719 719   case GGML_OP_MUL_MAT_ID:
720     - return has_simdgroup_reduction &&
721     - (op->src[0]->type != GGML_TYPE_F32 || op->src[1]->type == GGML_TYPE_F32);
    720 + return has_simdgroup_reduction;
722 721   case GGML_OP_CPY:
723 722   case GGML_OP_DUP:
724 723   case GGML_OP_CONT:

ggml/src/ggml-metal/ggml-metal-ops.cpp

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1480,7 +1480,6 @@ int ggml_metal_op_mul_mat(ggml_metal_op_t ctx, int idx) {
1480 1480   // for now the matrix-matrix multiplication kernel only works on A14+/M1+ SoCs
1481 1481   // AMD GPU and older A-chips will reuse matrix-vector multiplication kernel
1482 1482   props_dev->has_simdgroup_mm &&
1483      - op->src[1]->type == GGML_TYPE_F32 &&
1484 1483   ne00 % 32 == 0 && ne00 >= 64 &&
1485 1484   (ne11 > ne11_mm_min || (ggml_is_quantized(op->src[0]->type) && ne12 > 1))) {
1486 1485   //printf("matrix: ne00 = %6d, ne01 = %6d, ne02 = %6d, ne11 = %6d, ne12 = %6d\n", ne00, ne01, ne02, ne11, ne12);

0 commit comments

Comments
 (0)