Skip to content

Commit a76a3bb

Browse files
committed
metal : try to unify mul_mv_id kernels
1 parent cc4a954 commit a76a3bb

File tree

2 files changed

+120
-975
lines changed

2 files changed

+120
-975
lines changed

ggml-metal.m

Lines changed: 5 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1926,7 +1926,12 @@ static enum ggml_status ggml_metal_graph_compute(
1926 1926
{
1927 1927
nth0 = 4;
1928 1928
nth1 = 16;
1929+
#if QK_K == 64
1930+
pipeline = ctx->kernels[GGML_METAL_KERNEL_TYPE_MUL_MV_ID_IQ4_NL_F32].pipeline;
1931+
#else
1929 1932
pipeline = ctx->kernels[GGML_METAL_KERNEL_TYPE_MUL_MV_ID_IQ4_XS_F32].pipeline;
1933+
#endif
1934+
1930 1935
} break;
1931 1936
default:
1932 1937
{

0 commit comments

Comments
 (0)