Skip to content

Commit 961e1ba

Browse files
slaren authored and tybalex committed
metal : unify mul_mv_id kernels (ggml-org#6556)
1 parent 6be901c commit 961e1ba

File tree

4 files changed

+141
-1055
lines changed

4 files changed

+141
-1055
lines changed

ggml-metal.m

+5
Original file line number | Diff line number | Diff line change
@@ -1926,7 +1926,12 @@ static enum ggml_status ggml_metal_graph_compute(
1926 1926
{
1927 1927
nth0 = 4;
1928 1928
nth1 = 16;
1929+
#if QK_K == 64
1930+
pipeline = ctx->kernels[GGML_METAL_KERNEL_TYPE_MUL_MV_ID_IQ4_NL_F32].pipeline;
1931+
#else
1929 1932
pipeline = ctx->kernels[GGML_METAL_KERNEL_TYPE_MUL_MV_ID_IQ4_XS_F32].pipeline;
1933+
#endif
1934+
1930 1935
} break;
1931 1936
default:
1932 1937
{

0 commit comments

Comments
 (0)