From 0629a79d032d1dbfbc25a6ef40e830e895ed2660 Mon Sep 17 00:00:00 2001 From: Justine Tunney Date: Thu, 23 May 2024 03:35:46 -0700 Subject: [PATCH] Disable new mixmul for text generation --- sgemm.cpp | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/sgemm.cpp b/sgemm.cpp index 3c768edc922108..df7419a5df66fb 100644 --- a/sgemm.cpp +++ b/sgemm.cpp @@ -1243,6 +1243,10 @@ class MixMul { assert(params->ith < params->nth); assert(plan->type == GGML_TYPE_I32); + // doesn't help for token generation + if (n < 2) + return false; + // supported types if (result->type != GGML_TYPE_F32) return false;