about | summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author Georgi Gerganov <ggerganov@gmail.com> 2023-03-24 23:39:17 +0200
committer Georgi Gerganov <ggerganov@gmail.com> 2023-03-24 23:39:17 +0200
commit b3f460e94139cb24b0af81cc8bc10eb86269d704 (patch)
tree 5a333c6c7512783be7915f4f53eb95f6a301265c
parent 04c6f5ed6fafd63601fa06757877ed5ccf9d5991 (diff)
Disable BLAS branch in mul_mat - seems there is a bug
-rw-r--r--  ggml.c  10
1 files changed, 5 insertions, 5 deletions
diff --git a/ggml.c b/ggml.c
index cfdf427..b428d70 100644
--- a/ggml.c
+++ b/ggml.c
@@ -5858,11 +5858,11 @@ static bool ggml_compute_forward_mul_mat_use_blas(
if (ggml_is_contiguous(src0) &&
ggml_is_contiguous(src1) && ((ne0 >= 32 && ne1 >= 32 && ne10 >= 32))) {
- //// disable BLAS for Q4_0 and Q4_1
- //// looks like there is no benefit and we only waste a lot of memory
- //if (src0->type == GGML_TYPE_Q4_0 || src0->type == GGML_TYPE_Q4_1) {
- // return false;
- //}
+ // disable BLAS for Q4_0 and Q4_1
+ // there is a bug that has to be fixed before enabling
+ if (src0->type == GGML_TYPE_Q4_0 || src0->type == GGML_TYPE_Q4_1) {
+ return false;
+ }
//printf("BLAS: %d %d %d %d %d\n", ne0, ne1, ne10, ne00, ne01);
return true;