about | summary | refs | log | tree | commit | diff
path: root/k_quants.c
diff options
context:
space:
mode:
author: Kawrakow <48489457+ikawrakow@users.noreply.github.com> 2023-07-24 12:55:02 +0300
committer: GitHub <noreply@github.com> 2023-07-24 12:55:02 +0300
commit: 42f70cb2f6a8089e0a0560a459e4ba317bac4d49 (patch)
tree: f67f27da87ab35a88a09a8fb7456dd4873948a2e /k_quants.c
parent: 84e09a7d8bc4ab6d658b5cd81295ac0add60be78 (diff)
Fix scalar version of Q5_K when QK_K = 64 (#2362)
Co-authored-by: Iwan Kawrakow <iwan.kawrakow@gmail.com>
Diffstat (limited to 'k_quants.c')
-rw-r--r-- k_quants.c 5
1 files changed, 2 insertions, 3 deletions
diff --git a/k_quants.c b/k_quants.c
index c576fd7..e790abf 100644
--- a/k_quants.c
+++ b/k_quants.c
@@ -3297,8 +3297,7 @@ void ggml_vec_dot_q5_K_q8_K(const int n, float * restrict s, const void * restri
#else
-
- uint8_t aux8[QK_K];
+ int8_t aux8[QK_K];
int16_t aux16[16];
float sums [8];
memset(sums, 0, 8*sizeof(float));
@@ -3308,7 +3307,7 @@ void ggml_vec_dot_q5_K_q8_K(const int n, float * restrict s, const void * restri
const uint8_t * restrict q4 = x[i].qs;
const uint8_t * restrict hm = x[i].qh;
const int8_t * restrict q8 = y[i].qs;
- uint8_t * restrict a = aux8;
+ int8_t * restrict a = aux8;
for (int l = 0; l < 32; ++l) {
a[l+ 0] = q4[l] & 0xF;
a[l+32] = q4[l] >> 4;