about summary refs log tree commit diff
path: root/ggml.h
diff options
context:
space:
mode:
author Ivan Komarov <Ivan.Komarov@dfyz.info> 2023-04-17 15:10:57 +0200
committer GitHub <noreply@github.com> 2023-04-17 15:10:57 +0200
commit f266259ad9a2bce5a34d919592310147af23f3dc (patch)
tree 34744366054065b866d972834bc3787217099e1a /ggml.h
parent 47f61aaa5f76d04286792e2fbd0c95b659ab2af0 (diff)
Speedup the AVX-512 implementation of ggml_vec_dot_q4_0() (#933)
Diffstat (limited to 'ggml.h')
-rw-r--r-- ggml.h 2
1 files changed, 2 insertions, 0 deletions
diff --git a/ggml.h b/ggml.h
index 241e96a..e693754 100644
--- a/ggml.h
+++ b/ggml.h
@@ -808,6 +808,8 @@ size_t ggml_quantize_q4_1(const float * src, void * dst, int n, int k, int64_t *
int ggml_cpu_has_avx(void);
int ggml_cpu_has_avx2(void);
int ggml_cpu_has_avx512(void);
+int ggml_cpu_has_avx512_vbmi(void);
+int ggml_cpu_has_avx512_vnni(void);
int ggml_cpu_has_fma(void);
int ggml_cpu_has_neon(void);
int ggml_cpu_has_arm_fma(void);