aboutsummaryrefslogtreecommitdiff
path: root/ggml.h
diff options
context:
space:
mode:
author Stephan Walter <stephan@walter.name> 2023-03-22 17:29:06 +0000
committer GitHub <noreply@github.com> 2023-03-22 19:29:06 +0200
commit 69c92298a9e36dc2363b3bf50452976ce49487b3 (patch)
tree 685e3fc7582eab3173a87d6efd94b3f92070839d /ggml.h
parent 97940520e8fd49c56bb29b71cc350190b723513f (diff)
Deduplicate q4 quantization functions (#383)
* Deduplicate q4 quantization functions
* Use const; add basic test
* Re-enable quantization test
* Disable AVX2 flags in CI
---------
Co-authored-by: Georgi Gerganov <ggerganov@gmail.com>
Diffstat (limited to 'ggml.h')
-rw-r--r-- ggml.h 4
1 files changed, 2 insertions, 2 deletions
diff --git a/ggml.h b/ggml.h
index 48b6cc0..c7e6814 100644
--- a/ggml.h
+++ b/ggml.h
@@ -745,8 +745,8 @@ enum ggml_opt_result ggml_opt(
// quantization
//
-size_t ggml_quantize_q4_0(float * src, void * dst, int n, int k, int qk, int64_t * hist);
-size_t ggml_quantize_q4_1(float * src, void * dst, int n, int k, int qk, int64_t * hist);
+size_t ggml_quantize_q4_0(const float * src, void * dst, int n, int k, int qk, int64_t * hist);
+size_t ggml_quantize_q4_1(const float * src, void * dst, int n, int k, int qk, int64_t * hist);
//
// system info