aboutsummaryrefslogtreecommitdiff
path: root/ggml.h
diff options
context:
space:
mode:
author Georgi Gerganov <ggerganov@gmail.com> 2023-04-30 19:07:00 +0300
committer Georgi Gerganov <ggerganov@gmail.com> 2023-04-30 19:07:43 +0300
commit 6bc4400e67e6bc4faad3ad3d5e9d8a6576a9752d (patch)
tree 409352b146e6701cd9562d33df5fa7a206507d40 /ggml.h
parent f0d70f147d969e41fa410b8af2965a27aa901eb9 (diff)
ggml : add Q5 WASM SIMD + GGML_FTYPE
Diffstat (limited to 'ggml.h')
-rw-r--r-- ggml.h 17
1 files changed, 17 insertions, 0 deletions
diff --git a/ggml.h b/ggml.h
index c1c5495..d6feacd 100644
--- a/ggml.h
+++ b/ggml.h
@@ -232,6 +232,20 @@ extern "C" {
GGML_TYPE_COUNT,
};
+ // model file types: the overall tensor format of a model file (exceptions are noted per entry)
+ enum ggml_ftype {
+ GGML_FTYPE_UNKNOWN = -1, // the only negative value; presumably marks an unrecognized file type - TODO confirm
+ GGML_FTYPE_ALL_F32 = 0,
+ GGML_FTYPE_MOSTLY_F16 = 1, // except 1d tensors
+ GGML_FTYPE_MOSTLY_Q4_0 = 2, // except 1d tensors
+ GGML_FTYPE_MOSTLY_Q4_1 = 3, // except 1d tensors
+ GGML_FTYPE_MOSTLY_Q4_1_SOME_F16 = 4, // tok_embeddings.weight and output.weight are F16
+ GGML_FTYPE_MOSTLY_Q4_2 = 5, // except 1d tensors
+ GGML_FTYPE_MOSTLY_Q8_0 = 7, // except 1d tensors (NOTE: value 6 is not assigned to any entry in this enum)
+ GGML_FTYPE_MOSTLY_Q5_0 = 8, // except 1d tensors
+ GGML_FTYPE_MOSTLY_Q5_1 = 9, // except 1d tensors
+ };
+
// available tensor operations:
enum ggml_op {
GGML_OP_NONE = 0,
@@ -385,6 +399,9 @@ extern "C" {
GGML_API bool ggml_is_quantized(enum ggml_type type);
+ // takes a model file type and returns a tensor type; TODO: temporary until model loading of ggml examples is refactored
+ GGML_API enum ggml_type ggml_ftype_to_ggml_type(enum ggml_ftype ftype);
+
// main
GGML_API struct ggml_context * ggml_init(struct ggml_init_params params);