From 2e075bfaf65e13c4c81fe3d3f9f4c28e9f354cf4 Mon Sep 17 00:00:00 2001 From: JacobLinCool Date: Thu, 28 Mar 2024 00:30:06 +0800 Subject: [PATCH 1/2] spec: add missing semicolons in GGUF structs MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Co-Authored-By: 郝東彥 Arthur Hao <41247050s@gapps.ntnu.edu.tw> --- docs/gguf.md | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/docs/gguf.md b/docs/gguf.md index fa9abea74..41b61214b 100644 --- a/docs/gguf.md +++ b/docs/gguf.md @@ -85,7 +85,7 @@ enum gguf_metadata_value_type: uint32_t { GGUF_METADATA_VALUE_TYPE_INT64 = 11, // The value is a 64-bit IEEE754 floating point number. GGUF_METADATA_VALUE_TYPE_FLOAT64 = 12, -} +}; // A string in GGUF. struct gguf_string_t { @@ -93,7 +93,7 @@ struct gguf_string_t { uint64_t len; // The string as a UTF-8 non-null-terminated string. char string[len]; -} +}; union gguf_metadata_value_t { uint8_t uint8; From 45729b8dda9559d75e27edb396d395e9b4b1300b Mon Sep 17 00:00:00 2001 From: JacobLinCool Date: Thu, 28 Mar 2024 00:42:32 +0800 Subject: [PATCH 2/2] spec: update GGUF tensor types --- docs/gguf.md | 48 +++++++++++++++++++++++++++++------------------- 1 file changed, 29 insertions(+), 19 deletions(-) diff --git a/docs/gguf.md b/docs/gguf.md index 41b61214b..d6ad5e276 100644 --- a/docs/gguf.md +++ b/docs/gguf.md @@ -31,26 +31,36 @@ Models are little-endian by default. They can also come in big-endian for use wi ```c enum ggml_type: uint32_t { - GGML_TYPE_F32 = 0, - GGML_TYPE_F16 = 1, - GGML_TYPE_Q4_0 = 2, - GGML_TYPE_Q4_1 = 3, + GGML_TYPE_F32 = 0, + GGML_TYPE_F16 = 1, + GGML_TYPE_Q4_0 = 2, + GGML_TYPE_Q4_1 = 3, // GGML_TYPE_Q4_2 = 4, support has been removed - // GGML_TYPE_Q4_3 (5) support has been removed - GGML_TYPE_Q5_0 = 6, - GGML_TYPE_Q5_1 = 7, - GGML_TYPE_Q8_0 = 8, - GGML_TYPE_Q8_1 = 9, - // k-quantizations - GGML_TYPE_Q2_K = 10, - GGML_TYPE_Q3_K = 11, - GGML_TYPE_Q4_K = 12, - GGML_TYPE_Q5_K = 13, - GGML_TYPE_Q6_K = 14, - GGML_TYPE_Q8_K = 15, - GGML_TYPE_I8, - GGML_TYPE_I16, - GGML_TYPE_I32, + // GGML_TYPE_Q4_3 = 5, support has been removed + GGML_TYPE_Q5_0 = 6, + GGML_TYPE_Q5_1 = 7, + GGML_TYPE_Q8_0 = 8, + GGML_TYPE_Q8_1 = 9, + GGML_TYPE_Q2_K = 10, + GGML_TYPE_Q3_K = 11, + GGML_TYPE_Q4_K = 12, + GGML_TYPE_Q5_K = 13, + GGML_TYPE_Q6_K = 14, + GGML_TYPE_Q8_K = 15, + GGML_TYPE_IQ2_XXS = 16, + GGML_TYPE_IQ2_XS = 17, + GGML_TYPE_IQ3_XXS = 18, + GGML_TYPE_IQ1_S = 19, + GGML_TYPE_IQ4_NL = 20, + GGML_TYPE_IQ3_S = 21, + GGML_TYPE_IQ2_S = 22, + GGML_TYPE_IQ4_XS = 23, + GGML_TYPE_I8 = 24, + GGML_TYPE_I16 = 25, + GGML_TYPE_I32 = 26, + GGML_TYPE_I64 = 27, + GGML_TYPE_F64 = 28, + GGML_TYPE_IQ1_M = 29, GGML_TYPE_COUNT, };