From c7ea4fd23536185ebe3f4760e456f379918e9ae0 Mon Sep 17 00:00:00 2001 From: Georgi Gerganov Date: Sat, 27 Jul 2024 17:17:04 +0300 Subject: [PATCH] common : handle new quant types (ggml/0) --- examples/common-ggml.cpp | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/examples/common-ggml.cpp b/examples/common-ggml.cpp index d8dbc88..a3f2c12 100644 --- a/examples/common-ggml.cpp +++ b/examples/common-ggml.cpp @@ -72,6 +72,9 @@ bool ggml_common_quantize_0( case GGML_FTYPE_MOSTLY_IQ4_XS: case GGML_FTYPE_MOSTLY_IQ1_M: case GGML_FTYPE_MOSTLY_BF16: + case GGML_FTYPE_MOSTLY_Q4_0_4_4: + case GGML_FTYPE_MOSTLY_Q4_0_4_8: + case GGML_FTYPE_MOSTLY_Q4_0_8_8: { fprintf(stderr, "%s: invalid model type %d\n", __func__, ftype); return false; @@ -209,6 +212,9 @@ bool ggml_common_quantize_0( case GGML_TYPE_IQ4_XS: case GGML_TYPE_IQ1_M: case GGML_TYPE_BF16: + case GGML_TYPE_Q4_0_4_4: + case GGML_TYPE_Q4_0_4_8: + case GGML_TYPE_Q4_0_8_8: case GGML_TYPE_COUNT: { fprintf(stderr, "%s: unsupported quantization type %d (%s)\n", __func__, ttype, ggml_type_name((ggml_type) ttype));