From 38eea116b85eab3d3a0d77be34d2d653b02389a0 Mon Sep 17 00:00:00 2001 From: saharNooby Date: Mon, 17 Apr 2023 18:53:48 +0400 Subject: [PATCH] Restore Q4_1_O support --- rwkv.cpp | 8 +++----- 1 file changed, 3 insertions(+), 5 deletions(-) diff --git a/rwkv.cpp b/rwkv.cpp index e194bc4..47fefed 100644 --- a/rwkv.cpp +++ b/rwkv.cpp @@ -48,8 +48,7 @@ static const ggml_type FORMAT_TYPE_TO_GGML_TYPE[5] = { GGML_TYPE_F16, GGML_TYPE_Q4_0, GGML_TYPE_Q4_1, - // TODO Restore - //GGML_TYPE_Q4_1_O + GGML_TYPE_Q4_1_O }; // --- Model definition and loading utilities --- @@ -756,11 +755,10 @@ bool rwkv_quantize_model_file(const char * model_file_path_in, const char * mode { cur_size = ggml_quantize_q4_1(data_f32.data(), work.data(), nelements, ne[0], hist_cur.data()); } break; - // TODO Restore - /*case GGML_TYPE_Q4_1_O: + case GGML_TYPE_Q4_1_O: { cur_size = ggml_quantize_q4_1_o(data_f32.data(), work.data(), nelements, ne[0], hist_cur.data()); - } break;*/ + } break; default: { fprintf(stderr, "unsupported quantization type %d\n", type);