diff --git a/llmodel/gptj.cpp b/llmodel/gptj.cpp index 8e5145f4..837fd1f8 100644 --- a/llmodel/gptj.cpp +++ b/llmodel/gptj.cpp @@ -210,6 +210,7 @@ bool gptj_model_load(const std::string &fname, std::istream &fin, gptj_model & m case 1: wtype = GGML_TYPE_F16; break; case 2: wtype = GGML_TYPE_Q4_0; break; case 3: wtype = GGML_TYPE_Q4_1; break; + case 5: wtype = GGML_TYPE_Q4_2; break; default: { fprintf(stderr, "%s: invalid model file '%s' (bad f16 value %d)\n",