Skip to content

Commit

Permalink
Restore Q4_1_O support
Browse files (browse the repository at this point in the history)
  • Loading branch information
saharNooby committed Apr 17, 2023
1 parent 28e354c commit 38eea11
Showing 1 changed file with 3 additions and 5 deletions.
8 changes: 3 additions & 5 deletions rwkv.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -48,8 +48,7 @@ static const ggml_type FORMAT_TYPE_TO_GGML_TYPE[5] = {
GGML_TYPE_F16,
GGML_TYPE_Q4_0,
GGML_TYPE_Q4_1,
- // TODO Restore
- //GGML_TYPE_Q4_1_O
+ GGML_TYPE_Q4_1_O
};

// --- Model definition and loading utilities ---
Expand Down Expand Up @@ -756,11 +755,10 @@ bool rwkv_quantize_model_file(const char * model_file_path_in, const char * mode
{
cur_size = ggml_quantize_q4_1(data_f32.data(), work.data(), nelements, ne[0], hist_cur.data());
} break;
- // TODO Restore
- /*case GGML_TYPE_Q4_1_O:
+ case GGML_TYPE_Q4_1_O:
  {
  cur_size = ggml_quantize_q4_1_o(data_f32.data(), work.data(), nelements, ne[0], hist_cur.data());
- } break;*/
+ } break;
default:
{
fprintf(stderr, "unsupported quantization type %d\n", type);
Expand Down

0 comments on commit 38eea11

Please sign in to comment.