Skip to content

Commit b562d16

Browse files
committed
add other quantization types
1 parent 14206fd commit b562d16

File tree

1 file changed: 45 additions and 1 deletion.

examples/cli/main.cpp

Lines changed: 45 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -336,14 +336,58 @@ void parse_args(int argc, const char** argv, SDParams& params) {
336336
params.wtype = SD_TYPE_Q5_1;
337337
} else if (type == "q8_0") {
338338
params.wtype = SD_TYPE_Q8_0;
339+
} else if (type == "q8_1") {
340+
params.wtype = SD_TYPE_Q8_1;
339341
} else if (type == "q2_k") {
340342
params.wtype = SD_TYPE_Q2_K;
341343
} else if (type == "q3_k") {
342344
params.wtype = SD_TYPE_Q3_K;
343345
} else if (type == "q4_k") {
344346
params.wtype = SD_TYPE_Q4_K;
347+
} else if (type == "q5_k") {
348+
params.wtype = SD_TYPE_Q5_K;
349+
} else if (type == "q6_k") {
350+
params.wtype = SD_TYPE_Q6_K;
351+
} else if (type == "q8_k") {
352+
params.wtype = SD_TYPE_Q8_K;
353+
} else if (type == "iq2_xxs") {
354+
params.wtype = SD_TYPE_IQ2_XXS;
355+
} else if (type == "iq2_xs") {
356+
params.wtype = SD_TYPE_IQ2_XS;
357+
} else if (type == "iq3_xxs") {
358+
params.wtype = SD_TYPE_IQ3_XXS;
359+
} else if (type == "iq1_s") {
360+
params.wtype = SD_TYPE_IQ1_S;
361+
} else if (type == "iq4_nl") {
362+
params.wtype = SD_TYPE_IQ4_NL;
363+
} else if (type == "iq3_s") {
364+
params.wtype = SD_TYPE_IQ3_S;
365+
} else if (type == "iq2_s") {
366+
params.wtype = SD_TYPE_IQ2_S;
367+
} else if (type == "iq4_xs") {
368+
params.wtype = SD_TYPE_IQ4_XS;
369+
} else if (type == "i8") {
370+
params.wtype = SD_TYPE_I8;
371+
} else if (type == "i16") {
372+
params.wtype = SD_TYPE_I16;
373+
} else if (type == "i32") {
374+
params.wtype = SD_TYPE_I32;
375+
} else if (type == "i64") {
376+
params.wtype = SD_TYPE_I64;
377+
} else if (type == "f64") {
378+
params.wtype = SD_TYPE_F64;
379+
} else if (type == "iq1_m") {
380+
params.wtype = SD_TYPE_IQ1_M;
381+
} else if (type == "bf16") {
382+
params.wtype = SD_TYPE_BF16;
383+
} else if (type == "q4_0_4_4") {
384+
params.wtype = SD_TYPE_Q4_0_4_4;
385+
} else if (type == "q4_0_4_8") {
386+
params.wtype = SD_TYPE_Q4_0_4_8;
387+
} else if (type == "q4_0_8_8") {
388+
params.wtype = SD_TYPE_Q4_0_8_8;
345389
} else {
346-
fprintf(stderr, "error: invalid weight format %s, must be one of [f32, f16, q4_0, q4_1, q5_0, q5_1, q8_0, q2_k, q3_k, q4_k]\n",
390+
fprintf(stderr, "error: invalid weight format %s, must be one of [f32, f16, q4_0, q4_1, q5_0, q5_1, q8_0, q8_1, q2_k, q3_k, q4_k, q5_k, q6_k, q8_k, iq2_xxs, iq2_xs, iq3_xxs, iq1_s, iq4_nl, iq3_s, iq2_s, iq4_xs, i8, i16, i32, i64, f64, iq1_m, bf16, q4_0_4_4, q4_0_4_8, q4_0_8_8]\n",
347391
type.c_str());
348392
exit(1);
349393
}

Comments (0): there are no comments on this commit.