Spaces:
Running
Running
sync : llama.cpp (ggml/0)
Browse files - examples/common-ggml.cpp +4 -0
examples/common-ggml.cpp
CHANGED
|
@@ -64,10 +64,12 @@ bool ggml_common_quantize_0(
|
|
| 64 |
case GGML_FTYPE_MOSTLY_Q4_1_SOME_F16:
|
| 65 |
case GGML_FTYPE_MOSTLY_IQ2_XXS:
|
| 66 |
case GGML_FTYPE_MOSTLY_IQ2_XS:
|
|
|
|
| 67 |
case GGML_FTYPE_MOSTLY_IQ3_XXS:
|
| 68 |
case GGML_FTYPE_MOSTLY_IQ3_S:
|
| 69 |
case GGML_FTYPE_MOSTLY_IQ1_S:
|
| 70 |
case GGML_FTYPE_MOSTLY_IQ4_NL:
|
|
|
|
| 71 |
{
|
| 72 |
fprintf(stderr, "%s: invalid model type %d\n", __func__, ftype);
|
| 73 |
return false;
|
|
@@ -199,10 +201,12 @@ bool ggml_common_quantize_0(
|
|
| 199 |
case GGML_TYPE_Q8_K:
|
| 200 |
case GGML_TYPE_IQ2_XXS:
|
| 201 |
case GGML_TYPE_IQ2_XS:
|
|
|
|
| 202 |
case GGML_TYPE_IQ3_XXS:
|
| 203 |
case GGML_TYPE_IQ3_S:
|
| 204 |
case GGML_TYPE_IQ1_S:
|
| 205 |
case GGML_TYPE_IQ4_NL:
|
|
|
|
| 206 |
case GGML_TYPE_COUNT:
|
| 207 |
{
|
| 208 |
fprintf(stderr, "%s: unsupported quantization type %d (%s)\n", __func__, ttype, ggml_type_name((ggml_type) ttype));
|
|
|
|
| 64 |
case GGML_FTYPE_MOSTLY_Q4_1_SOME_F16:
|
| 65 |
case GGML_FTYPE_MOSTLY_IQ2_XXS:
|
| 66 |
case GGML_FTYPE_MOSTLY_IQ2_XS:
|
| 67 |
+
case GGML_FTYPE_MOSTLY_IQ2_S:
|
| 68 |
case GGML_FTYPE_MOSTLY_IQ3_XXS:
|
| 69 |
case GGML_FTYPE_MOSTLY_IQ3_S:
|
| 70 |
case GGML_FTYPE_MOSTLY_IQ1_S:
|
| 71 |
case GGML_FTYPE_MOSTLY_IQ4_NL:
|
| 72 |
+
case GGML_FTYPE_MOSTLY_IQ4_XS:
|
| 73 |
{
|
| 74 |
fprintf(stderr, "%s: invalid model type %d\n", __func__, ftype);
|
| 75 |
return false;
|
|
|
|
| 201 |
case GGML_TYPE_Q8_K:
|
| 202 |
case GGML_TYPE_IQ2_XXS:
|
| 203 |
case GGML_TYPE_IQ2_XS:
|
| 204 |
+
case GGML_TYPE_IQ2_S:
|
| 205 |
case GGML_TYPE_IQ3_XXS:
|
| 206 |
case GGML_TYPE_IQ3_S:
|
| 207 |
case GGML_TYPE_IQ1_S:
|
| 208 |
case GGML_TYPE_IQ4_NL:
|
| 209 |
+
case GGML_TYPE_IQ4_XS:
|
| 210 |
case GGML_TYPE_COUNT:
|
| 211 |
{
|
| 212 |
fprintf(stderr, "%s: unsupported quantization type %d (%s)\n", __func__, ttype, ggml_type_name((ggml_type) ttype));
|