ggerganov committed on
Commit
8ea3a45
·
unverified ·
1 Parent(s): 9a07f42

sync : llama.cpp (ggml/0)

Browse files
Files changed (1) hide show
  1. examples/common-ggml.cpp +4 -0
examples/common-ggml.cpp CHANGED
@@ -64,10 +64,12 @@ bool ggml_common_quantize_0(
64
  case GGML_FTYPE_MOSTLY_Q4_1_SOME_F16:
65
  case GGML_FTYPE_MOSTLY_IQ2_XXS:
66
  case GGML_FTYPE_MOSTLY_IQ2_XS:
 
67
  case GGML_FTYPE_MOSTLY_IQ3_XXS:
68
  case GGML_FTYPE_MOSTLY_IQ3_S:
69
  case GGML_FTYPE_MOSTLY_IQ1_S:
70
  case GGML_FTYPE_MOSTLY_IQ4_NL:
 
71
  {
72
  fprintf(stderr, "%s: invalid model type %d\n", __func__, ftype);
73
  return false;
@@ -199,10 +201,12 @@ bool ggml_common_quantize_0(
199
  case GGML_TYPE_Q8_K:
200
  case GGML_TYPE_IQ2_XXS:
201
  case GGML_TYPE_IQ2_XS:
 
202
  case GGML_TYPE_IQ3_XXS:
203
  case GGML_TYPE_IQ3_S:
204
  case GGML_TYPE_IQ1_S:
205
  case GGML_TYPE_IQ4_NL:
 
206
  case GGML_TYPE_COUNT:
207
  {
208
  fprintf(stderr, "%s: unsupported quantization type %d (%s)\n", __func__, ttype, ggml_type_name((ggml_type) ttype));
 
64
  case GGML_FTYPE_MOSTLY_Q4_1_SOME_F16:
65
  case GGML_FTYPE_MOSTLY_IQ2_XXS:
66
  case GGML_FTYPE_MOSTLY_IQ2_XS:
67
+ case GGML_FTYPE_MOSTLY_IQ2_S:
68
  case GGML_FTYPE_MOSTLY_IQ3_XXS:
69
  case GGML_FTYPE_MOSTLY_IQ3_S:
70
  case GGML_FTYPE_MOSTLY_IQ1_S:
71
  case GGML_FTYPE_MOSTLY_IQ4_NL:
72
+ case GGML_FTYPE_MOSTLY_IQ4_XS:
73
  {
74
  fprintf(stderr, "%s: invalid model type %d\n", __func__, ftype);
75
  return false;
 
201
  case GGML_TYPE_Q8_K:
202
  case GGML_TYPE_IQ2_XXS:
203
  case GGML_TYPE_IQ2_XS:
204
+ case GGML_TYPE_IQ2_S:
205
  case GGML_TYPE_IQ3_XXS:
206
  case GGML_TYPE_IQ3_S:
207
  case GGML_TYPE_IQ1_S:
208
  case GGML_TYPE_IQ4_NL:
209
+ case GGML_TYPE_IQ4_XS:
210
  case GGML_TYPE_COUNT:
211
  {
212
  fprintf(stderr, "%s: unsupported quantization type %d (%s)\n", __func__, ttype, ggml_type_name((ggml_type) ttype));