Spaces:
Running
Running
ggml : designate enum vals for integer types (llama/6050)
Browse files
ggml.h
CHANGED
|
@@ -337,24 +337,24 @@ extern "C" {
|
|
| 337 |
struct ggml_object;
|
| 338 |
struct ggml_context;
|
| 339 |
|
|
|
|
| 340 |
enum ggml_type {
|
| 341 |
-
GGML_TYPE_F32
|
| 342 |
-
GGML_TYPE_F16
|
| 343 |
-
GGML_TYPE_Q4_0
|
| 344 |
-
GGML_TYPE_Q4_1
|
| 345 |
// GGML_TYPE_Q4_2 = 4, support has been removed
|
| 346 |
-
// GGML_TYPE_Q4_3
|
| 347 |
-
GGML_TYPE_Q5_0
|
| 348 |
-
GGML_TYPE_Q5_1
|
| 349 |
-
GGML_TYPE_Q8_0
|
| 350 |
-
GGML_TYPE_Q8_1
|
| 351 |
-
|
| 352 |
-
|
| 353 |
-
|
| 354 |
-
|
| 355 |
-
|
| 356 |
-
|
| 357 |
-
GGML_TYPE_Q8_K = 15,
|
| 358 |
GGML_TYPE_IQ2_XXS = 16,
|
| 359 |
GGML_TYPE_IQ2_XS = 17,
|
| 360 |
GGML_TYPE_IQ3_XXS = 18,
|
|
@@ -363,9 +363,9 @@ extern "C" {
|
|
| 363 |
GGML_TYPE_IQ3_S = 21,
|
| 364 |
GGML_TYPE_IQ2_S = 22,
|
| 365 |
GGML_TYPE_IQ4_XS = 23,
|
| 366 |
-
GGML_TYPE_I8,
|
| 367 |
-
GGML_TYPE_I16,
|
| 368 |
-
GGML_TYPE_I32,
|
| 369 |
GGML_TYPE_COUNT,
|
| 370 |
};
|
| 371 |
|
|
@@ -383,20 +383,20 @@ extern "C" {
|
|
| 383 |
|
| 384 |
// model file types
|
| 385 |
enum ggml_ftype {
|
| 386 |
-
GGML_FTYPE_UNKNOWN
|
| 387 |
-
GGML_FTYPE_ALL_F32
|
| 388 |
-
GGML_FTYPE_MOSTLY_F16
|
| 389 |
-
GGML_FTYPE_MOSTLY_Q4_0
|
| 390 |
-
GGML_FTYPE_MOSTLY_Q4_1
|
| 391 |
GGML_FTYPE_MOSTLY_Q4_1_SOME_F16 = 4, // tok_embeddings.weight and output.weight are F16
|
| 392 |
-
GGML_FTYPE_MOSTLY_Q8_0
|
| 393 |
-
GGML_FTYPE_MOSTLY_Q5_0
|
| 394 |
-
GGML_FTYPE_MOSTLY_Q5_1
|
| 395 |
-
GGML_FTYPE_MOSTLY_Q2_K
|
| 396 |
-
GGML_FTYPE_MOSTLY_Q3_K
|
| 397 |
-
GGML_FTYPE_MOSTLY_Q4_K
|
| 398 |
-
GGML_FTYPE_MOSTLY_Q5_K
|
| 399 |
-
GGML_FTYPE_MOSTLY_Q6_K
|
| 400 |
GGML_FTYPE_MOSTLY_IQ2_XXS = 15, // except 1d tensors
|
| 401 |
GGML_FTYPE_MOSTLY_IQ2_XS = 16, // except 1d tensors
|
| 402 |
GGML_FTYPE_MOSTLY_IQ3_XXS = 17, // except 1d tensors
|
|
|
|
| 337 |
struct ggml_object;
|
| 338 |
struct ggml_context;
|
| 339 |
|
| 340 |
+
// NOTE: always add types at the end of the enum to keep backward compatibility
|
| 341 |
enum ggml_type {
|
| 342 |
+
GGML_TYPE_F32 = 0,
|
| 343 |
+
GGML_TYPE_F16 = 1,
|
| 344 |
+
GGML_TYPE_Q4_0 = 2,
|
| 345 |
+
GGML_TYPE_Q4_1 = 3,
|
| 346 |
// GGML_TYPE_Q4_2 = 4, support has been removed
|
| 347 |
+
// GGML_TYPE_Q4_3 = 5, support has been removed
|
| 348 |
+
GGML_TYPE_Q5_0 = 6,
|
| 349 |
+
GGML_TYPE_Q5_1 = 7,
|
| 350 |
+
GGML_TYPE_Q8_0 = 8,
|
| 351 |
+
GGML_TYPE_Q8_1 = 9,
|
| 352 |
+
GGML_TYPE_Q2_K = 10,
|
| 353 |
+
GGML_TYPE_Q3_K = 11,
|
| 354 |
+
GGML_TYPE_Q4_K = 12,
|
| 355 |
+
GGML_TYPE_Q5_K = 13,
|
| 356 |
+
GGML_TYPE_Q6_K = 14,
|
| 357 |
+
GGML_TYPE_Q8_K = 15,
|
|
|
|
| 358 |
GGML_TYPE_IQ2_XXS = 16,
|
| 359 |
GGML_TYPE_IQ2_XS = 17,
|
| 360 |
GGML_TYPE_IQ3_XXS = 18,
|
|
|
|
| 363 |
GGML_TYPE_IQ3_S = 21,
|
| 364 |
GGML_TYPE_IQ2_S = 22,
|
| 365 |
GGML_TYPE_IQ4_XS = 23,
|
| 366 |
+
GGML_TYPE_I8 = 24,
|
| 367 |
+
GGML_TYPE_I16 = 25,
|
| 368 |
+
GGML_TYPE_I32 = 26,
|
| 369 |
GGML_TYPE_COUNT,
|
| 370 |
};
|
| 371 |
|
|
|
|
| 383 |
|
| 384 |
// model file types
|
| 385 |
enum ggml_ftype {
|
| 386 |
+
GGML_FTYPE_UNKNOWN = -1,
|
| 387 |
+
GGML_FTYPE_ALL_F32 = 0,
|
| 388 |
+
GGML_FTYPE_MOSTLY_F16 = 1, // except 1d tensors
|
| 389 |
+
GGML_FTYPE_MOSTLY_Q4_0 = 2, // except 1d tensors
|
| 390 |
+
GGML_FTYPE_MOSTLY_Q4_1 = 3, // except 1d tensors
|
| 391 |
GGML_FTYPE_MOSTLY_Q4_1_SOME_F16 = 4, // tok_embeddings.weight and output.weight are F16
|
| 392 |
+
GGML_FTYPE_MOSTLY_Q8_0 = 7, // except 1d tensors
|
| 393 |
+
GGML_FTYPE_MOSTLY_Q5_0 = 8, // except 1d tensors
|
| 394 |
+
GGML_FTYPE_MOSTLY_Q5_1 = 9, // except 1d tensors
|
| 395 |
+
GGML_FTYPE_MOSTLY_Q2_K = 10, // except 1d tensors
|
| 396 |
+
GGML_FTYPE_MOSTLY_Q3_K = 11, // except 1d tensors
|
| 397 |
+
GGML_FTYPE_MOSTLY_Q4_K = 12, // except 1d tensors
|
| 398 |
+
GGML_FTYPE_MOSTLY_Q5_K = 13, // except 1d tensors
|
| 399 |
+
GGML_FTYPE_MOSTLY_Q6_K = 14, // except 1d tensors
|
| 400 |
GGML_FTYPE_MOSTLY_IQ2_XXS = 15, // except 1d tensors
|
| 401 |
GGML_FTYPE_MOSTLY_IQ2_XS = 16, // except 1d tensors
|
| 402 |
GGML_FTYPE_MOSTLY_IQ3_XXS = 17, // except 1d tensors
|