@@ -337,24 +337,24 @@ extern "C" {
337337 struct ggml_object ;
338338 struct ggml_context ;
339339
340+ // NOTE: always add types at the end of the enum to keep backward compatibility
340341 enum ggml_type {
341- GGML_TYPE_F32 = 0 ,
342- GGML_TYPE_F16 = 1 ,
343- GGML_TYPE_Q4_0 = 2 ,
344- GGML_TYPE_Q4_1 = 3 ,
342+ GGML_TYPE_F32 = 0 ,
343+ GGML_TYPE_F16 = 1 ,
344+ GGML_TYPE_Q4_0 = 2 ,
345+ GGML_TYPE_Q4_1 = 3 ,
345346 // GGML_TYPE_Q4_2 = 4, support has been removed
346- // GGML_TYPE_Q4_3 (5) support has been removed
347- GGML_TYPE_Q5_0 = 6 ,
348- GGML_TYPE_Q5_1 = 7 ,
349- GGML_TYPE_Q8_0 = 8 ,
350- GGML_TYPE_Q8_1 = 9 ,
351- // k-quantizations
352- GGML_TYPE_Q2_K = 10 ,
353- GGML_TYPE_Q3_K = 11 ,
354- GGML_TYPE_Q4_K = 12 ,
355- GGML_TYPE_Q5_K = 13 ,
356- GGML_TYPE_Q6_K = 14 ,
357- GGML_TYPE_Q8_K = 15 ,
347+ // GGML_TYPE_Q4_3 = 5, support has been removed
348+ GGML_TYPE_Q5_0 = 6 ,
349+ GGML_TYPE_Q5_1 = 7 ,
350+ GGML_TYPE_Q8_0 = 8 ,
351+ GGML_TYPE_Q8_1 = 9 ,
352+ GGML_TYPE_Q2_K = 10 ,
353+ GGML_TYPE_Q3_K = 11 ,
354+ GGML_TYPE_Q4_K = 12 ,
355+ GGML_TYPE_Q5_K = 13 ,
356+ GGML_TYPE_Q6_K = 14 ,
357+ GGML_TYPE_Q8_K = 15 ,
358358 GGML_TYPE_IQ2_XXS = 16 ,
359359 GGML_TYPE_IQ2_XS = 17 ,
360360 GGML_TYPE_IQ3_XXS = 18 ,
@@ -363,9 +363,9 @@ extern "C" {
363363 GGML_TYPE_IQ3_S = 21 ,
364364 GGML_TYPE_IQ2_S = 22 ,
365365 GGML_TYPE_IQ4_XS = 23 ,
366- GGML_TYPE_I8 ,
367- GGML_TYPE_I16 ,
368- GGML_TYPE_I32 ,
366+ GGML_TYPE_I8 = 24 ,
367+ GGML_TYPE_I16 = 25 ,
368+ GGML_TYPE_I32 = 26 ,
369369 GGML_TYPE_COUNT ,
370370 };
371371
@@ -383,20 +383,20 @@ extern "C" {
383383
384384 // model file types
385385 enum ggml_ftype {
386- GGML_FTYPE_UNKNOWN = -1 ,
387- GGML_FTYPE_ALL_F32 = 0 ,
388- GGML_FTYPE_MOSTLY_F16 = 1 , // except 1d tensors
389- GGML_FTYPE_MOSTLY_Q4_0 = 2 , // except 1d tensors
390- GGML_FTYPE_MOSTLY_Q4_1 = 3 , // except 1d tensors
386+ GGML_FTYPE_UNKNOWN = -1 ,
387+ GGML_FTYPE_ALL_F32 = 0 ,
388+ GGML_FTYPE_MOSTLY_F16 = 1 , // except 1d tensors
389+ GGML_FTYPE_MOSTLY_Q4_0 = 2 , // except 1d tensors
390+ GGML_FTYPE_MOSTLY_Q4_1 = 3 , // except 1d tensors
391391 GGML_FTYPE_MOSTLY_Q4_1_SOME_F16 = 4 , // tok_embeddings.weight and output.weight are F16
392- GGML_FTYPE_MOSTLY_Q8_0 = 7 , // except 1d tensors
393- GGML_FTYPE_MOSTLY_Q5_0 = 8 , // except 1d tensors
394- GGML_FTYPE_MOSTLY_Q5_1 = 9 , // except 1d tensors
395- GGML_FTYPE_MOSTLY_Q2_K = 10 , // except 1d tensors
396- GGML_FTYPE_MOSTLY_Q3_K = 11 , // except 1d tensors
397- GGML_FTYPE_MOSTLY_Q4_K = 12 , // except 1d tensors
398- GGML_FTYPE_MOSTLY_Q5_K = 13 , // except 1d tensors
399- GGML_FTYPE_MOSTLY_Q6_K = 14 , // except 1d tensors
392+ GGML_FTYPE_MOSTLY_Q8_0 = 7 , // except 1d tensors
393+ GGML_FTYPE_MOSTLY_Q5_0 = 8 , // except 1d tensors
394+ GGML_FTYPE_MOSTLY_Q5_1 = 9 , // except 1d tensors
395+ GGML_FTYPE_MOSTLY_Q2_K = 10 , // except 1d tensors
396+ GGML_FTYPE_MOSTLY_Q3_K = 11 , // except 1d tensors
397+ GGML_FTYPE_MOSTLY_Q4_K = 12 , // except 1d tensors
398+ GGML_FTYPE_MOSTLY_Q5_K = 13 , // except 1d tensors
399+ GGML_FTYPE_MOSTLY_Q6_K = 14 , // except 1d tensors
400400 GGML_FTYPE_MOSTLY_IQ2_XXS = 15 , // except 1d tensors
401401 GGML_FTYPE_MOSTLY_IQ2_XS = 16 , // except 1d tensors
402402 GGML_FTYPE_MOSTLY_IQ3_XXS = 17 , // except 1d tensors
0 commit comments