File tree: 2 files changed, +4 -1 lines changed
Original file line number | Diff line number | Diff line change
@@ -827,7 +827,9 @@ static const char *llama_ftype_name(enum llama_ftype ftype) {
827
827
case LLAMA_FTYPE_MOSTLY_F16: return " mostly F16" ;
828
828
case LLAMA_FTYPE_MOSTLY_Q4_0: return " mostly Q4_0" ;
829
829
case LLAMA_FTYPE_MOSTLY_Q4_1: return " mostly Q4_1" ;
830
- default : LLAMA_ASSERT (false );
830
+ case LLAMA_FTYPE_MOSTLY_Q4_1_SOME_F16:
831
+ return " mostly Q4_1, some F16" ;
832
+ default : return " unknown, may not work" ;
831
833
}
832
834
}
833
835
Original file line number | Diff line number | Diff line change
@@ -71,6 +71,7 @@ extern "C" {
71
71
LLAMA_FTYPE_MOSTLY_F16 = 1 , // except 1d tensors
72
72
LLAMA_FTYPE_MOSTLY_Q4_0 = 2 , // except 1d tensors
73
73
LLAMA_FTYPE_MOSTLY_Q4_1 = 3 , // except 1d tensors
74
+ LLAMA_FTYPE_MOSTLY_Q4_1_SOME_F16 = 4 , // tok_embeddings.weight and output.weight are F16
74
75
};
75
76
76
77
LLAMA_API struct llama_context_params llama_context_default_params ();
You can’t perform that action at this time.
0 commit comments