File tree Expand file tree Collapse file tree 1 file changed +3
-1
lines changed Expand file tree Collapse file tree 1 file changed +3
-1
lines changed Original file line number Diff line number Diff line change @@ -597,6 +597,9 @@ def build_model_from_args(args: argparse.Namespace):
597
597
"`num_shards` should be used together with "
598
598
"`--build-model-only` and `--convert-weight-only`"
599
599
)
600
+ use_ft_quant = args .quantization .name in ["q4f16_ft" , "q8f16_ft" ]
601
+ if use_ft_quant :
602
+ raise ValueError ("Multi-GPU deployments are not available for ft quantization." )
600
603
os .makedirs (args .artifact_path , exist_ok = True )
601
604
if args .debug_dump :
602
605
os .makedirs (os .path .join (args .artifact_path , "debug" ), exist_ok = True )
@@ -614,7 +617,6 @@ def build_model_from_args(args: argparse.Namespace):
614
617
config = json .load (i_f )
615
618
616
619
if not use_cache or args .convert_weight_only :
617
-
618
620
model_generators = {
619
621
"llama" : llama ,
620
622
"mistral" : llama ,
You can’t perform that action at this time.
0 commit comments