File tree 4 files changed +10
-122
lines changed 4 files changed +10
-122
lines changed Original file line number Diff line number Diff line change @@ -41,7 +41,7 @@ echo PASS
41
41
echo
42
42
43
43
# 2b. Test the sharded model is loading properly
44
- $MAIN --model $WORK_PATH/ggml-model-split-00001-of-00006.gguf --n-predict 32
44
+ $MAIN -no-cnv --model $WORK_PATH/ggml-model-split-00001-of-00006.gguf --n-predict 32
45
45
echo PASS
46
46
echo
47
47
@@ -51,7 +51,7 @@ echo PASS
51
51
echo
52
52
53
53
# 3b. Test the merged model is loading properly
54
- $MAIN --model $WORK_PATH/ggml-model-merge.gguf --n-predict 32
54
+ $MAIN -no-cnv --model $WORK_PATH/ggml-model-merge.gguf --n-predict 32
55
55
echo PASS
56
56
echo
57
57
@@ -61,7 +61,7 @@ echo PASS
61
61
echo
62
62
63
63
# 4b. Test the sharded model is loading properly
64
- $MAIN --model $WORK_PATH/ggml-model-split-32-tensors-00001-of-00007.gguf --n-predict 32
64
+ $MAIN -no-cnv --model $WORK_PATH/ggml-model-split-32-tensors-00001-of-00007.gguf --n-predict 32
65
65
echo PASS
66
66
echo
67
67
71
71
# echo
72
72
73
73
# 5b. Test the merged model is loading properly
74
- # $MAIN --model $WORK_PATH/ggml-model-merge-2.gguf --n-predict 32
74
+ # $MAIN -no-cnv --model $WORK_PATH/ggml-model-merge-2.gguf --n-predict 32
75
75
# echo PASS
76
76
# echo
77
77
@@ -81,7 +81,7 @@ echo PASS
81
81
echo
82
82
83
83
# 6b. Test the sharded model is loading properly
84
- $MAIN --model $WORK_PATH/ggml-model-split-2G-00001-of-00002.gguf --n-predict 32
84
+ $MAIN -no-cnv --model $WORK_PATH/ggml-model-split-2G-00001-of-00002.gguf --n-predict 32
85
85
echo PASS
86
86
echo
87
87
Original file line number Diff line number Diff line change @@ -47,7 +47,7 @@ echo PASS
47
47
echo
48
48
49
49
# 3a. Test the requanted model is loading properly
50
- $MAIN --model $WORK_PATH/ggml-model-requant-00001-of-00006.gguf --n-predict 32
50
+ $MAIN -no-cnv --model $WORK_PATH/ggml-model-requant-00001-of-00006.gguf --n-predict 32
51
51
echo PASS
52
52
echo
53
53
@@ -57,7 +57,7 @@ echo PASS
57
57
echo
58
58
59
59
# 4b. Test the requanted model is loading properly
60
- $MAIN --model $WORK_PATH/ggml-model-requant-merge.gguf --n-predict 32
60
+ $MAIN -no-cnv --model $WORK_PATH/ggml-model-requant-merge.gguf --n-predict 32
61
61
echo PASS
62
62
echo
63
63
Load Diff This file was deleted.
Original file line number Diff line number Diff line change @@ -80,18 +80,18 @@ run_conversion_and_inference_lora() {
80
80
# Run inference
81
81
echo -e " \n\n---------------------------\n\n"
82
82
echo " Running llama-cli without lora for $model_name with hidden_size $hidden_size ..."
83
- OUTPUT_BASE=$(./llama-cli -m $MODELS_REPO/$model_name/hidden_size=$hidden_size/base/Base-F32.gguf \
83
+ OUTPUT_BASE=$(./llama-cli -no-cnv -m $MODELS_REPO/$model_name/hidden_size=$hidden_size/base/Base-F32.gguf \
84
84
-p "$EXPECTED_BASE_FIRST_WORD" -n 50 --seed 42 --temp 0)
85
85
86
86
echo -e " \n\n---------------------------\n\n"
87
87
echo " Running llama-cli with hot lora for $model_name with hidden_size $hidden_size ..."
88
- OUTPUT_LORA_HOT=$(./llama-cli -m $MODELS_REPO/$model_name/hidden_size=$hidden_size/base/Base-F32.gguf \
88
+ OUTPUT_LORA_HOT=$(./llama-cli -no-cnv -m $MODELS_REPO/$model_name/hidden_size=$hidden_size/base/Base-F32.gguf \
89
89
--lora $MODELS_REPO/$model_name/hidden_size=$hidden_size/lora/Lora-F32-LoRA.gguf \
90
90
-p "$EXPECTED_LORA_FIRST_WORD" -n 50 --seed 42 --temp 0)
91
91
92
92
echo -e " \n\n---------------------------\n\n"
93
93
echo " Running llama-cli with merged lora for $model_name with hidden_size $hidden_size ..."
94
- OUTPUT_LORA_MERGED=$(./llama-cli -m $MODELS_REPO/$model_name/hidden_size=$hidden_size/base/Base-F32-lora-merged.gguf \
94
+ OUTPUT_LORA_MERGED=$(./llama-cli -no-cnv -m $MODELS_REPO/$model_name/hidden_size=$hidden_size/base/Base-F32-lora-merged.gguf \
95
95
-p "$EXPECTED_LORA_FIRST_WORD" -n 50 --seed 42 --temp 0)
96
96
97
97
# Remove any initial white space
You can’t perform that action at this time.
0 commit comments