You signed in with another tab or window. Reload to refresh your session.You signed out in another tab or window. Reload to refresh your session.You switched accounts on another tab or window. Reload to refresh your session.Dismiss alert
* ci : add lora test
ggml-ci
* move lora summary to the top, add lora logs
ggml-ci
* ci : decrease CPU ppl runs to 2 to avoide 20 min timeout
ggml-ci
* add 7b lora test
use 1 thread for CUDA generation tests
ggml-ci
* add test with q8_0 (cpu only)
ggml-ci
---------
Co-authored-by: Georgi Gerganov <[email protected]>
gg_printf '- shakespeare (q8_0 / f16 base lora):\n```\n%s\n```\n'"$(cat $OUT/${ci}-ppl-shakespeare-lora-q8_0-f16.log)"
256
304
}
257
305
258
306
# open_llama_7b_v2
@@ -310,17 +358,17 @@ function gg_run_open_llama_7b_v2 {
310
358
./bin/quantize ${model_f16}${model_q5_k} q5_k
311
359
./bin/quantize ${model_f16}${model_q6_k} q6_k
312
360
313
-
(time ./bin/main --model ${model_f16} -ngl 999 -s 1234 -n 256 --ignore-eos -p "I believe the meaning of life is" ) 2>&1| tee -a $OUT/${ci}-tg-f16.log
314
-
(time ./bin/main --model ${model_q8_0} -ngl 999 -s 1234 -n 256 --ignore-eos -p "I believe the meaning of life is" ) 2>&1| tee -a $OUT/${ci}-tg-q8_0.log
315
-
(time ./bin/main --model ${model_q4_0} -ngl 999 -s 1234 -n 256 --ignore-eos -p "I believe the meaning of life is" ) 2>&1| tee -a $OUT/${ci}-tg-q4_0.log
316
-
(time ./bin/main --model ${model_q4_1} -ngl 999 -s 1234 -n 256 --ignore-eos -p "I believe the meaning of life is" ) 2>&1| tee -a $OUT/${ci}-tg-q4_1.log
317
-
(time ./bin/main --model ${model_q5_0} -ngl 999 -s 1234 -n 256 --ignore-eos -p "I believe the meaning of life is" ) 2>&1| tee -a $OUT/${ci}-tg-q5_0.log
318
-
(time ./bin/main --model ${model_q5_1} -ngl 999 -s 1234 -n 256 --ignore-eos -p "I believe the meaning of life is" ) 2>&1| tee -a $OUT/${ci}-tg-q5_1.log
319
-
(time ./bin/main --model ${model_q2_k} -ngl 999 -s 1234 -n 256 --ignore-eos -p "I believe the meaning of life is" ) 2>&1| tee -a $OUT/${ci}-tg-q2_k.log
320
-
(time ./bin/main --model ${model_q3_k} -ngl 999 -s 1234 -n 256 --ignore-eos -p "I believe the meaning of life is" ) 2>&1| tee -a $OUT/${ci}-tg-q3_k.log
321
-
(time ./bin/main --model ${model_q4_k} -ngl 999 -s 1234 -n 256 --ignore-eos -p "I believe the meaning of life is" ) 2>&1| tee -a $OUT/${ci}-tg-q4_k.log
322
-
(time ./bin/main --model ${model_q5_k} -ngl 999 -s 1234 -n 256 --ignore-eos -p "I believe the meaning of life is" ) 2>&1| tee -a $OUT/${ci}-tg-q5_k.log
323
-
(time ./bin/main --model ${model_q6_k} -ngl 999 -s 1234 -n 256 --ignore-eos -p "I believe the meaning of life is" ) 2>&1| tee -a $OUT/${ci}-tg-q6_k.log
361
+
(time ./bin/main --model ${model_f16} -t 1 -ngl 999 -s 1234 -n 256 --ignore-eos -p "I believe the meaning of life is" ) 2>&1| tee -a $OUT/${ci}-tg-f16.log
362
+
(time ./bin/main --model ${model_q8_0} -t 1 -ngl 999 -s 1234 -n 256 --ignore-eos -p "I believe the meaning of life is" ) 2>&1| tee -a $OUT/${ci}-tg-q8_0.log
363
+
(time ./bin/main --model ${model_q4_0} -t 1 -ngl 999 -s 1234 -n 256 --ignore-eos -p "I believe the meaning of life is" ) 2>&1| tee -a $OUT/${ci}-tg-q4_0.log
364
+
(time ./bin/main --model ${model_q4_1} -t 1 -ngl 999 -s 1234 -n 256 --ignore-eos -p "I believe the meaning of life is" ) 2>&1| tee -a $OUT/${ci}-tg-q4_1.log
365
+
(time ./bin/main --model ${model_q5_0} -t 1 -ngl 999 -s 1234 -n 256 --ignore-eos -p "I believe the meaning of life is" ) 2>&1| tee -a $OUT/${ci}-tg-q5_0.log
366
+
(time ./bin/main --model ${model_q5_1} -t 1 -ngl 999 -s 1234 -n 256 --ignore-eos -p "I believe the meaning of life is" ) 2>&1| tee -a $OUT/${ci}-tg-q5_1.log
367
+
(time ./bin/main --model ${model_q2_k} -t 1 -ngl 999 -s 1234 -n 256 --ignore-eos -p "I believe the meaning of life is" ) 2>&1| tee -a $OUT/${ci}-tg-q2_k.log
368
+
(time ./bin/main --model ${model_q3_k} -t 1 -ngl 999 -s 1234 -n 256 --ignore-eos -p "I believe the meaning of life is" ) 2>&1| tee -a $OUT/${ci}-tg-q3_k.log
369
+
(time ./bin/main --model ${model_q4_k} -t 1 -ngl 999 -s 1234 -n 256 --ignore-eos -p "I believe the meaning of life is" ) 2>&1| tee -a $OUT/${ci}-tg-q4_k.log
370
+
(time ./bin/main --model ${model_q5_k} -t 1 -ngl 999 -s 1234 -n 256 --ignore-eos -p "I believe the meaning of life is" ) 2>&1| tee -a $OUT/${ci}-tg-q5_k.log
371
+
(time ./bin/main --model ${model_q6_k} -t 1 -ngl 999 -s 1234 -n 256 --ignore-eos -p "I believe the meaning of life is" ) 2>&1| tee -a $OUT/${ci}-tg-q6_k.log
0 commit comments