diff --git a/.github/workflows/unit_tests.yml b/.github/workflows/unit_tests.yml index b1e8fb9d5..623c2eb7c 100644 --- a/.github/workflows/unit_tests.yml +++ b/.github/workflows/unit_tests.yml @@ -387,7 +387,7 @@ jobs: - name: Install wheel run: | - uv pip install colorlog git+https://github.com/ModelCloud/Tokenicer -U + uv pip install colorlog logbar git+https://github.com/ModelCloud/Tokenicer -U echo "===== install optimum bitblas parameterized uvicorn =====" uv pip install optimum bitblas==0.0.1.dev13 parameterized uvicorn -i http://${{ needs.check-vm.outputs.ip }}/simple/ --trusted-host ${{ needs.check-vm.outputs.ip }} --extra-index-url https://pypi.org/simple echo "===== install dist/whl =====" @@ -547,7 +547,7 @@ jobs: - name: Install wheel run: | - uv pip install -U transformers colorlog + uv pip install -U transformers colorlog logbar if [ "${{ matrix.test_script }}" == "test_perplexity" ] || \ [ "${{ matrix.test_script }}" == "test_q4_bitblas" ] || \ [ "${{ matrix.test_script }}" == "test_save_loaded_quantized_model" ]; then diff --git a/tests/inference_speed.py b/tests/inference_speed.py index a2f8816e6..1e6d5102c 100644 --- a/tests/inference_speed.py +++ b/tests/inference_speed.py @@ -95,7 +95,7 @@ def inference(self, model_path, backend, tokens_per_second, assert_result=True, print(f"New Token Per Second: {avg_tokens_per_second} token/s") print(f"**************** {backend} Warm-up Result Info End****************") - pb = ProgressBar(range(self.NUM_RUNS)).title("Run") + pb = logger.pb(range(self.NUM_RUNS)).title("Run") for _ in pb: start_time = time.time() result = model.generate(**inp, max_new_tokens=self.MAX_NEW_TOKENS, pad_token_id=tokenizer.pad_token_id)