4747 - name: Ensure NVIDIA SDK available
4848 run: |
4949 sudo apt-get -y install cuda-toolkit
50- echo "/usr/local/cuda-12.5/bin" >> $GITHUB_PATH
50+ echo "/usr/local/cuda-12.6/bin" >> $GITHUB_PATH
5151 - name: Install dependencies
5252 run: |
5353 python -m pip install --upgrade pip
@@ -75,10 +75,10 @@ jobs:
7575 env:
7676 HF_TOKEN: ${{ secrets.HF_TOKEN }}
7777 # Configure endpoints for Azure OpenAI
78- AZUREAI_CHAT_ENDPOINT: ${{ secrets.AZUREAI_CHAT_ENDPOINT }}
79- AZUREAI_CHAT_MODEL: ${{ secrets.AZUREAI_CHAT_MODEL }}
80- AZUREAI_COMPLETION_ENDPOINT: ${{ secrets.AZUREAI_COMPLETION_ENDPOINT }}
81- AZUREAI_COMPLETION_MODEL: ${{ secrets.AZUREAI_COMPLETION_MODEL }}
78+ AZUREAI_CHAT_ENDPOINT: ${{ vars.AZUREAI_CHAT_ENDPOINT }}
79+ AZUREAI_CHAT_MODEL: ${{ vars.AZUREAI_CHAT_MODEL }}
80+ AZUREAI_COMPLETION_ENDPOINT: ${{ vars.AZUREAI_COMPLETION_ENDPOINT }}
81+ AZUREAI_COMPLETION_MODEL: ${{ vars.AZUREAI_COMPLETION_MODEL }}
8282 # Configure endpoints for Azure AI Studio
8383 AZURE_AI_STUDIO_PHI3_ENDPOINT: ${{ vars.AZURE_AI_STUDIO_PHI3_ENDPOINT }}
8484 AZURE_AI_STUDIO_PHI3_DEPLOYMENT: ${{ vars.AZURE_AI_STUDIO_PHI3_DEPLOYMENT }}
@@ -132,7 +132,7 @@ jobs:
132132 - name: Ensure NVIDIA SDK available
133133 run: |
134134 sudo apt-get -y install cuda-toolkit
135- echo "/usr/local/cuda-12.5/bin" >> $GITHUB_PATH
135+ echo "/usr/local/cuda-12.6/bin" >> $GITHUB_PATH
136136 - name: Install dependencies
137137 shell: bash
138138 run: |
@@ -150,6 +150,9 @@ jobs:
150150 run: |
151151 pip install accelerate
152152 pip uninstall -y llama-cpp-python
153+ echo "======================"
154+ nvcc --version
155+ echo "======================"
153156 CMAKE_ARGS="-DGGML_CUDA=on" pip install "llama-cpp-python!=0.2.58,!=0.2.75"
154157 - name: Check GPU available
155158 run: |
0 commit comments