remove macos-12 test (#501)

mikekgfb · malfet · commit 3c66c45603e7 · 2024-07-17T09:55:44.000-07:00
diff --git a/.github/workflows/pull.yml b/.github/workflows/pull.yml
@@ -458,81 +458,6 @@ jobs:
           python torchchat.py generate stories15M
           python torchchat.py remove stories15m
 
-  test-tinystories-eager:
-    strategy:
-      matrix:
-        runner: [macos-12]
-    runs-on: ${{matrix.runner}}
-    steps:
-      - name: Checkout repo
-        uses: actions/checkout@v2
-      - name: Setup Python
-        uses: actions/setup-python@v2
-        with:
-          python-version: 3.11
-      - name: Print machine info
-        run: |
-          uname -a
-          if [ $(uname -s) == Darwin ]; then
-            sysctl machdep.cpu.brand_string
-            sysctl machdep.cpu.core_count
-          fi
-      - name: Install requirements
-        run: |
-          pip install --pre torch  --index-url https://download.pytorch.org/whl/nightly/cpu
-          pip install -r requirements.txt
-          python3 -c 'import torch;print(f"torch: {torch.__version__, torch.version.git_version}")'
-      - name: Download checkpoints
-        run: |
-          mkdir -p checkpoints/stories15M
-          pushd checkpoints/stories15M
-          wget https://huggingface.co/karpathy/tinyllamas/resolve/main/stories15M.pt
-          wget https://github.com/karpathy/llama2.c/raw/master/tokenizer.model
-          popd
-      - name: Run inference
-        run: |
-          export MODEL_PATH=checkpoints/stories15M/stories15M.pt
-          export MODEL_NAME=stories15M
-          export MODEL_DIR=/tmp
-          for DTYPE in bfloat16 float16 float32; do
-            # if [ $(uname -s) == Darwin ]; then
-            #   export DTYPE=float16
-            # fi
-            python3 torchchat.py generate --dtype ${DTYPE} --checkpoint-path ${MODEL_PATH} --temperature 0
-
-            echo "******************************************"
-            echo "******* Emb: channel-wise quantized ******"
-            echo "******************************************"
-            python3 torchchat.py generate --dtype ${DTYPE} --quant '{"embedding" : {"bitwidth": 8, "groupsize": 0}}' --checkpoint-path ${MODEL_PATH} --temperature 0
-
-            echo "******************************************"
-            echo "******** Emb: group-wise quantized *******"
-            echo "******************************************"
-            python3 torchchat.py generate --dtype ${DTYPE} --quant '{"embedding" : {"bitwidth": 8, "groupsize": 8}}' --checkpoint-path ${MODEL_PATH} --temperature 0
-
-            echo "******************************************"
-            echo "******* INT8 channel-wise quantized ******"
-            echo "******************************************"
-            python3 torchchat.py generate --dtype ${DTYPE} --quant '{"linear:int8" : {"bitwidth": 8, "groupsize": 0}}' --checkpoint-path ${MODEL_PATH} --temperature 0
-
-            echo "******************************************"
-            echo "******** INT8 group-wise quantized *******"
-            echo "******************************************"
-            python3 torchchat.py generate --dtype ${DTYPE} --quant '{"linear:int8" : {"bitwidth": 8, "groupsize": 8}}' --checkpoint-path ${MODEL_PATH} --temperature 0
-
-            echo "******************************************"
-            echo "******** INT4 group-wise quantized *******"
-            echo "******************************************"
-
-            echo "INT4 should work on MacOS on x86, but cannot be tested"
-            echo "because nightlies are too old!"
-
-            # python3 torchchat.py generate --dtype ${DTYPE} --quant '{"linear:int4" : {"groupsize": 32}}' --checkpoint-path ${MODEL_PATH} --temperature 0
-
-            echo "tests complete for ${DTYPE}"
-            done
-
-            echo "tests complete for all dtypes!"
   test-mps:
     uses: pytorch/test-infra/.github/workflows/macos_job.yml@main
     with:
diff --git a/parking_lot/macos-12-x86.yml b/parking_lot/macos-12-x86.yml
@@ -0,0 +1,80 @@
+  # Parked copy of the test-tinystories-eager job removed from
+  # .github/workflows/pull.yml. This file is a job fragment, not a complete
+  # workflow: to run it again, paste it back under jobs: in pull.yml.
+  test-tinystories-eager:
+    strategy:
+      matrix:
+        runner: [macos-12]
+    runs-on: ${{matrix.runner}}
+    steps:
+      - name: Checkout repo
+        uses: actions/checkout@v4
+      - name: Setup Python
+        uses: actions/setup-python@v5
+        with:
+          # Quoted so YAML keeps the version a string instead of a float.
+          python-version: '3.11'
+      - name: Print machine info
+        run: |
+          uname -a
+          if [ "$(uname -s)" = "Darwin" ]; then
+            sysctl machdep.cpu.brand_string
+            sysctl machdep.cpu.core_count
+          fi
+      - name: Install requirements
+        run: |
+          pip install --pre torch  --index-url https://download.pytorch.org/whl/nightly/cpu
+          pip install -r requirements.txt
+          python3 -c 'import torch;print(f"torch: {torch.__version__, torch.version.git_version}")'
+      - name: Download checkpoints
+        run: |
+          mkdir -p checkpoints/stories15M
+          pushd checkpoints/stories15M
+          wget https://huggingface.co/karpathy/tinyllamas/resolve/main/stories15M.pt
+          wget https://github.com/karpathy/llama2.c/raw/master/tokenizer.model
+          popd
+      - name: Run inference
+        run: |
+          export MODEL_PATH=checkpoints/stories15M/stories15M.pt
+          export MODEL_NAME=stories15M
+          export MODEL_DIR=/tmp
+          # Run the unquantized and quantized generation checks once per dtype.
+          for DTYPE in bfloat16 float16 float32; do
+            # if [ $(uname -s) == Darwin ]; then
+            #   export DTYPE=float16
+            # fi
+            python3 torchchat.py generate --dtype ${DTYPE} --checkpoint-path ${MODEL_PATH} --temperature 0
+
+            echo "******************************************"
+            echo "******* Emb: channel-wise quantized ******"
+            echo "******************************************"
+            python3 torchchat.py generate --dtype ${DTYPE} --quant '{"embedding" : {"bitwidth": 8, "groupsize": 0}}' --checkpoint-path ${MODEL_PATH} --temperature 0
+
+            echo "******************************************"
+            echo "******** Emb: group-wise quantized *******"
+            echo "******************************************"
+            python3 torchchat.py generate --dtype ${DTYPE} --quant '{"embedding" : {"bitwidth": 8, "groupsize": 8}}' --checkpoint-path ${MODEL_PATH} --temperature 0
+
+            echo "******************************************"
+            echo "******* INT8 channel-wise quantized ******"
+            echo "******************************************"
+            python3 torchchat.py generate --dtype ${DTYPE} --quant '{"linear:int8" : {"bitwidth": 8, "groupsize": 0}}' --checkpoint-path ${MODEL_PATH} --temperature 0
+
+            echo "******************************************"
+            echo "******** INT8 group-wise quantized *******"
+            echo "******************************************"
+            python3 torchchat.py generate --dtype ${DTYPE} --quant '{"linear:int8" : {"bitwidth": 8, "groupsize": 8}}' --checkpoint-path ${MODEL_PATH} --temperature 0
+
+            echo "******************************************"
+            echo "******** INT4 group-wise quantized *******"
+            echo "******************************************"
+
+            echo "INT4 should work on MacOS on x86, but cannot be tested"
+            echo "because nightlies are too old!"
+
+            # python3 torchchat.py generate --dtype ${DTYPE} --quant '{"linear:int4" : {"groupsize": 32}}' --checkpoint-path ${MODEL_PATH} --temperature 0
+
+            echo "tests complete for ${DTYPE}"
+          done
+
+          echo "tests complete for all dtypes!"