pytorch
diff --git a/‎.github/scripts/ci_test_xpu.sh‎
Lines changed: 1 addition & 1 deletion b/‎.github/scripts/ci_test_xpu.sh‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎.github/scripts/torchao_model_releases/eval_mm_quality.sh‎
Lines changed: 98 additions & 0 deletions b/‎.github/scripts/torchao_model_releases/eval_mm_quality.sh‎
Lines changed: 98 additions & 0 deletions
diff --git a/‎.github/workflows/1xH100_tests.yml‎
Lines changed: 1 addition & 1 deletion b/‎.github/workflows/1xH100_tests.yml‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎.github/workflows/1xL4_tests.yml‎
Lines changed: 1 addition & 1 deletion b/‎.github/workflows/1xL4_tests.yml‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎.github/workflows/4xH100_tests.yml‎
Lines changed: 1 addition & 1 deletion b/‎.github/workflows/4xH100_tests.yml‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎.github/workflows/build_wheels_linux.yml‎
Lines changed: 1 addition & 0 deletions b/‎.github/workflows/build_wheels_linux.yml‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎.github/workflows/dashboard_perf_test.yml‎
Lines changed: 1 addition & 1 deletion b/‎.github/workflows/dashboard_perf_test.yml‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎.github/workflows/doc_build.yml‎
Lines changed: 1 addition & 2 deletions b/‎.github/workflows/doc_build.yml‎
Lines changed: 1 addition & 2 deletions
diff --git a/‎.github/workflows/nightly_smoke_test.yml‎
Lines changed: 1 addition & 1 deletion b/‎.github/workflows/nightly_smoke_test.yml‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎.github/workflows/regression_test.yml‎
Lines changed: 2 additions & 2 deletions b/‎.github/workflows/regression_test.yml‎
Lines changed: 2 additions & 2 deletions
@@ -8,7 +8,7 @@ export CXX=/usr/bin/g++
 export SCCACHE_DISABLE=1
 
 python3 -m pip install torch torchvision torchaudio pytorch-triton-xpu --index-url https://download.pytorch.org/whl/nightly/xpu --force-reinstall --no-cache-dir 
-cd torchao && python3 setup.py install && cd ..
+cd torchao && python3 -m pip install . --no-build-isolation && cd ..  # python3 -m pip: build against the interpreter torch was installed into above
 
 python3 -c "import torch; import torchao; print(f'Torch version: {torch.__version__}')"
 
 
@@ -0,0 +1,98 @@
+#!/bin/bash
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the BSD 3-Clause license found in the
+# LICENSE file in the root directory of this source tree.
+
+# Runs lmms_eval per model/task; logs go to <model>_mm_quality_<task>.log in $PWD.
+set -e
+source eval_env_checks.sh
+check_lmms_eval
+
+# Print the command-line synopsis and exit with status 1.
+usage() {
+  echo "Usage: $0 --model_ids <model_id>... --model_type <model_type> [--tasks <task>... (space-separated, e.g. chartqa, default chartqa)] [--batch_size <n> (default 1)] [--use_cache]"
+  exit 1
+}
+
+MODEL_ID_ARRAY=()
+MODEL_TYPE=""
+TASK_ARRAY=("chartqa")  # default can be overwritten by user input
+BATCH_SIZE=1
+USE_CACHE=false      # default: do not use cache
+# Parse arguments; list options consume every word up to the next --option.
+while [[ $# -gt 0 ]]; do
+  case "$1" in
+    --model_ids)
+      shift
+      while [[ $# -gt 0 && ! "$1" =~ ^-- ]]; do
+        MODEL_ID_ARRAY+=("$1")
+        shift
+      done
+      ;;
+    --model_type)
+      [[ $# -ge 2 ]] || { echo "Error: --model_type requires a value"; usage; }
+      MODEL_TYPE="$2"
+      shift 2
+      ;;
+    --batch_size)
+      [[ $# -ge 2 ]] || { echo "Error: --batch_size requires a value"; usage; }
+      BATCH_SIZE="$2"
+      shift 2
+      ;;
+    --tasks)
+      shift
+      TASK_ARRAY=()
+      while [[ $# -gt 0 && ! "$1" =~ ^-- ]]; do
+        TASK_ARRAY+=("$1")
+        shift
+      done
+      ;;
+    --use_cache)
+      USE_CACHE=true
+      shift
+      ;;
+    *)
+      echo "Unknown argument: $1"
+      usage
+      ;;
+  esac
+done
+if [[ ${#MODEL_ID_ARRAY[@]} -eq 0 ]]; then
+  echo "Error: --model_ids is required"
+  usage
+fi
+if [[ -z "$MODEL_TYPE" ]]; then
+  echo "Error: --model_type is required"
+  usage
+fi
+RESULTS_DIR="$(pwd)/mm_quality_eval_results"
+MAIN_PORT=12356
+for MODEL_ID in "${MODEL_ID_ARRAY[@]}"; do
+    # Replace all '/' with '_'
+    SAFE_MODEL_ID="${MODEL_ID//\//_}"
+    echo "======================== Eval Multi-modal Model Quality $MODEL_ID ======================"
+    for TASK in "${TASK_ARRAY[@]}"; do
+        OUTPUT_FILE="$(pwd)/${SAFE_MODEL_ID}_mm_quality_${TASK}.log"
+        EVAL_CACHE_DB_PREFIX="/tmp/${SAFE_MODEL_ID}_mm_quality_${TASK}"
+        mkdir -p "${EVAL_CACHE_DB_PREFIX}"
+        echo "Running multi-modal model quality (accuracy) evaluation for model $MODEL_ID on task $TASK"
+
+        # Build argv as an array so every value is passed verbatim (no eval re-parsing).
+        LMMS_EVAL_CMD=(accelerate launch
+           --main_process_port "$MAIN_PORT"
+           -m lmms_eval
+           --model "$MODEL_TYPE"
+           --model_args "pretrained=$MODEL_ID"
+           --tasks "$TASK"
+           --batch_size "$BATCH_SIZE"
+           --output_path "$RESULTS_DIR")
+        if [[ "$USE_CACHE" == true ]]; then
+            LMMS_EVAL_CMD+=(--use_cache "$EVAL_CACHE_DB_PREFIX")
+        fi
+        "${LMMS_EVAL_CMD[@]}" > "$OUTPUT_FILE" 2>&1
+        echo "Quality eval output for task '$TASK' saved to $OUTPUT_FILE"
+    done
+    echo "======================== Eval Model Quality $MODEL_ID End =================="
+done
@@ -46,7 +46,7 @@ jobs:
         pip install uv
         pip install ${{ matrix.torch-spec }}
         uv pip install -r dev-requirements.txt
-        pip install .
+        pip install . --no-build-isolation
         pytest test/integration --verbose -s
         pytest test/dtypes/test_affine_quantized_float.py --verbose -s
         python test/quantization/quantize_/workflows/float8/test_float8_tensor.py
 
@@ -46,7 +46,7 @@ jobs:
         pip install uv
         pip install ${{ matrix.torch-spec }}
         uv pip install -r dev-requirements.txt
-        pip install .
+        pip install . --no-build-isolation
         pytest test/integration --verbose -s
         pytest test/dtypes/test_affine_quantized_float.py --verbose -s
         ./test/float8/test_everything_single_gpu.sh
 
@@ -44,6 +44,6 @@ jobs:
         pip install uv
         pip install ${{ matrix.torch-spec }}
         uv pip install -r dev-requirements.txt
-        pip install .
+        pip install . --no-build-isolation
         ./test/float8/test_everything_multi_gpu.sh
         ./test/prototype/mx_formats/test_mx_dtensor.sh
@@ -8,6 +8,7 @@ on:
       - packaging/**
       - .github/workflows/build_wheels_linux.yml
       - setup.py
+      - .github/scripts/**
   push:
     branches:
       - nightly
 
@@ -30,7 +30,7 @@ jobs:
           ${CONDA_RUN} python -m pip install --upgrade pip
           ${CONDA_RUN} pip install ${{ matrix.torch-spec }}
           ${CONDA_RUN} pip install -r dev-requirements.txt
-          ${CONDA_RUN} pip install .
+          ${CONDA_RUN} pip install . --no-build-isolation
           # SAM 2.1
           ${CONDA_RUN} pip install -r examples/sam2_amg_server/requirements.txt
 
 
@@ -43,8 +43,7 @@ jobs:
       - name: Install dependencies
         run: |
           python -m pip install torch
-          python -m pip install setuptools==78.1.1 --force-reinstall
-          python -m pip install -e .
+          python -m pip install -e . --no-build-isolation
           pip install -r dev-requirements.txt
           python -m pip install -r docs/requirements.txt
       - name: Build docs
 
@@ -38,5 +38,5 @@ jobs:
         python -m pip install --upgrade pip
         pip install ${{ matrix.torch-spec }}
         pip install -r dev-requirements.txt
-        python setup.py install
+        pip install . --no-build-isolation
         pytest test --verbose -s
@@ -50,7 +50,7 @@ jobs:
         python -m pip install --upgrade pip
         pip install ${{ matrix.torch-spec }}
         pip install -r dev-requirements.txt
-        pip install .
+        pip install . --no-build-isolation
         export CONDA=$(dirname $(dirname $(which conda)))
         export LD_LIBRARY_PATH=$CONDA/lib/:$LD_LIBRARY_PATH
         pytest test --verbose -s
@@ -114,7 +114,7 @@ jobs:
         pip install ${{ matrix.torch-spec }}
         sed -i '${{ matrix.dev-requirements-overrides }}' dev-requirements.txt
         pip install -r dev-requirements.txt
-        pip install .
+        pip install . --no-build-isolation
         export CONDA=$(dirname $(dirname $(which conda)))
         export LD_LIBRARY_PATH=$CONDA/lib/:$LD_LIBRARY_PATH
         pytest test --verbose -s