More cleanup on periodic job (#299)

guangy10 · malfet · commit 7ebe4d18fc9d · 2024-07-17T09:55:42.000-07:00
diff --git a/.ci/scripts/validate.sh b/.ci/scripts/validate.sh
@@ -25,7 +25,7 @@ function generate_compiled_model_output() {
     local MODEL_DIR="${CHECKPOINT_PATH%/*}"
     local MODEL_NAME=$(basename "$CHECKPOINT_PATH" | sed 's/\.[^.]*$//')
 
-    for DTYPE in float32 bfloat16 float16; do
+    for DTYPE in bfloat16 float16 float32; do
         echo ""############### Run inference with torch.compile for dtype $DTYPE "###############"
         echo ""
         echo "******************************************"
@@ -98,7 +98,7 @@ function generate_aoti_model_output() {
     local MODEL_DIR="${CHECKPOINT_PATH%/*}"
     local MODEL_NAME=$(basename "$CHECKPOINT_PATH" | sed 's/\.[^.]*$//')
 
-    for DTYPE in float32 bfloat16 float16; do
+    for DTYPE in bfloat16 float16 float32; do
         echo ""############### Run inference with AOT Inductor  for dtype $DTYPE "###############"
         echo ""
         echo "******************************************"
diff --git a/.github/workflows/periodic.yml b/.github/workflows/periodic.yml
@@ -124,7 +124,7 @@ jobs:
         echo "::endgroup::"
 
         echo "::group::Install required packages"
-        pip install --pre torch  --index-url https://download.pytorch.org/whl/nightly/cu121
+        pip install --pre torch --index-url https://download.pytorch.org/whl/nightly/cu121
         pip install -r ./requirements.txt
         pip list
         echo "::endgroup::"
@@ -140,37 +140,5 @@ jobs:
 
         echo "::group::Run inference"
         bash .ci/scripts/validate.sh "./checkpoints/${REPO_NAME}/model.pth" "cuda" "compile"
-  test-gpu-aoti:
-    uses: pytorch/test-infra/.github/workflows/linux_job.yml@main
-    name: test-gpu-aoti (${{ matrix.platform }}, ${{ matrix.model_name }})
-    needs: gather-models-gpu
-    strategy:
-      matrix: ${{ fromJSON(needs.gather-models-gpu.outputs.models) }}
-      fail-fast: false
-    with:
-      runner: linux.g5.4xlarge.nvidia.gpu
-      gpu-arch-type: cuda
-      gpu-arch-version: "12.1"
-      script: |
-        echo "::group::Print machine info"
-        nvidia-smi
-        echo "::endgroup::"
-
-        echo "::group::Install required packages"
-        pip install --pre torch  --index-url https://download.pytorch.org/whl/nightly/cu121
-        pip install -r ./requirements.txt
-        pip list
-        echo "::endgroup::"
-
-        echo "::group::Download checkpoint"
-        export REPO_NAME=${{ matrix.repo_name }}
-        bash .ci/scripts/wget_checkpoint.sh ${REPO_NAME} ${{ matrix.resources }}
-        echo "::endgroup::"
-
-        echo "::group::Convert checkpoint"
-        bash .ci/scripts/convert_checkpoint.sh ${REPO_NAME}
-        echo "::endgroup::"
-
-        echo "::group::Run inference"
         bash .ci/scripts/validate.sh "./checkpoints/${REPO_NAME}/model.pth" "cuda" "aoti"
         echo "::endgroup::"