Skip to content

Commit 7ebe4d1

Browse files
guangy10 authored and malfet committed
More cleanup on period job (#299)
1 parent d42c5c5 commit 7ebe4d1

File tree

2 files changed

+3
-35
lines changed

2 files changed

+3
-35
lines changed

.ci/scripts/validate.sh

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -25,7 +25,7 @@ function generate_compiled_model_output() {
2525
local MODEL_DIR="${CHECKPOINT_PATH%/*}"
2626
local MODEL_NAME=$(basename "$CHECKPOINT_PATH" | sed 's/\.[^.]*$//')
2727

28-
for DTYPE in float32 bfloat16 float16; do
28+
for DTYPE in bfloat16 float16 float32; do
2929
echo ""############### Run inference with torch.compile for dtype $DTYPE "###############"
3030
echo ""
3131
echo "******************************************"
@@ -98,7 +98,7 @@ function generate_aoti_model_output() {
9898
local MODEL_DIR="${CHECKPOINT_PATH%/*}"
9999
local MODEL_NAME=$(basename "$CHECKPOINT_PATH" | sed 's/\.[^.]*$//')
100100

101-
for DTYPE in float32 bfloat16 float16; do
101+
for DTYPE in bfloat16 float16 float32; do
102102
echo ""############### Run inference with AOT Inductor for dtype $DTYPE "###############"
103103
echo ""
104104
echo "******************************************"

.github/workflows/periodic.yml

Lines changed: 1 addition & 33 deletions
Original file line number | Diff line number | Diff line change
@@ -124,7 +124,7 @@ jobs:
124124
echo "::endgroup::"
125125
126126
echo "::group::Install required packages"
127-
pip install --pre torch --index-url https://download.pytorch.org/whl/nightly/cu121
127+
pip install --pre torch --index-url https://download.pytorch.org/whl/nightly/cu121
128128
pip install -r ./requirements.txt
129129
pip list
130130
echo "::endgroup::"
@@ -140,37 +140,5 @@ jobs:
140140
141141
echo "::group::Run inference"
142142
bash .ci/scripts/validate.sh "./checkpoints/${REPO_NAME}/model.pth" "cuda" "compile"
143-
test-gpu-aoti:
144-
uses: pytorch/test-infra/.github/workflows/linux_job.yml@main
145-
name: test-gpu-aoti (${{ matrix.platform }}, ${{ matrix.model_name }})
146-
needs: gather-models-gpu
147-
strategy:
148-
matrix: ${{ fromJSON(needs.gather-models-gpu.outputs.models) }}
149-
fail-fast: false
150-
with:
151-
runner: linux.g5.4xlarge.nvidia.gpu
152-
gpu-arch-type: cuda
153-
gpu-arch-version: "12.1"
154-
script: |
155-
echo "::group::Print machine info"
156-
nvidia-smi
157-
echo "::endgroup::"
158-
159-
echo "::group::Install required packages"
160-
pip install --pre torch --index-url https://download.pytorch.org/whl/nightly/cu121
161-
pip install -r ./requirements.txt
162-
pip list
163-
echo "::endgroup::"
164-
165-
echo "::group::Download checkpoint"
166-
export REPO_NAME=${{ matrix.repo_name }}
167-
bash .ci/scripts/wget_checkpoint.sh ${REPO_NAME} ${{ matrix.resources }}
168-
echo "::endgroup::"
169-
170-
echo "::group::Convert checkpoint"
171-
bash .ci/scripts/convert_checkpoint.sh ${REPO_NAME}
172-
echo "::endgroup::"
173-
174-
echo "::group::Run inference"
175143
bash .ci/scripts/validate.sh "./checkpoints/${REPO_NAME}/model.pth" "cuda" "aoti"
176144
echo "::endgroup::"

0 commit comments

Comments
 (0)