@@ -50,13 +50,13 @@ jobs:
5050 - name : Build
5151 run : |
5252 pushd experimental/jetstream-maxtext-stable-stack
53- ./build.sh \
53+ # ./build.sh \
5454 LOCAL_IMAGE_TAG="${LOCAL_IMAGE_TAG}"
5555 popd
5656 - name : Test
5757 run : |
5858 pushd experimental/jetstream-maxtext-stable-stack
59- ./test.sh \
59+ # ./test.sh \
6060 LOCAL_IMAGE_TAG=${LOCAL_IMAGE_TAG}
6161 popd
6262 - name : Upload image
@@ -65,42 +65,48 @@ jobs:
6565 docker tag ${LOCAL_IMAGE_TAG} ${UPLOAD_IMAGE_TAG}
6666 docker push ${UPLOAD_IMAGE_TAG}
6767
68+
6869 benchmark_report :
6970 name : Benchmark Report
7071 needs : build_stable_stack
7172 runs-on : ["self-hosted", "tpu", "v6e-8"]
72- container :
73- # sync with the image uploaded from build_stable_stack stage
74- image : gcr.io/cloud-ml-auto-solutions/jetstream-maxtext-stable-stack/tpu:github_${{ github.run_id }}
75- options : " --privileged"
7673 env :
77- OUTPUT_DIR : /workspace /test_dir/
74+ OUTPUT_DIR : . /test_dir/
7875 steps :
79- - name : Create output directory # Ensure directory exists in container
80- run : mkdir -p ${OUTPUT_DIR}
8176 - name : Test MOEBenchmarks
82- # Report should generated in OUTPUT_DIR depend on ENV
83- run : bash JetStream/.github/workflows/test_moe_benchmarks.sh
77+ run : |
78+ mkdir -p ${OUTPUT_DIR}
79+ # sync with the image uploaded from build_stable_stack stage
80+ # The report should be generated in the container's OUTPUT_DIR (set via --env), which is bind-mounted to the host OUTPUT_DIR
81+ DOCKER_OUTPUT_DIR=/output
82+ docker run \
83+ -v ${OUTPUT_DIR}:${DOCKER_OUTPUT_DIR} \
84+ --env OUTPUT_DIR=${DOCKER_OUTPUT_DIR} \
85+ --privileged --net=host --rm -i \
86+ gcr.io/cloud-ml-auto-solutions/jetstream-maxtext-stable-stack/tpu:github_${{ github.run_id }} \
87+ bash -c "
88+ bash JetStream/.github/workflows/test_moe_benchmarks.sh
89+ "
8490 - name : Upload build artifact
8591 uses : actions/upload-artifact@v4
8692 with :
8793 name : benchmark_report
8894 path : ${{ env.OUTPUT_DIR }}
8995
90- clean_up_on_fail :
91- if : ${{ failure() }}
92- needs : [build_stable_stack, benchmark_report]
93- name : " Clean up"
94- runs-on : ["self-hosted"]
95- permissions :
96- contents : read
97- issues : write # for failed-build-issue
98- steps :
99- - name : Authenticate gcloud
100- run : gcloud auth configure-docker gcr.io --quiet
101- - name : Delete TPU image
102- # sync with the image uploaded from build_stable_stack stage
103- run : gcloud container images delete gcr.io/cloud-ml-auto-solutions/jetstream-maxtext-stable-stack/tpu:github_${{ github.run_id }} --force-delete-tags --quiet
96+ # clean_up_on_fail:
97+ # if: ${{ failure() }}
98+ # needs: [build_stable_stack, benchmark_report]
99+ # name: "Clean up"
100+ # runs-on: ["self-hosted"]
101+ # permissions:
102+ # contents: read
103+ # issues: write # for failed-build-issue
104+ # steps:
105+ # - name: Authenticate gcloud
106+ # run: gcloud auth configure-docker gcr.io --quiet
107+ # - name: Delete TPU image
108+ # # sync with the image uploaded from build_stable_stack stage
109+ # run: gcloud container images delete gcr.io/cloud-ml-auto-solutions/jetstream-maxtext-stable-stack/tpu:github_${{ github.run_id }} --force-delete-tags --quiet
104110
105111 tag_night_image :
106112 needs : [build_stable_stack, benchmark_report]
0 commit comments