@@ -50,57 +50,65 @@ jobs:
# NOTE(review): with ./build.sh commented out below, the remaining
# LOCAL_IMAGE_TAG line is only a shell self-assignment, so this step no
# longer builds anything. Confirm this is intended beyond debugging.
5050 - name : Build
5151 run : |
5252 pushd experimental/jetstream-maxtext-stable-stack
53- ./build.sh \
53+ # ./build.sh \
5454 LOCAL_IMAGE_TAG="${LOCAL_IMAGE_TAG}"
5555 popd
# NOTE(review): with ./test.sh commented out below, the remaining
# LOCAL_IMAGE_TAG line is only a shell self-assignment, so this step no
# longer runs any test. Confirm this is intended beyond debugging.
5656 - name : Test
5757 run : |
5858 pushd experimental/jetstream-maxtext-stable-stack
59- ./test.sh \
59+ # ./test.sh \
6060 LOCAL_IMAGE_TAG=${LOCAL_IMAGE_TAG}
6161 popd
# NOTE(review): the docker tag/push of the locally built image is commented
# out; instead the existing tpu:nightly image is given the additional tag
# ${UPLOAD_IMAGE_TAG} via `gcloud container images add-tag SRC DEST`.
# Presumably a temporary shortcut while the build is disabled - confirm.
6262 - name : Upload image
6363 run : |
64+ # UPLOAD_IMAGE_TAG=gcr.io/cloud-ml-auto-solutions/${LOCAL_IMAGE_TAG}
65+ # docker tag ${LOCAL_IMAGE_TAG} ${UPLOAD_IMAGE_TAG}
66+ # docker push ${UPLOAD_IMAGE_TAG}
6467 UPLOAD_IMAGE_TAG=gcr.io/cloud-ml-auto-solutions/${LOCAL_IMAGE_TAG}
65- docker tag ${LOCAL_IMAGE_TAG} ${UPLOAD_IMAGE_TAG}
66- docker push ${UPLOAD_IMAGE_TAG}
68+ gcloud container images add-tag gcr.io/cloud-ml-auto-solutions/jetstream-maxtext-stable-stack/tpu:nightly "${UPLOAD_IMAGE_TAG}" --quiet
69+
6770
# benchmark_report: runs the MoE benchmark script inside the stable-stack
# image via an explicit `docker run` (replacing the job-level `container:`),
# bind-mounting the host OUTPUT_DIR at /output so the generated report can be
# uploaded as an artifact by the final step.
6871 benchmark_report :
6972 name : Benchmark Report
7073 needs : build_stable_stack
7174 runs-on : ["self-hosted", "tpu", "v6e-8"]
72- container :
73- # sync with the image uploaded from build_stable_stack stage
74- image : gcr.io/cloud-ml-auto-solutions/jetstream-maxtext-stable-stack/tpu:github_${{ github.run_id }}
75- options : " --privileged"
7675 env :
77- OUTPUT_DIR : /workspace /test_dir/
76+ OUTPUT_DIR : ./test_dir/
7877 steps :
79- - name : Create output directory # Ensure directory exists in container
80- run : mkdir -p ${OUTPUT_DIR}
8178 - name : Test MOEBenchmarks
82- # Report should generated in OUTPUT_DIR depend on ENV
83- run : bash JetStream/.github/workflows/test_moe_benchmarks.sh
79+ run : |
80+ mkdir -p "${OUTPUT_DIR}"
81+ # Keep the image below in sync with the one uploaded by the build_stable_stack job
82+ # The report should be generated in OUTPUT_DIR, which the container receives via --env
83+ DOCKER_OUTPUT_DIR=/output
84+ docker run \
85+ -v "$(realpath "${OUTPUT_DIR}"):${DOCKER_OUTPUT_DIR}" \
86+ --env OUTPUT_DIR=${DOCKER_OUTPUT_DIR} \
87+ --privileged --net=host --rm -i \
88+ gcr.io/cloud-ml-auto-solutions/jetstream-maxtext-stable-stack/tpu:github_${{ github.run_id }} \
89+ bash -c "
90+ bash JetStream/.github/workflows/test_moe_benchmarks.sh
91+ "
8492 - name : Upload build artifact
8593 uses : actions/upload-artifact@v4
8694 with :
8795 name : benchmark_report
8896 path : ${{ env.OUTPUT_DIR }}
8997
# NOTE(review): this change comments out the entire clean_up_on_fail job, so
# the tpu:github_<run_id> image is no longer deleted when an earlier job
# fails. Confirm this is intended beyond debugging.
90- clean_up_on_fail :
91- if : ${{ failure() }}
92- needs : [build_stable_stack, benchmark_report]
93- name : " Clean up"
94- runs-on : ["self-hosted"]
95- permissions :
96- contents : read
97- issues : write # for failed-build-issue
98- steps :
99- - name : Authenticate gcloud
100- run : gcloud auth configure-docker gcr.io --quiet
101- - name : Delete TPU image
102- # sync with the image uploaded from build_stable_stack stage
103- run : gcloud container images delete gcr.io/cloud-ml-auto-solutions/jetstream-maxtext-stable-stack/tpu:github_${{ github.run_id }} --force-delete-tags --quiet
98+ # clean_up_on_fail:
99+ # if: ${{ failure() }}
100+ # needs: [build_stable_stack, benchmark_report]
101+ # name: "Clean up"
102+ # runs-on: ["self-hosted"]
103+ # permissions:
104+ # contents: read
105+ # issues: write # for failed-build-issue
106+ # steps:
107+ # - name: Authenticate gcloud
108+ # run: gcloud auth configure-docker gcr.io --quiet
109+ # - name: Delete TPU image
110+ # # sync with the image uploaded from build_stable_stack stage
111+ # run: gcloud container images delete gcr.io/cloud-ml-auto-solutions/jetstream-maxtext-stable-stack/tpu:github_${{ github.run_id }} --force-delete-tags --quiet
104112
105113 tag_night_image :
106114 needs : [build_stable_stack, benchmark_report]
0 commit comments