@@ -50,57 +50,66 @@ jobs:
5050 - name : Build
5151 run : |
5252 pushd experimental/jetstream-maxtext-stable-stack
53- ./build.sh \
53+ # ./build.sh \
5454 LOCAL_IMAGE_TAG="${LOCAL_IMAGE_TAG}"
5555 popd
5656 - name : Test
5757 run : |
5858 pushd experimental/jetstream-maxtext-stable-stack
59- ./test.sh \
59+ # ./test.sh \
6060 LOCAL_IMAGE_TAG=${LOCAL_IMAGE_TAG}
6161 popd
6262 - name : Upload image
6363 run : |
64+ # UPLOAD_IMAGE_TAG=gcr.io/cloud-ml-auto-solutions/${LOCAL_IMAGE_TAG}
65+ # docker tag ${LOCAL_IMAGE_TAG} ${UPLOAD_IMAGE_TAG}
66+ # docker push ${UPLOAD_IMAGE_TAG}
6467 UPLOAD_IMAGE_TAG=gcr.io/cloud-ml-auto-solutions/${LOCAL_IMAGE_TAG}
65- docker tag ${LOCAL_IMAGE_TAG} ${UPLOAD_IMAGE_TAG}
66- docker push ${UPLOAD_IMAGE_TAG}
68+ gcloud container images add-tag gcr.io/cloud-ml-auto-solutions/jetstream-maxtext-stable-stack/tpu:nightly ${UPLOAD_IMAGE_TAG} --quiet # re-tags the existing nightly image as UPLOAD_IMAGE_TAG (local docker tag/push is commented out above)
69+
6770
6871 benchmark_report :
6972 name : Benchmark Report
7073 needs : build_stable_stack
7174 runs-on : ["self-hosted", "tpu", "v6e-8"]
72- container :
73- # sync with the image uploaded from build_stable_stack stage
74- image : gcr.io/cloud-ml-auto-solutions/jetstream-maxtext-stable-stack/tpu:github_${{ github.run_id }}
75- options : " --privileged"
7675 env :
77- OUTPUT_DIR : /workspace/ test_dir/
76+ OUTPUT_DIR : ./test_dir  # host-side report directory, relative to the step's working directory
7877 steps :
79- - name : Create output directory # Ensure directory exists in container
80- run : mkdir -p ${OUTPUT_DIR}
8178 - name : Test MOEBenchmarks
82- # Report should generated in OUTPUT_DIR depend on ENV
83- run : bash JetStream/.github/workflows/test_moe_benchmarks.sh
79+ run : |
80+ rm -rf ${OUTPUT_DIR}
81+ mkdir -p ${OUTPUT_DIR}
82+ # sync with the image uploaded from build_stable_stack stage
83+ # Report should be generated in OUTPUT_DIR, which is passed to the container via --env
84+ DOCKER_OUTPUT_DIR=/output # container-side mount point; the host side is made absolute below because older Docker rejects relative -v sources
85+ docker run \
86+ -v "$(pwd)/${OUTPUT_DIR}":${DOCKER_OUTPUT_DIR} \
87+ --env OUTPUT_DIR=${DOCKER_OUTPUT_DIR} \
88+ --privileged --net=host --rm -i \
89+ gcr.io/cloud-ml-auto-solutions/jetstream-maxtext-stable-stack/tpu:github_${{ github.run_id }} \
90+ bash -c "
91+ bash JetStream/.github/workflows/test_moe_benchmarks.sh
92+ "
8493 - name : Upload build artifact
8594 uses : actions/upload-artifact@v4
8695 with :
8796 name : benchmark_report
8897 path : ${{ env.OUTPUT_DIR }}
8998
90- clean_up_on_fail :
91- if : ${{ failure() }}
92- needs : [build_stable_stack, benchmark_report]
93- name : " Clean up"
94- runs-on : ["self-hosted"]
95- permissions :
96- contents : read
97- issues : write # for failed-build-issue
98- steps :
99- - name : Authenticate gcloud
100- run : gcloud auth configure-docker gcr.io --quiet
101- - name : Delete TPU image
102- # sync with the image uploaded from build_stable_stack stage
103- run : gcloud container images delete gcr.io/cloud-ml-auto-solutions/jetstream-maxtext-stable-stack/tpu:github_${{ github.run_id }} --force-delete-tags --quiet
99+ # clean_up_on_fail:
100+ # if: ${{ failure() }}
101+ # needs: [build_stable_stack, benchmark_report]
102+ # name: "Clean up"
103+ # runs-on: ["self-hosted"]
104+ # permissions:
105+ # contents: read
106+ # issues: write # for failed-build-issue
107+ # steps:
108+ # - name: Authenticate gcloud
109+ # run: gcloud auth configure-docker gcr.io --quiet
110+ # - name: Delete TPU image
111+ # # sync with the image uploaded from build_stable_stack stage
112+ # run: gcloud container images delete gcr.io/cloud-ml-auto-solutions/jetstream-maxtext-stable-stack/tpu:github_${{ github.run_id }} --force-delete-tags --quiet
104113
105114 tag_night_image :
106115 needs : [build_stable_stack, benchmark_report]
@@ -126,12 +135,16 @@ jobs:
126135 name : Notify test build # creates an issue or modifies last open existing issue for failed build
127136 needs : [build_stable_stack, benchmark_report]
128137 runs-on : ["self-hosted", "tpu", "v6e-8"]
138+ env :
139+ BENCHMARK_REPORT_DIR : ./benchmark_report
129140 steps :
141+ - name : Clean previous artifact
142+ run : rm -rf ${{ env.BENCHMARK_REPORT_DIR }}  # this job's env defines BENCHMARK_REPORT_DIR, not OUTPUT_DIR
130143 - name : Download benchmark artifact
131144 uses : actions/download-artifact@v4
132145 with :
133146 name : benchmark_report
134- path : ./benchmark_report
147+ path : ${{ env.BENCHMARK_REPORT_DIR }}  # same directory that is cleaned above and read by "cat report"
135148 - name : Check whether one of the jobs failed
136149 if : ${{ failure() }}
137150 uses : jayqi/failed-build-issue-action@1a893bbf43ef1c2a8705e2b115cd4f0fe3c5649b # v1.2.0
@@ -140,16 +153,19 @@ jobs:
140153 - name : Log message if dependent job succeeded
141154 if : ${{ ! (failure() && github.event.pull_request == null) }}
142155 run : echo "Conditions for creating/updating issue not met. Skipping."
143- - name : Send email
144- uses : dawidd6/action-send-mail@v3.6.0
145- with :
146- server_address : smtp.gmail.com
147- server_port : 465
148- username : ${{secrets.MAIL_USERNAME}}
149- password : ${{secrets.MAIL_PASSWORD}}
150- subject : Message from Inference Stable Stack Runs.
151- to : singhvijaya@google.com, yuyanpeng@google.com, vipannalla@google.com
152- from : JetStream Runs
153- secure : true
154- attachments : ./benchmark_report/moe_8x7b.txt,./benchmark_report/moe_8x22b.txt,./benchmark_report/moe_8x22b_long_context_8k_prefill.txt,./benchmark_report/moe_8x7b_jetstream.txt
155- body : workflow for ${{github.repository}} completed successfully!
156+ - name : cat report
157+ run : |
158+ cat ${{ env.BENCHMARK_REPORT_DIR }}/moe_8x7b.txt ${{ env.BENCHMARK_REPORT_DIR }}/moe_8x22b.txt ${{ env.BENCHMARK_REPORT_DIR }}/moe_8x22b_long_context_8k_prefill.txt ${{ env.BENCHMARK_REPORT_DIR }}/moe_8x7b_jetstream.txt
159+ # - name: Send email
160+ # uses: dawidd6/action-send-mail@v3.6.0
161+ # with:
162+ # server_address: smtp.gmail.com
163+ # server_port: 465
164+ # username: ${{secrets.MAIL_USERNAME}}
165+ # password: ${{secrets.MAIL_PASSWORD}}
166+ # subject: Message from Inference Stable Stack Runs.
167+ # to: singhvijaya@google.com, yuyanpeng@google.com, vipannalla@google.com
168+ # from: JetStream Runs
169+ # secure: true
170+ # attachments: ./benchmark_report/moe_8x7b.txt,./benchmark_report/moe_8x22b.txt,./benchmark_report/moe_8x22b_long_context_8k_prefill.txt,./benchmark_report/moe_8x7b_jetstream.txt
171+ # body: workflow for ${{github.repository}} completed successfully!
0 commit comments