Skip to content

Commit 72ce770

Browse files
[wip][ci] Add metrics tracking and publishing in CI workflows
1 parent e966ed1 commit 72ce770

1 file changed

Lines changed: 25 additions & 0 deletions

File tree

.github/workflows/build-and-run.yml

Lines changed: 25 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -94,13 +94,23 @@ jobs:
9494
tornado --version
9595
./mvnw clean package -DskipTests
9696
# Standard (single-pass) FP16 inference run of Llama-3.2-1B-Instruct.
# The llama.metrics.* system properties are handed over through
# JAVA_TOOL_OPTIONS (presumably picked up by the JVM that llama-tornado
# launches - confirm). The report path under runner.temp is the same file
# the "Publish performance summary" step later appends to the job summary.
- name: FP16 - Run Llama-3.2-1B-Instruct-F16.gguf - Standard
  env:
    # Folded scalar (>-): the three -D flags are joined with single spaces
    # and the trailing newline is stripped.
    JAVA_TOOL_OPTIONS: >-
      -Dllama.metrics.format=github
      -Dllama.metrics.output=file
      -Dllama.metrics.file=${{ runner.temp }}/metrics-${{ matrix.backend.name }}-standard.md
  run: |
    # Quote expansions so a workspace or model directory containing spaces
    # or glob characters is not word-split by the shell.
    cd "${{ github.workspace }}"
    export PATH="$TORNADOVM_HOME/bin:$JAVA_HOME/bin:$PATH"
    ./llama-tornado --gpu --${{ matrix.backend.name }} \
      --model "$MODELS_DIR/Llama-3.2-1B-Instruct-F16.gguf" \
      --prompt "Say hello"
103108
- name: FP16 - Run Llama-3.2-1B-Instruct-F16.gguf - Prefill-Decode
109+
env:
110+
JAVA_TOOL_OPTIONS: >-
111+
-Dllama.metrics.format=github
112+
-Dllama.metrics.output=file
113+
-Dllama.metrics.file=${{ runner.temp }}/metrics-${{ matrix.backend.name }}-prefill-decode.md
104114
run: |
105115
cd ${{ github.workspace }}
106116
export PATH="$TORNADOVM_HOME/bin:$JAVA_HOME/bin:$PATH"
@@ -109,6 +119,11 @@ jobs:
109119
--prompt "Say hello" \
110120
--with-prefill-decode
111121
- name: FP16 - Run Llama-3.2-1B-Instruct-F16.gguf - Batch-Prefill-Decode
122+
env:
123+
JAVA_TOOL_OPTIONS: >-
124+
-Dllama.metrics.format=github
125+
-Dllama.metrics.output=file
126+
-Dllama.metrics.file=${{ runner.temp }}/metrics-${{ matrix.backend.name }}-batch-prefill-decode.md
112127
run: |
113128
cd ${{ github.workspace }}
114129
export PATH="$TORNADOVM_HOME/bin:$JAVA_HOME/bin:$PATH"
@@ -227,4 +242,14 @@ jobs:
227242
./llama-tornado --gpu --${{ matrix.backend.name }} \
228243
--model /$MODELS_DIR/granite-4.0-1b-Q8_0.gguf \
229244
--prompt "Say hello"
245+
# Append the FP16 Llama-3.2-1B metrics reports to the job summary.
# Because of `if: always()` this step also runs after an earlier inference
# step failed or was skipped, in which case its report file may not exist.
# Each report is therefore checked before being appended, so one missing
# file neither fails this step nor hides the remaining sections.
- name: Publish performance summary
  if: always()
  env:
    # Pass context values through the environment instead of expanding
    # them inside the script text, so the shell sees them as plain data.
    BACKEND: ${{ matrix.backend.name }}
    METRICS_DIR: ${{ runner.temp }}
  run: |
    # publish_section <heading> <file-suffix>
    # Prints a "###" heading followed by the matching metrics report, or a
    # placeholder line when that report was never written.
    publish_section() {
      report="$METRICS_DIR/metrics-$BACKEND-$2.md"
      echo "### $1"
      if [ -f "$report" ]; then
        cat "$report"
      else
        echo "_No metrics file was produced for this run._"
      fi
      # Blank line so the next heading never fuses with the last report line.
      echo
    }

    # Group the output so the summary file is opened for append only once.
    {
      echo "## Llama-3.2-1B FP16 — $BACKEND"
      publish_section "Standard" standard
      publish_section "Prefill-Decode" prefill-decode
      publish_section "Batch-Prefill-Decode" batch-prefill-decode
    } >> "$GITHUB_STEP_SUMMARY"
230255

0 commit comments

Comments
 (0)