@@ -94,13 +94,23 @@ jobs:
9494 tornado --version
9595 ./mvnw clean package -DskipTests
# Runs the FP16 Llama-3.2-1B model once on the matrix backend without any
# extra mode flag (the "Standard" configuration).
- name: FP16 - Run Llama-3.2-1B-Instruct-F16.gguf - Standard
  env:
    # JAVA_TOOL_OPTIONS is read by every JVM launched in this step, so the
    # llama.metrics.* system properties reach the application without
    # changing the launcher command line. The target file is the one the
    # "Publish performance summary" step later appends to the job summary.
    # NOTE(review): the meaning of format=github / output=file is defined by
    # the application, not by this workflow — confirm against its docs.
    JAVA_TOOL_OPTIONS: >-
      -Dllama.metrics.format=github
      -Dllama.metrics.output=file
      -Dllama.metrics.file=${{ runner.temp }}/metrics-${{ matrix.backend.name }}-standard.md
  run: |
    cd ${{ github.workspace }}
    export PATH="$TORNADOVM_HOME/bin:$JAVA_HOME/bin:$PATH"
    ./llama-tornado --gpu --${{ matrix.backend.name }} \
      --model $MODELS_DIR/Llama-3.2-1B-Instruct-F16.gguf \
      --prompt "Say hello"
103108 - name : FP16 - Run Llama-3.2-1B-Instruct-F16.gguf - Prefill-Decode
109+ env :
110+ JAVA_TOOL_OPTIONS : >-
111+ -Dllama.metrics.format=github
112+ -Dllama.metrics.output=file
113+ -Dllama.metrics.file=${{ runner.temp }}/metrics-${{ matrix.backend.name }}-prefill-decode.md
104114 run : |
105115 cd ${{ github.workspace }}
106116 export PATH="$TORNADOVM_HOME/bin:$JAVA_HOME/bin:$PATH"
@@ -109,6 +119,11 @@ jobs:
109119 --prompt "Say hello" \
110120 --with-prefill-decode
111121 - name : FP16 - Run Llama-3.2-1B-Instruct-F16.gguf - Batch-Prefill-Decode
122+ env :
123+ JAVA_TOOL_OPTIONS : >-
124+ -Dllama.metrics.format=github
125+ -Dllama.metrics.output=file
126+ -Dllama.metrics.file=${{ runner.temp }}/metrics-${{ matrix.backend.name }}-batch-prefill-decode.md
112127 run : |
113128 cd ${{ github.workspace }}
114129 export PATH="$TORNADOVM_HOME/bin:$JAVA_HOME/bin:$PATH"
@@ -227,4 +242,14 @@ jobs:
227242 ./llama-tornado --gpu --${{ matrix.backend.name }} \
228243 --model /$MODELS_DIR/granite-4.0-1b-Q8_0.gguf \
229244 --prompt "Say hello"
# Appends the per-mode metrics files written by the three FP16 Llama-3.2-1B
# run steps to the job summary page.
- name: Publish performance summary
  # always(): still publish whatever metrics exist when an earlier step failed.
  if: always()
  env:
    # Pass expression values through the environment instead of splicing
    # them into the script text, so they can be quoted safely by the shell.
    BACKEND: ${{ matrix.backend.name }}
    METRICS_DIR: ${{ runner.temp }}
  run: |
    # Each entry is "<section title>:<metrics file suffix>".
    {
      echo "## Llama-3.2-1B FP16 — ${BACKEND}"
      for entry in \
        "Standard:standard" \
        "Prefill-Decode:prefill-decode" \
        "Batch-Prefill-Decode:batch-prefill-decode"; do
        title="${entry%%:*}"
        metrics_file="${METRICS_DIR}/metrics-${BACKEND}-${entry##*:}.md"
        echo "### ${title}"
        # Because this step runs under always(), a run step may have failed
        # or been skipped and left no file; a bare `cat` would then abort
        # the step and drop the remaining sections.
        if [ -s "${metrics_file}" ]; then
          cat "${metrics_file}"
        else
          echo "_No metrics recorded (run failed or was skipped)._"
        fi
        # Blank line so the next heading never glues onto a file that
        # lacks a trailing newline.
        echo
      done
    } >> "$GITHUB_STEP_SUMMARY"
230255
0 commit comments