Skip to content

Commit 968819d

Browse files
Merge pull request #517 from janhq/update-dev-from-master-2026-05-16-01-02
Sync master with upstream release b9173
2 parents: ed758db + 49d1701 — commit 968819d

104 files changed

Lines changed: 15678 additions & 14138 deletions

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

.github/workflows/release.yml

Lines changed: 8 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -104,7 +104,7 @@ jobs:
104104
id: pack_artifacts
105105
run: |
106106
cp LICENSE ./build/bin/
107-
tar -czvf llama-${{ steps.tag.outputs.name }}-bin-macos-${{ matrix.build }}.tar.gz -s ",./,llama-${{ steps.tag.outputs.name }}/," -C ./build/bin .
107+
tar -czvf llama-${{ steps.tag.outputs.name }}-bin-macos-${{ matrix.build }}.tar.gz -s ",^\.,llama-${{ steps.tag.outputs.name }}," -C ./build/bin .
108108
109109
- name: Upload artifacts
110110
uses: actions/upload-artifact@v6
@@ -182,7 +182,7 @@ jobs:
182182
id: pack_artifacts
183183
run: |
184184
cp LICENSE ./build/bin/
185-
tar -czvf llama-${{ steps.tag.outputs.name }}-bin-ubuntu-${{ matrix.build }}.tar.gz --transform "s,./,llama-${{ steps.tag.outputs.name }}/," -C ./build/bin .
185+
tar -czvf llama-${{ steps.tag.outputs.name }}-bin-ubuntu-${{ matrix.build }}.tar.gz --transform "s,^\.,llama-${{ steps.tag.outputs.name }}," -C ./build/bin .
186186
187187
- name: Upload artifacts
188188
uses: actions/upload-artifact@v6
@@ -259,7 +259,7 @@ jobs:
259259
id: pack_artifacts
260260
run: |
261261
cp LICENSE ./build/bin/
262-
tar -czvf llama-${{ steps.tag.outputs.name }}-bin-ubuntu-vulkan-${{ matrix.build }}.tar.gz --transform "s,./,llama-${{ steps.tag.outputs.name }}/," -C ./build/bin .
262+
tar -czvf llama-${{ steps.tag.outputs.name }}-bin-ubuntu-vulkan-${{ matrix.build }}.tar.gz --transform "s,^\.,llama-${{ steps.tag.outputs.name }}," -C ./build/bin .
263263
264264
- name: Upload artifacts
265265
uses: actions/upload-artifact@v6
@@ -337,7 +337,7 @@ jobs:
337337
id: pack_artifacts
338338
run: |
339339
cp LICENSE ./build/bin/
340-
tar -czvf llama-${{ steps.tag.outputs.name }}-bin-android-arm64.tar.gz --transform "s,./,llama-${{ steps.tag.outputs.name }}/," -C ./build/bin .
340+
tar -czvf llama-${{ steps.tag.outputs.name }}-bin-android-arm64.tar.gz --transform "s,^\.,llama-${{ steps.tag.outputs.name }}," -C ./build/bin .
341341
342342
- name: Upload artifacts
343343
uses: actions/upload-artifact@v6
@@ -426,7 +426,7 @@ jobs:
426426
id: pack_artifacts
427427
run: |
428428
cp LICENSE ./build/ReleaseOV/bin/
429-
tar -czvf llama-${{ steps.tag.outputs.name }}-bin-ubuntu-openvino-${{ env.OPENVINO_VERSION_MAJOR }}-x64.tar.gz --transform "s,./,llama-${{ steps.tag.outputs.name }}/," -C ./build/ReleaseOV/bin .
429+
tar -czvf llama-${{ steps.tag.outputs.name }}-bin-ubuntu-openvino-${{ env.OPENVINO_VERSION_MAJOR }}-x64.tar.gz --transform "s,^\.,llama-${{ steps.tag.outputs.name }}," -C ./build/ReleaseOV/bin .
430430
431431
- name: Upload artifacts
432432
uses: actions/upload-artifact@v6
@@ -867,7 +867,7 @@ jobs:
867867
id: pack_artifacts
868868
run: |
869869
cp LICENSE ./build/bin/
870-
tar -czvf llama-${{ steps.tag.outputs.name }}-bin-ubuntu-sycl-${{ matrix.build }}-x64.tar.gz --transform "s,./,llama-${{ steps.tag.outputs.name }}/," -C ./build/bin .
870+
tar -czvf llama-${{ steps.tag.outputs.name }}-bin-ubuntu-sycl-${{ matrix.build }}-x64.tar.gz --transform "s,^\.,llama-${{ steps.tag.outputs.name }}," -C ./build/bin .
871871
872872
- name: Upload artifacts
873873
uses: actions/upload-artifact@v6
@@ -979,7 +979,7 @@ jobs:
979979
id: pack_artifacts
980980
run: |
981981
cp LICENSE ./build/bin/
982-
tar -czvf llama-${{ steps.tag.outputs.name }}-bin-ubuntu-rocm-${{ env.ROCM_VERSION_SHORT }}-${{ matrix.build }}.tar.gz --transform "s,./,llama-${{ steps.tag.outputs.name }}/," -C ./build/bin .
982+
tar -czvf llama-${{ steps.tag.outputs.name }}-bin-ubuntu-rocm-${{ env.ROCM_VERSION_SHORT }}-${{ matrix.build }}.tar.gz --transform "s,^\.,llama-${{ steps.tag.outputs.name }}," -C ./build/bin .
983983
984984
- name: Upload artifacts
985985
uses: actions/upload-artifact@v6
@@ -1240,7 +1240,7 @@ jobs:
12401240
- name: Pack artifacts
12411241
run: |
12421242
cp LICENSE ./build/bin/
1243-
tar -czvf llama-${{ steps.tag.outputs.name }}-bin-${{ matrix.chip_type }}-openEuler-${{ matrix.arch }}${{ matrix.use_acl_graph == 'on' && '-aclgraph' || '' }}.tar.gz --transform "s,./,llama-${{ steps.tag.outputs.name }}/," -C ./build/bin .
1243+
tar -czvf llama-${{ steps.tag.outputs.name }}-bin-${{ matrix.chip_type }}-openEuler-${{ matrix.arch }}${{ matrix.use_acl_graph == 'on' && '-aclgraph' || '' }}.tar.gz --transform "s,^\.,llama-${{ steps.tag.outputs.name }}," -C ./build/bin .
12441244
12451245
- name: Upload artifacts
12461246
uses: actions/upload-artifact@v6

README.md

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -172,6 +172,7 @@ Instructions for adding support for new models: [HOWTO-add-model.md](docs/develo
172172
- JavaScript/Wasm (works in browser): [tangledgroup/llama-cpp-wasm](https://github.com/tangledgroup/llama-cpp-wasm)
173173
- Typescript/Wasm (nicer API, available on npm): [ngxson/wllama](https://github.com/ngxson/wllama)
174174
- Ruby: [yoshoku/llama_cpp.rb](https://github.com/yoshoku/llama_cpp.rb)
175+
- Ruby: [docusealco/rllama](https://github.com/docusealco/rllama)
175176
- Rust (more features): [edgenai/llama_cpp-rs](https://github.com/edgenai/llama_cpp-rs)
176177
- Rust (nicer API): [mdrokz/rust-llama.cpp](https://github.com/mdrokz/rust-llama.cpp)
177178
- Rust (more direct bindings): [utilityai/llama-cpp-rs](https://github.com/utilityai/llama-cpp-rs)

common/reasoning-budget.cpp

Lines changed: 10 additions & 11 deletions
Original file line number | Diff line number | Diff line change
@@ -171,22 +171,12 @@ static void common_reasoning_budget_reset(struct llama_sampler * smpl) {
171171
ctx->force_pos = 0;
172172
}
173173

174-
// forward declaration for use in clone
175174
static struct llama_sampler * common_reasoning_budget_init_state(
176175
const struct llama_vocab * vocab, const std::vector<llama_token> & start_tokens,
177176
const std::vector<llama_token> & end_tokens, const std::vector<llama_token> & forced_tokens,
178177
int32_t budget, common_reasoning_budget_state initial_state);
179178

180-
static struct llama_sampler * common_reasoning_budget_clone(const struct llama_sampler * smpl) {
181-
const auto * ctx = (const common_reasoning_budget_ctx *) smpl->ctx;
182-
return common_reasoning_budget_init_state(
183-
ctx->vocab,
184-
ctx->start_matcher.tokens,
185-
ctx->end_matcher.tokens,
186-
ctx->forced_tokens,
187-
ctx->budget,
188-
ctx->state);
189-
}
179+
static struct llama_sampler * common_reasoning_budget_clone(const struct llama_sampler * smpl);
190180

191181
static void common_reasoning_budget_free(struct llama_sampler * smpl) {
192182
delete (common_reasoning_budget_ctx *) smpl->ctx;
@@ -205,6 +195,15 @@ static struct llama_sampler_i common_reasoning_budget_i = {
205195
/* .backend_set_input = */ nullptr,
206196
};
207197

198+
static struct llama_sampler * common_reasoning_budget_clone(const struct llama_sampler * smpl) {
199+
const auto * ctx = (const common_reasoning_budget_ctx *) smpl->ctx;
200+
201+
return llama_sampler_init(
202+
/* .iface = */ &common_reasoning_budget_i,
203+
/* .ctx = */ new common_reasoning_budget_ctx(*ctx)
204+
);
205+
}
206+
208207
static struct llama_sampler * common_reasoning_budget_init_state(
209208
const struct llama_vocab * vocab,
210209
const std::vector<llama_token> & start_tokens,

0 commit comments

Comments
 (0)