fix(ci): clean up KVarN cache warnings

Anbeeld · Anbeeld · commit 6914c6ec9067 · 2026-06-05T13:32:28.000+02:00
diff --git a/src/llama-kv-cache-iswa.cpp b/src/llama-kv-cache-iswa.cpp
@@ -210,7 +210,7 @@ llama_memory_context_ptr llama_kv_cache_iswa::init_batch(llama_batch_allocr & ba
         }
 
         return std::make_unique<llama_kv_cache_iswa_context>(
-                this, std::move(ctx_base), std::move(ctx_swa), std::move(ubatches));
+                std::move(ctx_base), std::move(ctx_swa), std::move(ubatches));
     } while (false);
 
     // if it fails, try equal split
@@ -244,7 +244,7 @@ llama_memory_context_ptr llama_kv_cache_iswa::init_batch(llama_batch_allocr & ba
         }
 
         return std::make_unique<llama_kv_cache_iswa_context>(
-                this, std::move(ctx_base), std::move(ctx_swa), std::move(ubatches));
+                std::move(ctx_base), std::move(ctx_swa), std::move(ubatches));
     } while (false);
 
     // TODO: if we fail again, we should attempt different splitting strategies
@@ -277,7 +277,7 @@ llama_memory_context_ptr llama_kv_cache_iswa::init_kv_batch(const std::vector<ll
     }
 
     return std::make_unique<llama_kv_cache_iswa_context>(
-            this, std::move(ctx_base), std::move(ctx_swa), ubatches);
+            std::move(ctx_base), std::move(ctx_swa), ubatches);
 }
 
 bool llama_kv_cache_iswa::get_can_shift() const {
@@ -333,7 +333,6 @@ llama_kv_cache_iswa_context::llama_kv_cache_iswa_context(
 }
 
 llama_kv_cache_iswa_context::llama_kv_cache_iswa_context(
-        llama_kv_cache_iswa * kv,
         llama_memory_context_ptr ctx_base_in,
         llama_memory_context_ptr ctx_swa_in,
         std::vector<llama_ubatch> ubatches) :
diff --git a/src/llama-kv-cache-iswa.h b/src/llama-kv-cache-iswa.h
@@ -108,7 +108,6 @@ class llama_kv_cache_iswa_context : public llama_memory_context_i {
 
     // used to create a batch processing context from a batch
     llama_kv_cache_iswa_context(
-            llama_kv_cache_iswa * kv,
             llama_memory_context_ptr ctx_base_in,
             llama_memory_context_ptr ctx_swa_in,
             std::vector<llama_ubatch> ubatches);
diff --git a/src/llama-kv-cache-kvarn.cpp b/src/llama-kv-cache-kvarn.cpp
@@ -233,7 +233,6 @@ llama_kv_cache_kvarn::llama_kv_cache_kvarn(
         llama_swa_type swa_type,
         const layer_filter_cb & filter,
         const layer_reuse_cb & reuse) :
-    model(model),
     hparams(hparams),
     params(params),
     n_stream(unified ? 1u : n_seq_max),
@@ -565,11 +564,11 @@ void llama_kv_cache_kvarn::seq_keep(llama_seq_id seq_id) {
     metadata->seq_keep(seq_id);
 }
 
-void llama_kv_cache_kvarn::seq_add(llama_seq_id, llama_pos, llama_pos, llama_pos) {
+GGML_NORETURN void llama_kv_cache_kvarn::seq_add(llama_seq_id, llama_pos, llama_pos, llama_pos) {
     GGML_ABORT("KVarN does not support position shifts");
 }
 
-void llama_kv_cache_kvarn::seq_div(llama_seq_id, llama_pos, llama_pos, int) {
+GGML_NORETURN void llama_kv_cache_kvarn::seq_div(llama_seq_id, llama_pos, llama_pos, int) {
     GGML_ABORT("KVarN does not support position division");
 }
 
diff --git a/src/llama-kv-cache-kvarn.h b/src/llama-kv-cache-kvarn.h
@@ -108,8 +108,8 @@ class llama_kv_cache_kvarn : public llama_memory_i {
     void seq_cp(llama_seq_id seq_id_src, llama_seq_id seq_id_dst, llama_pos p0, llama_pos p1) override;
     void seq_cp_recurrent(llama_seq_id, llama_seq_id, llama_pos, llama_pos) override {}
     void seq_keep(llama_seq_id seq_id) override;
-    void seq_add(llama_seq_id seq_id, llama_pos p0, llama_pos p1, llama_pos shift) override;
-    void seq_div(llama_seq_id seq_id, llama_pos p0, llama_pos p1, int d) override;
+    GGML_NORETURN void seq_add(llama_seq_id seq_id, llama_pos p0, llama_pos p1, llama_pos shift) override;
+    GGML_NORETURN void seq_div(llama_seq_id seq_id, llama_pos p0, llama_pos p1, int d) override;
     llama_pos seq_pos_min(llama_seq_id seq_id) const override;
     llama_pos seq_pos_max(llama_seq_id seq_id) const override;
 
@@ -159,7 +159,6 @@ class llama_kv_cache_kvarn : public llama_memory_i {
     bool can_remove(llama_seq_id seq_id, llama_pos p0, llama_pos p1) const;
     void copy_kvarn_stream(uint32_t stream_src, uint32_t stream_dst);
 
-    const llama_model & model;
     const llama_hparams & hparams;
     const llama_kvarn_params params;
     const uint32_t n_stream;

Original file line number	Diff line number	Diff line change
`@@ -210,7 +210,7 @@ llama_memory_context_ptr llama_kv_cache_iswa::init_batch(llama_batch_allocr & ba`
`210`	`210`	`}`
`211`	`211`
`212`	`212`	`return std::make_unique<llama_kv_cache_iswa_context>(`
`213`		`- this, std::move(ctx_base), std::move(ctx_swa), std::move(ubatches));`
	`213`	`+ std::move(ctx_base), std::move(ctx_swa), std::move(ubatches));`
`214`	`214`	`} while (false);`
`215`	`215`
`216`	`216`	`// if it fails, try equal split`
`@@ -244,7 +244,7 @@ llama_memory_context_ptr llama_kv_cache_iswa::init_batch(llama_batch_allocr & ba`
`244`	`244`	`}`
`245`	`245`
`246`	`246`	`return std::make_unique<llama_kv_cache_iswa_context>(`
`247`		`- this, std::move(ctx_base), std::move(ctx_swa), std::move(ubatches));`
	`247`	`+ std::move(ctx_base), std::move(ctx_swa), std::move(ubatches));`
`248`	`248`	`} while (false);`
`249`	`249`
`250`	`250`	`// TODO: if we fail again, we should attempt different splitting strategies`
`@@ -277,7 +277,7 @@ llama_memory_context_ptr llama_kv_cache_iswa::init_kv_batch(const std::vector<ll`
`277`	`277`	`}`
`278`	`278`
`279`	`279`	`return std::make_unique<llama_kv_cache_iswa_context>(`
`280`		`- this, std::move(ctx_base), std::move(ctx_swa), ubatches);`
	`280`	`+ std::move(ctx_base), std::move(ctx_swa), ubatches);`
`281`	`281`	`}`
`282`	`282`
`283`	`283`	`bool llama_kv_cache_iswa::get_can_shift() const {`
`@@ -333,7 +333,6 @@ llama_kv_cache_iswa_context::llama_kv_cache_iswa_context(`
`333`	`333`	`}`
`334`	`334`
`335`	`335`	`llama_kv_cache_iswa_context::llama_kv_cache_iswa_context(`
`336`		`- llama_kv_cache_iswa * kv,`
`337`	`336`	`llama_memory_context_ptr ctx_base_in,`
`338`	`337`	`llama_memory_context_ptr ctx_swa_in,`
`339`	`338`	`std::vector<llama_ubatch> ubatches) :`
Original file line number	Diff line number	Diff line change
`@@ -233,7 +233,6 @@ llama_kv_cache_kvarn::llama_kv_cache_kvarn(`
`233`	`233`	`llama_swa_type swa_type,`
`234`	`234`	`const layer_filter_cb & filter,`
`235`	`235`	`const layer_reuse_cb & reuse) :`
`236`		`- model(model),`
`237`	`236`	`hparams(hparams),`
`238`	`237`	`params(params),`
`239`	`238`	`n_stream(unified ? 1u : n_seq_max),`
`@@ -565,11 +564,11 @@ void llama_kv_cache_kvarn::seq_keep(llama_seq_id seq_id) {`
`565`	`564`	`metadata->seq_keep(seq_id);`
`566`	`565`	`}`
`567`	`566`
`568`		`-void llama_kv_cache_kvarn::seq_add(llama_seq_id, llama_pos, llama_pos, llama_pos) {`
	`567`	`+GGML_NORETURN void llama_kv_cache_kvarn::seq_add(llama_seq_id, llama_pos, llama_pos, llama_pos) {`
`569`	`568`	`GGML_ABORT("KVarN does not support position shifts");`
`570`	`569`	`}`
`571`	`570`
`572`		`-void llama_kv_cache_kvarn::seq_div(llama_seq_id, llama_pos, llama_pos, int) {`
	`571`	`+GGML_NORETURN void llama_kv_cache_kvarn::seq_div(llama_seq_id, llama_pos, llama_pos, int) {`
`573`	`572`	`GGML_ABORT("KVarN does not support position division");`
`574`	`573`	`}`
`575`	`574`