talk-llama : sync llama.cpp

ggml-ci
Georgi Gerganov
2025-06-20 21:18:44 +03:00
parent d65a579a0a
commit e6c10cf3d5
28 changed files with 2521 additions and 1738 deletions

examples/talk-llama/llama-kv-cache-unified-iswa.h

@@ -32,7 +32,7 @@ public:
     //
 
     llama_memory_state_ptr init_batch(
-            const llama_batch & batch,
+            llama_batch_allocr & balloc,
             uint32_t n_ubatch,
             bool embd_all) override;
@@ -90,7 +90,6 @@ public:
     // used to create a state from a batch
     llama_kv_cache_unified_iswa_state(
             llama_kv_cache_unified_iswa * kv,
-            llama_sbatch sbatch,
             std::vector<uint32_t> heads_base,
             std::vector<uint32_t> heads_swa,
             std::vector<llama_ubatch> ubatches);
@@ -104,8 +103,6 @@ public:
     bool next() override;
     bool apply() override;
 
-    std::vector<int64_t> & out_ids() override;
-
     llama_memory_status get_status() const override;
     const llama_ubatch & get_ubatch() const override;
@@ -117,17 +114,15 @@ public:
     const llama_kv_cache_unified_state * get_swa() const;
 
 private:
-    llama_memory_status status;
-
     //llama_kv_cache_unified_iswa * kv;
 
-    llama_sbatch sbatch;
-
     // the index of the next ubatch to process
     size_t i_next = 0;
 
     std::vector<llama_ubatch> ubatches;
 
-    llama_memory_state_ptr state_base;
-    llama_memory_state_ptr state_swa;
+    const llama_memory_state_ptr state_base;
+    const llama_memory_state_ptr state_swa;
+
+    const llama_memory_status status;
 };
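
For readers following the sync: taken together, these hunks drop the internal llama_sbatch member and make the sub-states and status const members set once at construction, so the state object becomes an immutable iterator over ubatches that were split before it was built. Below is a minimal self-contained C++ sketch of that ownership pattern; all names (MemoryState, SubState, Ubatch) are hypothetical stand-ins for illustration, not the actual llama.cpp API.

// Minimal sketch (hypothetical names) of the ownership pattern after this
// change: ubatches are split up front by the caller (conceptually the new
// llama_batch_allocr) and the state object only iterates over the result,
// holding its sub-states as const members instead of a mutable splitter.
#include <cstdio>
#include <memory>
#include <vector>

struct Ubatch   { int n_tokens; };
struct SubState { /* per-cache (base / SWA) bookkeeping */ };

class MemoryState {
public:
    MemoryState(std::vector<Ubatch> ubs,
                std::unique_ptr<SubState> base,
                std::unique_ptr<SubState> swa)
        : ubatches(std::move(ubs)),
          state_base(std::move(base)),  // fixed at construction, mirroring
          state_swa (std::move(swa)) {} // the new const members in the hunk

    bool next() { return ++i_next < ubatches.size(); }
    const Ubatch & get_ubatch() const { return ubatches[i_next]; }

private:
    size_t i_next = 0; // index of the next ubatch to process
    std::vector<Ubatch> ubatches;
    const std::unique_ptr<SubState> state_base;
    const std::unique_ptr<SubState> state_swa;
};

int main() {
    // the caller performs the batch -> ubatch split...
    std::vector<Ubatch> ubs = { {32}, {32}, {16} };
    // ...and hands the pieces to the state, which just walks them
    MemoryState st(std::move(ubs),
                   std::make_unique<SubState>(),
                   std::make_unique<SubState>());
    do {
        std::printf("ubatch of %d tokens\n", st.get_ubatch().n_tokens);
    } while (st.next());
    return 0;
}

The same reading fits the first hunk: init_batch now receives llama_batch_allocr & balloc instead of const llama_batch &, which suggests the batch-splitting logic moved out of the individual memory states into a shared allocator owned by the caller.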