talk-llama : sync llama.cpp

ggml-ci
2025-08-09 20:38:53 +02:00 · 2025-06-18 10:22:47 +03:00
parent 69061e356f
commit 2f60ebc3c2
26 changed files with 1454 additions and 504 deletions
--- a/examples/talk-llama/llama-cparams.h
+++ b/examples/talk-llama/llama-cparams.h
@@ -4,7 +4,7 @@

 #include <cstdint>

-#define LLAMA_MAX_PARALLEL_SEQUENCES 64
+#define LLAMA_MAX_SEQ 64

 struct llama_cparams {
    uint32_t n_ctx;           // context size used during inference