mirror of
https://github.com/ggerganov/whisper.cpp.git
synced 2025-08-09 10:35:51 +02:00
talk-llama : sync llama.cpp
This commit is contained in:
@@ -52,7 +52,7 @@ uint32_t llama_hparams::n_embd_v_gqa(uint32_t il) const {
 uint32_t llama_hparams::n_embd_k_s() const {
     if (wkv_head_size != 0) {
         // for RWKV models
-        return 2 * n_embd;
+        return token_shift_count * n_embd;
     }
 
     // TODO: maybe support other convolution strides than 1
Reference in New Issue
Block a user