mirror of
https://github.com/LostRuins/koboldcpp.git
synced 2025-09-14 19:09:45 +00:00
memory : handle kv_unified for hybrid models (#15050)
This commit is contained in:
parent
97366dc6ab
commit
11a3811164
3 changed files with 4 additions and 1 deletion
|
@@ -25,6 +25,7 @@ llama_memory_hybrid::llama_memory_hybrid(
|
|||
/* common */
|
||||
uint32_t n_seq_max,
|
||||
bool offload,
|
||||
bool unified,
|
||||
/* layer filters */
|
||||
layer_filter_cb && filter_attn,
|
||||
layer_filter_cb && filter_recr) :
|
||||
|
@@ -38,7 +39,7 @@ llama_memory_hybrid::llama_memory_hybrid(
|
|||
type_v,
|
||||
v_trans,
|
||||
offload,
|
||||
1,
|
||||
unified,
|
||||
kv_size,
|
||||
n_seq_max,
|
||||
n_pad,
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue