mirror of
https://github.com/kvcache-ai/ktransformers.git
synced 2026-05-02 13:41:15 +00:00
add prefix cache support for kvc2.
This commit is contained in:
parent
b154441072
commit
3b4a1c7532
9 changed files with 399 additions and 52 deletions
|
|
@@ -67,6 +67,6 @@ attn:
|
|||
page_size: 256
|
||||
chunk_size: 256
|
||||
kvc2:
|
||||
-gpu_only: true
|
||||
+gpu_only: false
|
||||
utilization_percentage: 1.0
|
||||
cpu_memory_size_GB: 500
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue