add prefix cache support for kvc2.

This commit is contained in:
ouqingliang 2025-06-26 04:57:25 +00:00
parent b154441072
commit 3b4a1c7532
9 changed files with 399 additions and 52 deletions

View file

@@ -67,6 +67,6 @@ attn:
page_size: 256
chunk_size: 256
kvc2:
-gpu_only: true
+gpu_only: false
utilization_percentage: 1.0
cpu_memory_size_GB: 500