mirror of
https://github.com/kvcache-ai/ktransformers.git
synced 2025-09-04 03:29:49 +00:00
change inject yaml
This commit is contained in:
parent
2a224b256e
commit
48dfbc8f9f
1 changed file with 1 addition and 1 deletion
|
@@ -44,7 +44,7 @@
|
|||
- match:
|
||||
name: "^model\\.layers\\..*\\.self_attn$"
|
||||
replace:
|
||||
class: ktransformers.operators.attention.flashinfer_attn # optimized MLA implementation
|
||||
class: ktransformers.operators.balance_serve_attention.flashinfer_attn # optimized MLA implementation
|
||||
kwargs:
|
||||
generate_device: "cuda"
|
||||
prefill_device: "cuda"
|
||||
|
|
Loading…
Add table
Reference in a new issue