mirror of
https://github.com/kvcache-ai/ktransformers.git
synced 2025-09-16 18:19:42 +00:00
support smt and glm4
This commit is contained in:
parent
613f0b7c37
commit
590fcb41cd
5 changed files with 95 additions and 7 deletions
|
@ -49,7 +49,7 @@
|
|||
- match:
|
||||
name: "^model\\.layers\\..*\\.mlp\\.experts$"
|
||||
replace:
|
||||
class: ktransformers.operators.experts.KTransformersExpertsV2 # custom MoE Kernel with expert parallelism
|
||||
class: ktransformers.operators.experts.KGlm4Experts # custom MoE Kernel with expert parallelism
|
||||
kwargs:
|
||||
prefill_device: "cuda"
|
||||
prefill_op: None
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue