This commit is contained in:
TangJingqi 2024-08-15 11:25:12 +08:00
parent 67043b4b5c
commit c47205dce9
6 changed files with 6 additions and 6 deletions

View file

@ -190,7 +190,7 @@
- match: - match:
name: "^model$" name: "^model$"
replace: replace:
class: "ktransformers.operators.layer_wise_prefill.KDeepseekV2Model" class: "ktransformers.operators.models.KDeepseekV2Model"
kwargs: kwargs:
per_layer_prefill_intput_threshold: 0 # 0 is close layer wise prefill per_layer_prefill_intput_threshold: 0 # 0 is close layer wise prefill
transfer_map: transfer_map:

View file

@ -103,7 +103,7 @@
- match: - match:
name: "^model$" name: "^model$"
replace: replace:
class: "ktransformers.operators.layer_wise_prefill.KDeepseekV2Model" class: "ktransformers.operators.models.KDeepseekV2Model"
kwargs: kwargs:
per_layer_prefill_intput_threshold: 0 # 0 is close layer wise prefill per_layer_prefill_intput_threshold: 0 # 0 is close layer wise prefill
transfer_map: transfer_map:

View file

@ -55,7 +55,7 @@
- match: - match:
name: "^model$" name: "^model$"
replace: replace:
class: "ktransformers.operators.layer_wise_prefill.KDeepseekV2Model" class: "ktransformers.operators.models.KDeepseekV2Model"
kwargs: kwargs:
generate_device: "cuda" generate_device: "cuda"
prefill_device: "cuda" prefill_device: "cuda"

View file

@ -103,7 +103,7 @@
- match: - match:
name: "^model$" name: "^model$"
replace: replace:
class: "ktransformers.operators.layer_wise_prefill.KDeepseekV2Model" class: "ktransformers.operators.models.KDeepseekV2Model"
kwargs: kwargs:
per_layer_prefill_intput_threshold: 0 # 0 is close layer wise prefill per_layer_prefill_intput_threshold: 0 # 0 is close layer wise prefill
transfer_map: transfer_map:

View file

@ -89,7 +89,7 @@
- match: - match:
name: "^model$" name: "^model$"
replace: replace:
class: "ktransformers.operators.layer_wise_prefill.KQwen2MoeModel" class: "ktransformers.operators.models.KQwen2MoeModel"
kwargs: kwargs:
per_layer_prefill_intput_threshold: 0 # 0 is close layer wise prefill per_layer_prefill_intput_threshold: 0 # 0 is close layer wise prefill
transfer_map: transfer_map:

View file

@ -38,7 +38,7 @@
- match: - match:
name: "^model$" name: "^model$"
replace: replace:
class: "ktransformers.operators.layer_wise_prefill.KQwen2MoeModel" class: "ktransformers.operators.models.KQwen2MoeModel"
kwargs: kwargs:
per_layer_prefill_intput_threshold: 0 # 0 is close layer wise prefill per_layer_prefill_intput_threshold: 0 # 0 is close layer wise prefill
- match: - match: