[fix] bugs about Qwen57B, install requirement, Dockerfile

This commit is contained in:
chenxl 2024-08-30 03:24:26 +00:00
parent c80490a95e
commit 49cce0c437
3 changed files with 3 additions and 8 deletions

View file

@@ -1,10 +1,3 @@
# Rule: select modules by name and replace them with the "default" class.
# NOTE(review): the nesting below was reconstructed from flattened text;
# confirm it against the original rule file.
- match:
    # Regex on the module name: starts with "model.layers.", followed by
    # any characters and then a literal dot. Double quotes are required so
    # that each "\\" is read as a single backslash.
    name: "^model\\.layers\\..*\\."
  replace:
    class: "default"
    kwargs:
      # Both device settings are "cuda" for modules matched by this rule.
      generate_device: "cuda"
      prefill_device: "cuda"
- match:
class: ktransformers.models.modeling_qwen2_moe.Qwen2MoeRotaryEmbedding
replace: