mirror of
https://github.com/kvcache-ai/ktransformers.git
synced 2025-09-12 08:09:42 +00:00
smallthink run
This commit is contained in:
parent
590fcb41cd
commit
71c1d4eed7
7 changed files with 123 additions and 32 deletions
|
@@ -153,7 +153,7 @@ class ArgumentParser:
|
|||
raise ValueError(f"Model {args.model_name} not supported. Please check your model directory or model name.")
|
||||
|
||||
|
||||
if model_config.architectures[0] == "Qwen3MoeForCausalLM" or model_config.architectures[0] == "Qwen2MoeForCausalLM" :
|
||||
if model_config.architectures[0] == "Qwen3MoeForCausalLM" or model_config.architectures[0] == "Qwen2MoeForCausalLM" or model_config.architectures[0] == "SmallthinkerForCausalLM" or model_config.architectures[0] == "Glm4MoeForCausalLM":
|
||||
args.gpu_memory_size = args.cache_lens*2*2*model_config.num_hidden_layers*model_config.num_key_value_heads*model_config.head_dim
|
||||
args.architectures = model_config.architectures[0]
|
||||
else:
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue