| .. |
|
ascend
|
适配npu-models/operators文件夹3
|
2025-09-08 19:42:41 +08:00 |
|
__init__.py
|
Initial commit
|
2024-07-27 16:06:58 +08:00 |
|
configuration_deepseek.py
|
Initial commit
|
2024-07-27 16:06:58 +08:00 |
|
configuration_deepseek_v3.py
|
add balance-serve, support concurrence
|
2025-03-31 22:55:32 +08:00 |
|
configuration_glm4_moe.py
|
support smt and glm4
|
2025-07-24 09:39:19 +00:00 |
|
configuration_llama.py
|
[feature] release 0.1.3
|
2024-08-28 16:11:43 +00:00 |
|
configuration_qwen2_moe.py
|
support qwen3, dont speak human language
|
2025-04-28 08:44:47 +00:00 |
|
configuration_qwen3_moe.py
|
support qwen3, dont speak human language
|
2025-04-28 08:44:47 +00:00 |
|
configuration_smallthinker.py
|
smallthinker right
|
2025-07-25 12:46:14 +00:00 |
|
custom_cache.py
|
fix local chat on npu
|
2025-09-26 09:30:27 +08:00 |
|
custom_modeling_deepseek_v2.py
|
fix-hopper-flashinfer
|
2025-04-29 11:06:34 +08:00 |
|
custom_modeling_deepseek_v3.py
|
fix-hopper-flashinfer
|
2025-04-29 11:06:34 +08:00 |
|
custom_modeling_glm4_moe.py
|
support smt and qlm4
|
2025-07-25 12:48:51 +00:00 |
|
custom_modeling_qwen2_moe.py
|
support safetensor load, delete architectures argument
|
2025-05-09 10:38:29 +00:00 |
|
custom_modeling_qwen3_moe.py
|
support safetensor load, delete architectures argument
|
2025-05-09 10:38:29 +00:00 |
|
custom_modeling_smallthinker.py
|
support smt and glm4
|
2025-07-25 15:03:27 +00:00 |
|
modeling_deepseek.py
|
Enable support for Intel XPU devices, add support for DeepSeek V2/V3 first
|
2025-05-14 19:37:27 +00:00 |
|
modeling_deepseek_v3.py
|
npu enabling for deepseekv3 model and expert.py
|
2025-09-09 15:35:42 +08:00 |
|
modeling_glm4_moe.py
|
support smt and qlm4
|
2025-07-25 12:48:51 +00:00 |
|
modeling_llama.py
|
[feature] release 0.1.3
|
2024-08-28 16:11:43 +00:00 |
|
modeling_mixtral.py
|
[ADD] support multi-gpu qlen>1 q5_k
|
2024-08-12 11:41:26 +00:00 |
|
modeling_qwen2_moe.py
|
Initial commit
|
2024-07-27 16:06:58 +08:00 |
|
modeling_qwen3_moe.py
|
support qwen3, dont speak human language
|
2025-04-28 08:44:47 +00:00 |
|
modeling_smallthinker.py
|
smallthinker right
|
2025-07-25 12:46:14 +00:00 |