__init__.py
|
Initial commit
|
2024-07-27 16:06:58 +08:00 |
attention.py
|
fix qlen > 1000 mask is none error
|
2024-09-02 02:58:10 +00:00 |
base_operator.py
|
Initial commit
|
2024-07-27 16:06:58 +08:00 |
cpuinfer.py
|
[feature] release 0.1.3
|
2024-08-28 16:11:43 +00:00 |
dynamic_attention.py
|
[feature] release 0.1.3
|
2024-08-28 16:11:43 +00:00 |
experts.py
|
Fix cannot offload whole layer in cpu
|
2024-08-29 19:10:14 +08:00 |
linear.py
|
Fix cannot offload whole layer in cpu
|
2024-08-29 19:10:14 +08:00 |
models.py
|
Fix cannot offload whole layer in cpu
|
2024-08-29 19:10:14 +08:00 |
RoPE.py
|
[feature] release 0.1.3
|
2024-08-28 16:11:43 +00:00 |