__init__.py
|
Initial commit
|
2024-07-27 16:06:58 +08:00 |
attention.py
|
rollback-triton-prefill
|
2025-03-15 14:21:21 +00:00 |
dynamic_attention.py
|
merge main; Add torch q8 linear
|
2025-03-14 05:52:07 -04:00 |
experts.py
|
fix-singleton
|
2025-03-14 04:16:53 +00:00 |
flashinfer_wrapper.py
|
fix flashinfer precision
|
2025-03-07 14:07:00 +00:00 |
gate.py
|
Update gate.py
|
2025-03-19 12:16:48 +08:00 |
linear.py
|
Merge pull request #178 from fxzjshm/hip
|
2025-03-15 02:31:07 +08:00 |
models.py
|
merge main; Add torch q8 linear
|
2025-03-14 05:52:07 -04:00 |
triton_attention.py
|
merge main; Add torch q8 linear
|
2025-03-14 05:52:07 -04:00 |
triton_attention_prefill.py
|
merge main; Add torch q8 linear
|
2025-03-14 05:52:07 -04:00 |