mirror of
https://github.com/kvcache-ai/ktransformers.git
synced 2025-09-10 23:34:35 +00:00
fix rope; update moegate
This commit is contained in:
parent
f873558a89
commit
f748cd29f0
5 changed files with 54 additions and 21 deletions
|
@@ -222,7 +222,7 @@ class KLinearMarlin(KLinearBase):
|
|||
x = x.to(self.device)
|
||||
orig_shape = list(x.shape)
|
||||
orig_dtype = x.dtype
|
||||
- x = x.reshape(-1, x.shape[-1])
|
||||
+ x = x.reshape(-1, orig_shape[-1])
|
||||
marlin_s = self.marlin_s.to(x.dtype)
|
||||
x = KTransformersOps.gptq_marlin_gemm(
|
||||
x,
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue