mirror of
https://github.com/kvcache-ai/ktransformers.git
synced 2025-09-10 15:29:39 +00:00
[fix] f16 dequantize ignored the device argument (returned the CPU tensor instead of the copy on the target device)
This commit is contained in:
parent
cbc47d0b68
commit
29f4151ebc
1 changed file with 1 addition and 1 deletion
|
@@ -681,7 +681,7 @@ def dequantize_f16_gpu(data, device):
|
||||||
res = torch.from_numpy(data)
|
res = torch.from_numpy(data)
|
||||||
res_gpu = torch.empty_like(res, device=device)
|
res_gpu = torch.empty_like(res, device=device)
|
||||||
res_gpu.copy_(res)
|
res_gpu.copy_(res)
|
||||||
return res
|
return res_gpu
|
||||||
|
|
||||||
GGML_DEQUANTIZE = {
|
GGML_DEQUANTIZE = {
|
||||||
"F32": dequantize_f32,
|
"F32": dequantize_f32,
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue