Fix rocm example yaml

This commit is contained in:
Azure-Tang 2025-03-15 22:27:02 -04:00
parent 4a31237346
commit 85c32fdd10

View file

@@ -12,7 +12,7 @@
replace:
class: ktransformers.operators.linear.KTransformersLinear # optimized Kernel on quantized data types
kwargs:
- generate_device: "cuda"
+ generate_device: "cpu"
prefill_device: "cuda"
generate_op: "KLinearCPUInfer"
prefill_op: "KLinearTorch"
@@ -23,7 +23,7 @@
replace:
class: ktransformers.operators.linear.KTransformersLinear # optimized Kernel on quantized data types
kwargs:
- generate_device: "cpu"
+ generate_device: "cuda"
prefill_device: "cuda"
generate_op: "KLinearQ8"
prefill_op: "KLinearTorch"