Raise exception on device error (#1342)

* Display the unavailable torch device on error

* Raise exception on device error

---------

Signed-off-by: Emmanuel Ferdman <emmanuelferdman@gmail.com>
Emmanuel Ferdman 2025-05-29 10:37:41 +03:00 committed by GitHub
parent ce75fcd7dd
commit d8bc6402b5

@@ -243,7 +243,7 @@ def prefill_and_generate(model, tokenizer, inputs, max_new_tokens=10000, use_cud
     elif torch.xpu.is_available():
         torch.xpu.set_device(torch_device)
     else:
-        RuntimeError("The device: {torch_device} is not available")
+        raise RuntimeError(f"The device: {torch_device} is not available")
     inputs_embeds = model.model.embed_tokens(cur_token.to("cpu")).to(torch_device)
     # with torch.cuda.stream(custom_stream):
     logits=model(inputs_embeds=inputs_embeds,
@@ -284,7 +284,7 @@ def prefill_and_generate(model, tokenizer, inputs, max_new_tokens=10000, use_cud
     elif torch.xpu.is_available():
         torch.xpu.set_device(torch_device)
     else:
-        RuntimeError("The device: {torch_device} is not available")
+        raise RuntimeError(f"The device: {torch_device} is not available")
     with torch.no_grad():
         stream = TextStreamer(tokenizer)