Merge pull request #1303 from rnwang04/fix_typo_and_style

fix typo and code style, and update setup.py ValueError message
2025-09-07 04:59:55 +00:00 · 2025-05-15 10:55:58 +08:00 · 2025-05-15 10:55:58 +08:00 · 09f0ddc00b
commit 09f0ddc00b
parent 07c5f23da5 2f6e14a54b
4 changed files with 5 additions and 5 deletions
--- a/doc/README.md
+++ b/doc/README.md
@ -21,6 +21,7 @@ interface, RESTful APIs compliant with OpenAI and Ollama, and even a simplified
 Our vision for KTransformers is to serve as a flexible platform for experimenting with innovative LLM inference optimizations. Please let us know if you need any other features.

 <h2 id="Updates">🔥 Updates</h2>
+
 * **May 14, 2025**: Support Intel Arc GPU ([Tutorial](./en/xpu.md)).
 * **Apr 9, 2025**: Experimental support for LLaMA 4 models ([Tutorial](./en/llama4.md)).
 * **Apr 2, 2025**: Support Multi-concurrency. ([Tutorial](./en/balance-serve.md)).
--- a/doc/en/xpu.md
+++ b/doc/en/xpu.md
@ -41,7 +41,6 @@ Install PyTorch with XPU backend support and [IPEX-LLM](https://github.com/intel
 pip install --pre --upgrade ipex-llm[xpu_2.6] --extra-index-url https://download.pytorch.org/whl/xpu
 pip uninstall torch torchvision torchaudio
 pip install torch==2.7+xpu torchvision torchaudio --index-url https://download.pytorch.org/whl/test/xpu # install torch2.7
-pip install packaging ninja cpufeature numpy
 pip uninstall intel-opencl-rt dpcpp-cpp-rt
 ```

--- a/ktransformers/models/custom_cache.py
+++ b/ktransformers/models/custom_cache.py
@ -293,7 +293,7 @@ class KGQACache(nn.Module):
        self.v_caches = []
        

-    def load(self, inference_context: "sched_ext.InferenceContext"): 
+    def load(self, inference_context: "sched_ext.InferenceContext"):
        print(self.config.num_hidden_layers)
        for i in range(self.config.num_hidden_layers):
            self.k_caches.append(
--- a/setup.py
+++ b/setup.py
@ -229,7 +229,7 @@ class VersionInfo:
        elif torch.xpu.is_available():
            backend_version = f"xpu"
        else:
-            raise ValueError("Unsupported backend: CUDA_HOME MUSA_HOME ROCM_HOME all not set.")
+            raise ValueError("Unsupported backend: CUDA_HOME MUSA_HOME ROCM_HOME all not set and XPU is not available.")
        package_version = f"{flash_version}+{backend_version}torch{torch_version}{cpu_instruct}"
        if full_version:
            return package_version
@ -501,7 +501,7 @@ class CMakeBuild(BuildExtension):
        elif KTRANSFORMERS_BUILD_XPU:
            cmake_args += ["-DKTRANSFORMERS_USE_XPU=ON", "-DKTRANSFORMERS_USE_CUDA=OFF"]
        else:
-            raise ValueError("Unsupported backend: CUDA_HOME, MUSA_HOME, and ROCM_HOME are not set.")
+            raise ValueError("Unsupported backend: CUDA_HOME, MUSA_HOME, and ROCM_HOME are not set and XPU is not available.")
        
        cmake_args = get_cmake_abi_args(cmake_args)
        # log cmake_args
@ -628,7 +628,7 @@ elif MUSA_HOME is not None:
 elif torch.xpu.is_available(): #XPUExtension is not available now.
    ops_module = None
 else:
-    raise ValueError("Unsupported backend: CUDA_HOME and MUSA_HOME are not set.")
+    raise ValueError("Unsupported backend: CUDA_HOME ROCM_HOME MUSA_HOME are not set and XPU is not available.")

 if not torch.xpu.is_available():
    ext_modules = [