From 49cce0c4373db3f5bc0b7748269eb6ac03576e18 Mon Sep 17 00:00:00 2001 From: chenxl Date: Fri, 30 Aug 2024 03:24:26 +0000 Subject: [PATCH] [fix] bugs about Qwen57B, install requirement, Dockerfile --- Dockerfile | 3 ++- .../optimize/optimize_rules/Qwen2-57B-A14B-Instruct.yaml | 7 ------- pyproject.toml | 1 + 3 files changed, 3 insertions(+), 8 deletions(-) diff --git a/Dockerfile b/Dockerfile index 707c1a8..d56a607 100644 --- a/Dockerfile +++ b/Dockerfile @@ -12,6 +12,7 @@ EOF FROM pytorch/pytorch:2.3.1-cuda12.1-cudnn8-devel as compile_server WORKDIR /workspace +ENV CUDA_HOME /usr/local/cuda COPY --from=web_compile /home/ktransformers /workspace/ktransformers RUN <= 2.3.0", "transformers == 4.43.2", "fastapi >= 0.111.0", + "uvicorn >= 0.30.1", "langchain >= 0.2.0", "blessed >= 1.20.0", "accelerate >= 0.31.0",