mirror of
https://github.com/kvcache-ai/ktransformers.git
synced 2025-09-07 13:09:50 +00:00
commit
1264f9407b
4 changed files with 13 additions and 2 deletions
|
@ -1,4 +1,4 @@
|
||||||
FROM pytorch/pytorch:2.3.1-cuda12.1-cudnn8-devel as compile_server
|
FROM pytorch/pytorch:2.5.1-cuda12.1-cudnn9-devel as compile_server
|
||||||
WORKDIR /workspace
|
WORKDIR /workspace
|
||||||
ENV CUDA_HOME /usr/local/cuda
|
ENV CUDA_HOME /usr/local/cuda
|
||||||
RUN <<EOF
|
RUN <<EOF
|
||||||
|
@ -10,6 +10,7 @@ apt update -y && apt install -y --no-install-recommends \
|
||||||
g++ \
|
g++ \
|
||||||
cmake &&
|
cmake &&
|
||||||
rm -rf /var/lib/apt/lists/* &&
|
rm -rf /var/lib/apt/lists/* &&
|
||||||
|
pip install --upgrade pip &&
|
||||||
pip install ninja pyproject numpy cpufeature &&
|
pip install ninja pyproject numpy cpufeature &&
|
||||||
pip install flash-attn &&
|
pip install flash-attn &&
|
||||||
cp /usr/lib/x86_64-linux-gnu/libstdc++.so.6 /opt/conda/lib/
|
cp /usr/lib/x86_64-linux-gnu/libstdc++.so.6 /opt/conda/lib/
|
||||||
|
|
8
.github/workflows/docker-image.yml
vendored
8
.github/workflows/docker-image.yml
vendored
|
@ -3,6 +3,14 @@ name: DockerHub CI
|
||||||
on:
|
on:
|
||||||
release:
|
release:
|
||||||
types: [published]
|
types: [published]
|
||||||
|
workflow_dispatch:
|
||||||
|
inputs:
|
||||||
|
choose:
|
||||||
|
description: 'Will you push the image to DockerHub? 0 for No, 1 for Yes'
|
||||||
|
required: true
|
||||||
|
default: '0'
|
||||||
|
type: string
|
||||||
|
|
||||||
# push:
|
# push:
|
||||||
# branches:
|
# branches:
|
||||||
# - main
|
# - main
|
||||||
|
|
1
.gitignore
vendored
1
.gitignore
vendored
|
@ -25,3 +25,4 @@ book
|
||||||
ktransformers/tests/chat_txt.txt
|
ktransformers/tests/chat_txt.txt
|
||||||
mmlu_result*
|
mmlu_result*
|
||||||
ktransformers/ktransformers_ext/cuda_musa/
|
ktransformers/ktransformers_ext/cuda_musa/
|
||||||
|
test_prompt.txt
|
||||||
|
|
|
@ -10,7 +10,7 @@ EOF
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
FROM pytorch/pytorch:2.3.1-cuda12.1-cudnn8-devel as compile_server
|
FROM pytorch/pytorch:2.5.1-cuda12.1-cudnn9-devel as compile_server
|
||||||
ARG CPU_INSTRUCT=NATIVE
|
ARG CPU_INSTRUCT=NATIVE
|
||||||
WORKDIR /workspace
|
WORKDIR /workspace
|
||||||
ENV CUDA_HOME /usr/local/cuda
|
ENV CUDA_HOME /usr/local/cuda
|
||||||
|
@ -27,6 +27,7 @@ rm -rf /var/lib/apt/lists/* &&
|
||||||
cd ktransformers &&
|
cd ktransformers &&
|
||||||
git submodule init &&
|
git submodule init &&
|
||||||
git submodule update &&
|
git submodule update &&
|
||||||
|
pip install --upgrade pip &&
|
||||||
pip install ninja pyproject numpy cpufeature &&
|
pip install ninja pyproject numpy cpufeature &&
|
||||||
pip install flash-attn &&
|
pip install flash-attn &&
|
||||||
CPU_INSTRUCT=${CPU_INSTRUCT} KTRANSFORMERS_FORCE_BUILD=TRUE TORCH_CUDA_ARCH_LIST="8.0;8.6;8.7;8.9;9.0+PTX" pip install . --no-build-isolation --verbose &&
|
CPU_INSTRUCT=${CPU_INSTRUCT} KTRANSFORMERS_FORCE_BUILD=TRUE TORCH_CUDA_ARCH_LIST="8.0;8.6;8.7;8.9;9.0+PTX" pip install . --no-build-isolation --verbose &&
|
||||||
|
|
Loading…
Add table
Reference in a new issue