mirror of
https://github.com/kvcache-ai/ktransformers.git
synced 2025-09-08 05:29:29 +00:00
⚡ update git ignore add docker dev container
This commit is contained in:
parent
5474be5299
commit
0ca0b99fab
4 changed files with 57 additions and 8 deletions
19
.devcontainer/Dockerfile
Normal file
19
.devcontainer/Dockerfile
Normal file
|
@ -0,0 +1,19 @@
|
||||||
|
# syntax=docker/dockerfile:1
# Development image for the ktransformers dev container.
# Provides the CUDA/PyTorch toolchain plus the native and Python build
# dependencies; the project sources themselves are NOT baked into the image.
FROM pytorch/pytorch:2.3.1-cuda12.1-cudnn8-devel AS compile_server

WORKDIR /workspace

# Location of the CUDA toolkit inside the base image.
ENV CUDA_HOME=/usr/local/cuda

# Install the compiler toolchain and Python build helpers in a single layer.
# `set -eux` makes every line of the heredoc fail the build on error, so the
# commands do not need to be chained with `&&`.
#
# There is deliberately no `cd ktransformers` here: nothing is copied or
# cloned into the image, and the workspace is only bind-mounted at
# /workspace when the container starts, so that directory does not exist at
# build time and the `cd` would abort the build.
RUN <<EOF
set -eux
apt-get update -y
apt-get install -y --no-install-recommends \
    cmake \
    g++ \
    gcc \
    git \
    vim \
    wget
# Drop the apt package index in the same layer to keep the image small.
rm -rf /var/lib/apt/lists/*
pip install --no-cache-dir ninja pyproject numpy cpufeature
pip install --no-cache-dir flash-attn
# Overwrite conda's libstdc++ with the system copy.
# NOTE(review): presumably so extensions built with the system g++ resolve
# their GLIBCXX symbols under conda's Python - confirm.
cp /usr/lib/x86_64-linux-gnu/libstdc++.so.6 /opt/conda/lib/
EOF

# Set the default shell to bash
CMD ["/bin/bash"]
|
34
.devcontainer/devcontainer.json
Normal file
34
.devcontainer/devcontainer.json
Normal file
|
@ -0,0 +1,34 @@
|
||||||
|
// Dev container definition for ktransformers: builds .devcontainer/Dockerfile
// and bind-mounts the local checkout at /workspace.
{
    "name": "Ktrans Dev Container",
    // NOTE(review): privileged mode grants the container extended access to
    // the host; confirm it is really needed in addition to `--gpus all`.
    "privileged": true,
    "build": {
        "dockerfile": "Dockerfile",
        // Build context is the repository root (parent of .devcontainer).
        "context": "..",
        // Forward the host's proxy settings to the image build.
        "args": {
            "http_proxy": "${env:http_proxy}",
            "https_proxy": "${env:https_proxy}"
        }
    },
    "runArgs": [
        "--network=host",
        // The flag and its value are passed as two separate arguments.
        "--gpus",
        "all"
    ],
    "workspaceFolder": "/workspace",
    "workspaceMount": "source=${localWorkspaceFolder},target=/workspace,type=bind,consistency=cached",
    // Extra host directory exposed inside the container. The source path
    // /mnt/data is host-specific and must exist for the bind mount to work.
    "mounts": [
        "source=/mnt/data,target=/mnt/incontainer,type=bind,consistency=cached"
    ],
    "customizations": {
        "vscode": {
            "extensions": [],
            "settings": {
                // Replaces the deprecated "terminal.integrated.shell.linux"
                // setting; "bash" is a built-in terminal profile name.
                "terminal.integrated.defaultProfile.linux": "bash",
                "cmake.configureOnOpen": true,
                "cmake.generator": "Ninja"
            }
        }
    }
}
|
8
.gitignore
vendored
8
.gitignore
vendored
|
@ -19,13 +19,9 @@ ktransformers/server/local_store/
|
||||||
ktransformers/server_test1.db
|
ktransformers/server_test1.db
|
||||||
*.patch
|
*.patch
|
||||||
img/
|
img/
|
||||||
tmp1.txt
|
tmp*.txt
|
||||||
test_65_300_1536.txt
|
|
||||||
test.txt
|
test.txt
|
||||||
book
|
book
|
||||||
ktransformers/tests/mmlu_result_silicon.json
|
|
||||||
ktransformers/tests/chat_txt.txt
|
ktransformers/tests/chat_txt.txt
|
||||||
mmlu_result_q4km.json
|
mmlu_result*
|
||||||
mmlu_result_q4km.log
|
|
||||||
ktransformers/tests/mmlu_result_silicon.log
|
|
||||||
ktransformers/ktransformers_ext/cuda_musa/
|
ktransformers/ktransformers_ext/cuda_musa/
|
||||||
|
|
|
@ -173,8 +173,8 @@ if __name__ == "__main__":
|
||||||
parser = argparse.ArgumentParser(description="API Generate Tester")
|
parser = argparse.ArgumentParser(description="API Generate Tester")
|
||||||
parser.add_argument("--concurrent", type=int, default=1000, help="Number of concurrent evaluations")
|
parser.add_argument("--concurrent", type=int, default=1000, help="Number of concurrent evaluations")
|
||||||
parser.add_argument("--file", type=str, default="TIGER-Lab/MMLU-Pro", help="Path to the mmlu.jsonl file")
|
parser.add_argument("--file", type=str, default="TIGER-Lab/MMLU-Pro", help="Path to the mmlu.jsonl file")
|
||||||
parser.add_argument("--result", type=str, default="./mmlu_pro.json", help="Path to save the result JSON file")
|
parser.add_argument("--result", type=str, default="./mmlu_result_pro.json", help="Path to save the result JSON file")
|
||||||
parser.add_argument("--log", type=str, default="./mmlu_pro.log", help="Path to save the log file")
|
parser.add_argument("--log", type=str, default="./mmlu_result_pro.log", help="Path to save the log file")
|
||||||
parser.add_argument("--model", type=str, default="Pro/deepseek-ai/DeepSeek-V3", help="Model name or path")
|
parser.add_argument("--model", type=str, default="Pro/deepseek-ai/DeepSeek-V3", help="Model name or path")
|
||||||
parser.add_argument("--api_url", type=str, default="http://localhost:15488/v1/chat/completions", help="API URL")
|
parser.add_argument("--api_url", type=str, default="http://localhost:15488/v1/chat/completions", help="API URL")
|
||||||
# parser.add_argument("--api_url", type=str, default="https://api.siliconflow.cn/v1/chat/completions", help="API URL")
|
# parser.add_argument("--api_url", type=str, default="https://api.siliconflow.cn/v1/chat/completions", help="API URL")
|
||||||
|
|
Loading…
Add table
Reference in a new issue