From 171578a7ec4f3cf8f4fa89389ad667bd86b61372 Mon Sep 17 00:00:00 2001 From: Peilin Li Date: Mon, 17 Nov 2025 11:48:42 +0800 Subject: [PATCH] [refactor]: Change named 'KT-SFT' to 'kt-sft' (#1626) * Change named 'KT-SFT' to 'kt-sft' * [docs]: update kt-sft name --------- Co-authored-by: ZiWei Yuan --- README.md | 12 ++++++------ README_ZH.md | 12 ++++++------ archive/README.md | 10 +++++----- archive/README_ZH.md | 10 +++++----- doc/SUMMARY.md | 6 +++--- doc/en/SFT/README.md | 2 +- {KT-SFT => kt-sft}/.flake8 | 0 {KT-SFT => kt-sft}/.gitignore | 0 {KT-SFT => kt-sft}/.gitmodules | 0 {KT-SFT => kt-sft}/.pylintrc | 0 {KT-SFT => kt-sft}/Dockerfile | 0 {KT-SFT => kt-sft}/Dockerfile.xpu | 0 {KT-SFT => kt-sft}/LICENSE | 0 {KT-SFT => kt-sft}/MANIFEST.in | 0 {KT-SFT => kt-sft}/Makefile | 0 {KT-SFT => kt-sft}/README.md | 0 {KT-SFT => kt-sft}/SECURITY.md | 0 {KT-SFT => kt-sft}/WeChatGroup.png | Bin {KT-SFT => kt-sft}/autosetup.sh | 0 {KT-SFT => kt-sft}/book.toml | 0 {KT-SFT => kt-sft}/csrc/custom_marlin/__init__.py | 0 {KT-SFT => kt-sft}/csrc/custom_marlin/binding.cpp | 0 .../csrc/custom_marlin/gptq_marlin/gptq_marlin.cu | 0 .../csrc/custom_marlin/gptq_marlin/gptq_marlin.cuh | 0 .../gptq_marlin/gptq_marlin_dtypes.cuh | 0 .../custom_marlin/gptq_marlin/gptq_marlin_repack.cu | 0 .../csrc/custom_marlin/gptq_marlin/ops.h | 0 {KT-SFT => kt-sft}/csrc/custom_marlin/setup.py | 0 .../csrc/custom_marlin/test_cuda_graph.py | 0 .../csrc/custom_marlin/utils/__init__.py | 0 .../csrc/custom_marlin/utils/format24.py | 0 .../csrc/custom_marlin/utils/marlin_24_perms.py | 0 .../csrc/custom_marlin/utils/marlin_perms.py | 0 .../csrc/custom_marlin/utils/marlin_utils.py | 0 .../csrc/custom_marlin/utils/quant_utils.py | 0 .../csrc/ktransformers_ext/CMakeLists.txt | 0 .../csrc/ktransformers_ext/bench/bench_attention.py | 0 .../bench/bench_attention_torch.py | 0 .../csrc/ktransformers_ext/bench/bench_linear.py | 0 .../ktransformers_ext/bench/bench_linear_torch.py | 0 .../csrc/ktransformers_ext/bench/bench_mlp.py | 0 .../csrc/ktransformers_ext/bench/bench_mlp_torch.py | 0 .../csrc/ktransformers_ext/bench/bench_moe.py | 0 .../csrc/ktransformers_ext/bench/bench_moe_amx.py | 0 .../csrc/ktransformers_ext/bench/bench_moe_torch.py | 0 .../csrc/ktransformers_ext/cmake/FindSIMD.cmake | 0 .../csrc/ktransformers_ext/cpu_backend/backend.cpp | 0 .../csrc/ktransformers_ext/cpu_backend/backend.h | 0 .../csrc/ktransformers_ext/cpu_backend/cpuinfer.h | 0 .../cpu_backend/shared_mem_buffer.cpp | 0 .../cpu_backend/shared_mem_buffer.h | 0 .../ktransformers_ext/cpu_backend/task_queue.cpp | 0 .../csrc/ktransformers_ext/cpu_backend/task_queue.h | 0 .../ktransformers_ext/cpu_backend/vendors/README.md | 0 .../ktransformers_ext/cpu_backend/vendors/cuda.h | 0 .../ktransformers_ext/cpu_backend/vendors/hip.h | 0 .../ktransformers_ext/cpu_backend/vendors/musa.h | 0 .../ktransformers_ext/cpu_backend/vendors/vendor.h | 0 .../csrc/ktransformers_ext/cuda/binding.cpp | 0 .../ktransformers_ext/cuda/custom_gguf/dequant.cu | 0 .../csrc/ktransformers_ext/cuda/custom_gguf/ops.h | 0 .../cuda/gptq_marlin/gptq_marlin.cu | 0 .../cuda/gptq_marlin/gptq_marlin.cuh | 0 .../cuda/gptq_marlin/gptq_marlin_dtypes.cuh | 0 .../csrc/ktransformers_ext/cuda/gptq_marlin/ops.h | 0 .../csrc/ktransformers_ext/cuda/setup.py | 0 .../csrc/ktransformers_ext/cuda/test_dequant.py | 0 .../ktransformers_ext/examples/test_attention.py | 0 .../csrc/ktransformers_ext/examples/test_linear.py | 0 .../csrc/ktransformers_ext/examples/test_mlp.py | 0 .../csrc/ktransformers_ext/examples/test_moe.py | 0 .../ktransformers_ext/examples/test_sft_amx_moe.py | 10 +++++----- .../csrc/ktransformers_ext/examples/test_sft_moe.py | 0 .../csrc/ktransformers_ext/ext_bindings.cpp | 0 .../operators/amx/debug_sft_moe.hpp | 0 .../operators/amx/debug_tools_sft_moe.hpp | 0 .../csrc/ktransformers_ext/operators/amx/la/amx.hpp | 0 .../ktransformers_ext/operators/amx/la/utils.hpp | 0 .../csrc/ktransformers_ext/operators/amx/moe.hpp | 0 .../ktransformers_ext/operators/amx/sft_moe.hpp | 0 .../ktransformers_ext/operators/kvcache/kvcache.h | 0 .../operators/kvcache/kvcache_attn.cpp | 0 .../operators/kvcache/kvcache_load_dump.cpp | 0 .../operators/kvcache/kvcache_read_write.cpp | 0 .../operators/kvcache/kvcache_utils.cpp | 0 .../operators/llamafile/conversion.h | 0 .../operators/llamafile/linear.cpp | 0 .../ktransformers_ext/operators/llamafile/linear.h | 0 .../ktransformers_ext/operators/llamafile/mlp.cpp | 0 .../ktransformers_ext/operators/llamafile/mlp.h | 0 .../ktransformers_ext/operators/llamafile/moe.cpp | 0 .../ktransformers_ext/operators/llamafile/moe.h | 0 .../operators/llamafile/sft_moe.cpp | 0 .../ktransformers_ext/operators/llamafile/sft_moe.h | 0 .../operators/llamafile/sft_moe_forward_cache.h | 0 .../csrc/ktransformers_ext/vendors/cuda.h | 0 .../csrc/ktransformers_ext/vendors/hip.h | 0 .../csrc/ktransformers_ext/vendors/musa.h | 0 .../csrc/ktransformers_ext/vendors/vendor.h | 0 {KT-SFT => kt-sft}/install-with-cache.sh | 0 {KT-SFT => kt-sft}/install.bat | 0 {KT-SFT => kt-sft}/install.sh | 0 {KT-SFT => kt-sft}/ktransformers/__init__.py | 0 .../ktransformers/configs/config.yaml | 0 .../ktransformers/configs/log_config.ini | 0 .../ktransformers/configs/model_config/config.json | 0 .../configs/model_config/configuration_deepseek.py | 0 .../custom_marlin/quantize/utils/__init__.py | 0 .../custom_marlin/quantize/utils/format_24.py | 0 .../custom_marlin/quantize/utils/marlin_24_perms.py | 0 .../custom_marlin/quantize/utils/marlin_perms.py | 0 .../custom_marlin/quantize/utils/marlin_utils.py | 0 .../custom_marlin/quantize/utils/quant_utils.py | 0 .../ktransformers_ext/triton/fp8gemm.py | 0 {KT-SFT => kt-sft}/ktransformers/local_chat.py | 0 {KT-SFT => kt-sft}/ktransformers/local_chat.sh | 0 .../ktransformers/lora_test_module.py | 0 {KT-SFT => kt-sft}/ktransformers/models/__init__.py | 0 .../ktransformers/models/configuration_deepseek.py | 0 .../models/configuration_deepseek_v3.py | 0 .../ktransformers/models/configuration_llama.py | 0 .../ktransformers/models/configuration_qwen2_moe.py | 0 .../ktransformers/models/configuration_qwen3_moe.py | 0 .../ktransformers/models/custom_cache.py | 0 .../models/custom_modeling_deepseek_v2.py | 0 .../models/custom_modeling_deepseek_v3.py | 0 .../models/custom_modeling_qwen2_moe.py | 0 .../models/custom_modeling_qwen3_moe.py | 0 .../ktransformers/models/modeling_deepseek.py | 0 .../ktransformers/models/modeling_deepseek_v3.py | 0 .../ktransformers/models/modeling_llama.py | 0 .../ktransformers/models/modeling_mixtral.py | 0 .../ktransformers/models/modeling_qwen2_moe.py | 0 .../ktransformers/models/modeling_qwen3_moe.py | 0 {KT-SFT => kt-sft}/ktransformers/moe_test_module.py | 0 .../ktransformers/moe_test_module_old.py | 0 {KT-SFT => kt-sft}/ktransformers/operators/RoPE.py | 0 .../ktransformers/operators/__init__.py | 0 .../ktransformers/operators/attention.py | 0 .../operators/balance_serve_attention.py | 0 .../ktransformers/operators/base_operator.py | 0 .../ktransformers/operators/cpuinfer.py | 0 .../ktransformers/operators/dynamic_attention.py | 0 .../ktransformers/operators/experts.py | 0 .../operators/flashinfer_batch_prefill_wrapper.py | 0 .../ktransformers/operators/flashinfer_wrapper.py | 0 {KT-SFT => kt-sft}/ktransformers/operators/gate.py | 0 .../ktransformers/operators/layernorm.py | 0 .../ktransformers/operators/linear.py | 0 {KT-SFT => kt-sft}/ktransformers/operators/mlp.py | 0 .../ktransformers/operators/models.py | 0 .../ktransformers/operators/triton_attention.py | 0 .../operators/triton_attention_prefill.py | 0 .../ktransformers/optimize/optimize.py | 0 .../DeepSeek-V2-Chat-multi-gpu-4.yaml | 0 .../optimize_rules/DeepSeek-V2-Chat-multi-gpu.yaml | 0 .../optimize_rules/DeepSeek-V2-Chat-sft-amx.yaml | 0 .../optimize/optimize_rules/DeepSeek-V2-Chat.yaml | 0 .../DeepSeek-V2-Lite-Chat-multi-gpu.yaml | 0 .../DeepSeek-V2-Lite-Chat-sft-amx-multi-gpu.yaml | 0 .../DeepSeek-V2-Lite-Chat-sft-amx.yaml | 0 .../optimize_rules/DeepSeek-V2-Lite-Chat-sft.yaml | 0 .../DeepSeek-V2-Lite-Chat-use-adapter.yaml | 0 .../optimize_rules/DeepSeek-V2-Lite-Chat.yaml | 0 .../optimize_rules/DeepSeek-V3-Chat-amx.yaml | 0 ...k-V3-Chat-fp8-linear-ggml-experts-serve-amx.yaml | 0 ...pSeek-V3-Chat-fp8-linear-ggml-experts-serve.yaml | 0 .../DeepSeek-V3-Chat-fp8-linear-ggml-experts.yaml | 0 .../DeepSeek-V3-Chat-multi-gpu-4.yaml | 0 .../DeepSeek-V3-Chat-multi-gpu-8.yaml | 0 ...k-V3-Chat-multi-gpu-fp8-linear-ggml-experts.yaml | 0 .../DeepSeek-V3-Chat-multi-gpu-marlin.yaml | 0 .../optimize_rules/DeepSeek-V3-Chat-multi-gpu.yaml | 0 .../optimize_rules/DeepSeek-V3-Chat-serve.yaml | 0 .../DeepSeek-V3-Chat-sft-amx-multi-gpu-4.yaml | 0 .../DeepSeek-V3-Chat-sft-amx-multi-gpu.yaml | 0 .../optimize_rules/DeepSeek-V3-Chat-sft-amx.yaml | 0 .../optimize/optimize_rules/DeepSeek-V3-Chat.yaml | 0 .../optimize_rules/Internlm2_5-7b-Chat-1m.yaml | 0 .../optimize/optimize_rules/Mixtral.yaml | 0 .../optimize_rules/Moonlight-16B-A3B-serve.yaml | 0 .../optimize/optimize_rules/Moonlight-16B-A3B.yaml | 0 .../Qwen2-57B-A14B-Instruct-multi-gpu.yaml | 0 .../optimize_rules/Qwen2-57B-A14B-Instruct.yaml | 0 .../optimize/optimize_rules/Qwen2-serve-amx.yaml | 0 .../optimize/optimize_rules/Qwen2-serve.yaml | 0 .../optimize/optimize_rules/Qwen3Moe-serve-amx.yaml | 0 .../optimize/optimize_rules/Qwen3Moe-serve.yaml | 0 .../optimize/optimize_rules/Qwen3Moe-sft-amx.yaml | 0 .../optimize_rules/rocm/DeepSeek-V3-Chat.yaml | 0 .../optimize_rules/xpu/DeepSeek-V2-Chat.yaml | 0 .../optimize_rules/xpu/DeepSeek-V3-Chat.yaml | 0 .../optimize/optimize_rules/xpu/Qwen3Moe-Chat.yaml | 0 {KT-SFT => kt-sft}/ktransformers/server/__init__.py | 0 .../ktransformers/server/api/__init__.py | 0 .../ktransformers/server/api/ollama/__init__.py | 0 .../ktransformers/server/api/ollama/completions.py | 0 .../ktransformers/server/api/openai/__init__.py | 0 .../server/api/openai/assistants/__init__.py | 0 .../server/api/openai/assistants/assistants.py | 0 .../server/api/openai/assistants/messages.py | 0 .../server/api/openai/assistants/runs.py | 0 .../server/api/openai/assistants/threads.py | 0 .../server/api/openai/endpoints/__init__.py | 0 .../server/api/openai/endpoints/chat.py | 0 .../server/api/openai/legacy/__init__.py | 0 .../server/api/openai/legacy/completions.py | 0 .../ktransformers/server/api/web/__init__.py | 0 .../ktransformers/server/api/web/system.py | 0 {KT-SFT => kt-sft}/ktransformers/server/args.py | 0 .../ktransformers/server/backend/__init__.py | 0 .../ktransformers/server/backend/args.py | 0 .../ktransformers/server/backend/base.py | 0 .../ktransformers/server/backend/context_manager.py | 0 .../server/backend/interfaces/__init__.py | 0 .../server/backend/interfaces/balance_serve.py | 0 .../server/backend/interfaces/exllamav2.py | 0 .../server/backend/interfaces/ktransformers.py | 0 .../server/backend/interfaces/transformers.py | 0 .../server/balance_serve/inference/__init__.py | 0 .../server/balance_serve/inference/config.py | 0 .../balance_serve/inference/distributed/__init__.py | 0 .../inference/distributed/communication_op.py | 0 .../inference/distributed/cuda_wrapper.py | 0 .../inference/distributed/custom_all_reduce.py | 0 .../distributed/custom_all_reduce_utils.py | 0 .../inference/distributed/parallel_state.py | 0 .../balance_serve/inference/distributed/pynccl.py | 0 .../inference/distributed/pynccl_wrapper.py | 0 .../balance_serve/inference/distributed/utils.py | 0 .../server/balance_serve/inference/forward_batch.py | 0 .../server/balance_serve/inference/model_runner.py | 0 .../server/balance_serve/inference/query_manager.py | 0 .../inference/sampling/penaltylib/__init__.py | 0 .../inference/sampling/penaltylib/orchestrator.py | 0 .../penaltylib/penalizers/frequency_penalty.py | 0 .../penaltylib/penalizers/min_new_tokens.py | 0 .../penaltylib/penalizers/presence_penalty.py | 0 .../penaltylib/penalizers/repetition_penalty.py | 0 .../balance_serve/inference/sampling/sampler.py | 0 .../ktransformers/server/balance_serve/sched_rpc.py | 0 .../ktransformers/server/balance_serve/settings.py | 0 .../ktransformers/server/config/config.py | 0 .../ktransformers/server/config/log.py | 0 .../ktransformers/server/config/singleton.py | 0 .../ktransformers/server/crud/__init__.py | 0 .../server/crud/assistants/__init__.py | 0 .../server/crud/assistants/assistants.py | 0 .../server/crud/assistants/messages.py | 0 .../ktransformers/server/crud/assistants/runs.py | 0 .../ktransformers/server/crud/assistants/threads.py | 0 .../ktransformers/server/exceptions.py | 0 {KT-SFT => kt-sft}/ktransformers/server/main.py | 0 .../ktransformers/server/models/__init__.py | 0 .../server/models/assistants/__init__.py | 0 .../server/models/assistants/assistants.py | 0 .../server/models/assistants/messages.py | 0 .../server/models/assistants/run_steps.py | 0 .../ktransformers/server/models/assistants/runs.py | 0 .../server/models/assistants/threads.py | 0 .../ktransformers/server/schemas/__init__.py | 0 .../server/schemas/assistants/__init__.py | 0 .../server/schemas/assistants/assistants.py | 0 .../server/schemas/assistants/messages.py | 0 .../ktransformers/server/schemas/assistants/runs.py | 0 .../server/schemas/assistants/streaming.py | 0 .../server/schemas/assistants/threads.py | 0 .../ktransformers/server/schemas/assistants/tool.py | 0 .../ktransformers/server/schemas/base.py | 0 .../ktransformers/server/schemas/conversation.py | 0 .../ktransformers/server/schemas/endpoints/chat.py | 0 .../ktransformers/server/schemas/legacy/__init__.py | 0 .../server/schemas/legacy/completions.py | 0 .../ktransformers/server/utils/__init__.py | 0 .../ktransformers/server/utils/create_interface.py | 0 .../ktransformers/server/utils/multi_timer.py | 0 .../ktransformers/server/utils/sql_utils.py | 0 {KT-SFT => kt-sft}/ktransformers/sft/__init__.py | 0 .../ktransformers/sft/flops_utils/__init__.py | 0 .../ktransformers/sft/flops_utils/custom_profile.py | 0 .../sft/flops_utils/lora_test_utils.py | 2 +- {KT-SFT => kt-sft}/ktransformers/sft/lora.py | 0 {KT-SFT => kt-sft}/ktransformers/sft/metrics.py | 0 .../ktransformers/sft/metrics_utils/__init__.py | 0 .../ktransformers/sft/metrics_utils/constants.py | 0 .../ktransformers/sft/metrics_utils/env.py | 0 .../ktransformers/sft/metrics_utils/logging.py | 0 .../ktransformers/sft/metrics_utils/misc.py | 0 .../ktransformers/sft/metrics_utils/packages.py | 0 .../ktransformers/sft/metrics_utils/ploting.py | 0 .../ktransformers/sft/monkey_patch_torch_module.py | 0 .../ktransformers/sft/peft_utils/__init__.py | 0 .../ktransformers/sft/peft_utils/lora_layer.py | 0 .../ktransformers/sft/peft_utils/lora_model.py | 0 .../ktransformers/sft/peft_utils/mapping.py | 0 .../ktransformers/sft/peft_utils/peft_model.py | 0 .../ktransformers/sft/torchviz_test.py | 0 {KT-SFT => kt-sft}/ktransformers/tests/.gitignore | 0 .../ktransformers/tests/AIME_2024/eval_api.py | 0 .../ktransformers/tests/AIME_2024/evaluation.py | 0 .../ktransformers/tests/AIME_2024/prompts.py | 0 .../ktransformers/tests/dequant_gpu.py | 0 .../ktransformers/tests/dequant_gpu_t.py | 0 .../ktransformers/tests/function_call_test.py | 0 .../ktransformers/tests/humaneval/eval_api.py | 0 .../ktransformers/tests/humaneval/evaluation.py | 0 .../ktransformers/tests/humaneval/prompts.py | 0 .../ktransformers/tests/mmlu_pro_test.py | 0 {KT-SFT => kt-sft}/ktransformers/tests/mmlu_test.py | 0 .../ktransformers/tests/mmlu_test_multi.py | 0 {KT-SFT => kt-sft}/ktransformers/tests/score.py | 0 .../ktransformers/tests/test_client.py | 0 .../ktransformers/tests/test_pytorch_q8.py | 0 .../ktransformers/tests/test_speed.py | 0 .../ktransformers/tests/triton_fp8gemm_test.py | 0 .../ktransformers/util/cuda_graph_runner.py | 0 .../ktransformers/util/custom_gguf.py | 0 .../ktransformers/util/custom_loader.py | 0 {KT-SFT => kt-sft}/ktransformers/util/globals.py | 0 .../ktransformers/util/grad_wrapper.py | 0 .../ktransformers/util/inference_state.py | 0 .../ktransformers/util/modeling_rope_utils.py | 0 {KT-SFT => kt-sft}/ktransformers/util/textstream.py | 0 {KT-SFT => kt-sft}/ktransformers/util/utils.py | 0 {KT-SFT => kt-sft}/ktransformers/util/vendors.py | 0 .../ktransformers/util/weight_loader.py | 0 .../ktransformers/website/.browserslistrc | 0 .../ktransformers/website/.eslintrc.js | 0 {KT-SFT => kt-sft}/ktransformers/website/.gitignore | 0 {KT-SFT => kt-sft}/ktransformers/website/README.md | 0 .../ktransformers/website/config.d.ts | 0 .../ktransformers/website/jest.config.js | 0 .../ktransformers/website/package-lock.json | 0 .../ktransformers/website/package.json | 0 .../ktransformers/website/public/balck.ico | Bin .../ktransformers/website/public/config.js | 0 .../ktransformers/website/public/css/reset.css | 0 .../website/public/images/assistant-avatar.png | Bin .../ktransformers/website/public/images/avatar.png | Bin .../ktransformers/website/public/images/bgbg.png | Bin .../ktransformers/website/public/images/logo.ico | Bin .../ktransformers/website/public/images/logo.png | Bin .../ktransformers/website/public/images/three.png | Bin .../website/public/images/user-filling.png | Bin .../ktransformers/website/public/index.html | 0 .../ktransformers/website/src/App.vue | 0 .../ktransformers/website/src/api/api-client.ts | 0 .../ktransformers/website/src/api/assistant.ts | 0 .../ktransformers/website/src/api/message.ts | 0 .../ktransformers/website/src/api/run.ts | 0 .../ktransformers/website/src/api/thread.ts | 0 .../website/src/assets/css/mixins.styl | 0 .../website/src/assets/iconfont/demo.css | 0 .../website/src/assets/iconfont/demo_index.html | 0 .../website/src/assets/iconfont/iconfont.css | 0 .../website/src/assets/iconfont/iconfont.js | 0 .../website/src/assets/iconfont/iconfont.json | 0 .../website/src/assets/iconfont/iconfont.ttf | Bin .../website/src/assets/iconfont/iconfont.woff | Bin .../website/src/assets/iconfont/iconfont.woff2 | Bin .../website/src/components/chat/index.vue | 0 .../ktransformers/website/src/conf/config.ts | 0 .../ktransformers/website/src/locals/en.js | 0 .../ktransformers/website/src/locals/index.js | 0 .../ktransformers/website/src/locals/zh.js | 0 .../ktransformers/website/src/main.ts | 0 .../ktransformers/website/src/router/index.ts | 0 .../ktransformers/website/src/shims-vue.d.ts | 0 .../ktransformers/website/src/store/index.ts | 0 .../ktransformers/website/src/utils/copy.ts | 0 .../ktransformers/website/src/utils/types.ts | 0 .../ktransformers/website/src/views/home.vue | 0 .../website/tests/unit/example.spec.ts | 0 .../ktransformers/website/tsconfig.json | 0 .../ktransformers/website/vue.config.js | 0 .../merge_tensors/merge_safetensor_gguf.py | 0 {KT-SFT => kt-sft}/pyproject.toml | 0 {KT-SFT => kt-sft}/requirements-sft.txt | 0 {KT-SFT => kt-sft}/setup.py | 0 {KT-SFT => kt-sft}/test_adapter/data_transfer.py | 0 .../test_adapter/infer_with_adapter.py | 0 {KT-SFT => kt-sft}/test_adapter/inspect_adapter.py | 0 {KT-SFT => kt-sft}/test_adapter/pred2metrics.py | 0 {KT-SFT => kt-sft}/test_adapter/test_grad.py | 2 +- .../test_adapter/time_test_lora_train.py | 0 {KT-SFT => kt-sft}/withoutKT_PEFT.py | 0 386 files changed, 33 insertions(+), 33 deletions(-) rename {KT-SFT => kt-sft}/.flake8 (100%) rename {KT-SFT => kt-sft}/.gitignore (100%) rename {KT-SFT => kt-sft}/.gitmodules (100%) rename {KT-SFT => kt-sft}/.pylintrc (100%) rename {KT-SFT => kt-sft}/Dockerfile (100%) rename {KT-SFT => kt-sft}/Dockerfile.xpu (100%) rename {KT-SFT => kt-sft}/LICENSE (100%) rename {KT-SFT => kt-sft}/MANIFEST.in (100%) rename {KT-SFT => kt-sft}/Makefile (100%) rename {KT-SFT => kt-sft}/README.md (100%) rename {KT-SFT => kt-sft}/SECURITY.md (100%) rename {KT-SFT => kt-sft}/WeChatGroup.png (100%) rename {KT-SFT => kt-sft}/autosetup.sh (100%) rename {KT-SFT => kt-sft}/book.toml (100%) rename {KT-SFT => kt-sft}/csrc/custom_marlin/__init__.py (100%) rename {KT-SFT => kt-sft}/csrc/custom_marlin/binding.cpp (100%) rename {KT-SFT => kt-sft}/csrc/custom_marlin/gptq_marlin/gptq_marlin.cu (100%) rename {KT-SFT => kt-sft}/csrc/custom_marlin/gptq_marlin/gptq_marlin.cuh (100%) rename {KT-SFT => kt-sft}/csrc/custom_marlin/gptq_marlin/gptq_marlin_dtypes.cuh (100%) rename {KT-SFT => kt-sft}/csrc/custom_marlin/gptq_marlin/gptq_marlin_repack.cu (100%) rename {KT-SFT => kt-sft}/csrc/custom_marlin/gptq_marlin/ops.h (100%) rename {KT-SFT => kt-sft}/csrc/custom_marlin/setup.py (100%) rename {KT-SFT => kt-sft}/csrc/custom_marlin/test_cuda_graph.py (100%) rename {KT-SFT => kt-sft}/csrc/custom_marlin/utils/__init__.py (100%) rename {KT-SFT => kt-sft}/csrc/custom_marlin/utils/format24.py (100%) rename {KT-SFT => kt-sft}/csrc/custom_marlin/utils/marlin_24_perms.py (100%) rename {KT-SFT => kt-sft}/csrc/custom_marlin/utils/marlin_perms.py (100%) rename {KT-SFT => kt-sft}/csrc/custom_marlin/utils/marlin_utils.py (100%) rename {KT-SFT => kt-sft}/csrc/custom_marlin/utils/quant_utils.py (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/CMakeLists.txt (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/bench/bench_attention.py (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/bench/bench_attention_torch.py (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/bench/bench_linear.py (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/bench/bench_linear_torch.py (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/bench/bench_mlp.py (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/bench/bench_mlp_torch.py (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/bench/bench_moe.py (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/bench/bench_moe_amx.py (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/bench/bench_moe_torch.py (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/cmake/FindSIMD.cmake (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/cpu_backend/backend.cpp (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/cpu_backend/backend.h (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/cpu_backend/cpuinfer.h (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/cpu_backend/shared_mem_buffer.cpp (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/cpu_backend/shared_mem_buffer.h (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/cpu_backend/task_queue.cpp (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/cpu_backend/task_queue.h (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/cpu_backend/vendors/README.md (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/cpu_backend/vendors/cuda.h (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/cpu_backend/vendors/hip.h (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/cpu_backend/vendors/musa.h (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/cpu_backend/vendors/vendor.h (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/cuda/binding.cpp (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/cuda/custom_gguf/dequant.cu (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/cuda/custom_gguf/ops.h (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/cuda/gptq_marlin/gptq_marlin.cu (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/cuda/gptq_marlin/gptq_marlin.cuh (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/cuda/gptq_marlin/gptq_marlin_dtypes.cuh (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/cuda/gptq_marlin/ops.h (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/cuda/setup.py (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/cuda/test_dequant.py (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/examples/test_attention.py (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/examples/test_linear.py (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/examples/test_mlp.py (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/examples/test_moe.py (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/examples/test_sft_amx_moe.py (98%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/examples/test_sft_moe.py (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/ext_bindings.cpp (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/operators/amx/debug_sft_moe.hpp (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/operators/amx/debug_tools_sft_moe.hpp (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/operators/amx/la/amx.hpp (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/operators/amx/la/utils.hpp (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/operators/amx/moe.hpp (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/operators/amx/sft_moe.hpp (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/operators/kvcache/kvcache.h (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/operators/kvcache/kvcache_attn.cpp (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/operators/kvcache/kvcache_load_dump.cpp (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/operators/kvcache/kvcache_read_write.cpp (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/operators/kvcache/kvcache_utils.cpp (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/operators/llamafile/conversion.h (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/operators/llamafile/linear.cpp (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/operators/llamafile/linear.h (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/operators/llamafile/mlp.cpp (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/operators/llamafile/mlp.h (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/operators/llamafile/moe.cpp (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/operators/llamafile/moe.h (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/operators/llamafile/sft_moe.cpp (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/operators/llamafile/sft_moe.h (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/operators/llamafile/sft_moe_forward_cache.h (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/vendors/cuda.h (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/vendors/hip.h (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/vendors/musa.h (100%) rename {KT-SFT => kt-sft}/csrc/ktransformers_ext/vendors/vendor.h (100%) rename {KT-SFT => kt-sft}/install-with-cache.sh (100%) rename {KT-SFT => kt-sft}/install.bat (100%) rename {KT-SFT => kt-sft}/install.sh (100%) rename {KT-SFT => kt-sft}/ktransformers/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/configs/config.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/configs/log_config.ini (100%) rename {KT-SFT => kt-sft}/ktransformers/configs/model_config/config.json (100%) rename {KT-SFT => kt-sft}/ktransformers/configs/model_config/configuration_deepseek.py (100%) rename {KT-SFT => kt-sft}/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/format_24.py (100%) rename {KT-SFT => kt-sft}/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/marlin_24_perms.py (100%) rename {KT-SFT => kt-sft}/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/marlin_perms.py (100%) rename {KT-SFT => kt-sft}/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/marlin_utils.py (100%) rename {KT-SFT => kt-sft}/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/quant_utils.py (100%) rename {KT-SFT => kt-sft}/ktransformers/ktransformers_ext/triton/fp8gemm.py (100%) rename {KT-SFT => kt-sft}/ktransformers/local_chat.py (100%) rename {KT-SFT => kt-sft}/ktransformers/local_chat.sh (100%) rename {KT-SFT => kt-sft}/ktransformers/lora_test_module.py (100%) rename {KT-SFT => kt-sft}/ktransformers/models/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/models/configuration_deepseek.py (100%) rename {KT-SFT => kt-sft}/ktransformers/models/configuration_deepseek_v3.py (100%) rename {KT-SFT => kt-sft}/ktransformers/models/configuration_llama.py (100%) rename {KT-SFT => kt-sft}/ktransformers/models/configuration_qwen2_moe.py (100%) rename {KT-SFT => kt-sft}/ktransformers/models/configuration_qwen3_moe.py (100%) rename {KT-SFT => kt-sft}/ktransformers/models/custom_cache.py (100%) rename {KT-SFT => kt-sft}/ktransformers/models/custom_modeling_deepseek_v2.py (100%) rename {KT-SFT => kt-sft}/ktransformers/models/custom_modeling_deepseek_v3.py (100%) rename {KT-SFT => kt-sft}/ktransformers/models/custom_modeling_qwen2_moe.py (100%) rename {KT-SFT => kt-sft}/ktransformers/models/custom_modeling_qwen3_moe.py (100%) rename {KT-SFT => kt-sft}/ktransformers/models/modeling_deepseek.py (100%) rename {KT-SFT => kt-sft}/ktransformers/models/modeling_deepseek_v3.py (100%) rename {KT-SFT => kt-sft}/ktransformers/models/modeling_llama.py (100%) rename {KT-SFT => kt-sft}/ktransformers/models/modeling_mixtral.py (100%) rename {KT-SFT => kt-sft}/ktransformers/models/modeling_qwen2_moe.py (100%) rename {KT-SFT => kt-sft}/ktransformers/models/modeling_qwen3_moe.py (100%) rename {KT-SFT => kt-sft}/ktransformers/moe_test_module.py (100%) rename {KT-SFT => kt-sft}/ktransformers/moe_test_module_old.py (100%) rename {KT-SFT => kt-sft}/ktransformers/operators/RoPE.py (100%) rename {KT-SFT => kt-sft}/ktransformers/operators/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/operators/attention.py (100%) rename {KT-SFT => kt-sft}/ktransformers/operators/balance_serve_attention.py (100%) rename {KT-SFT => kt-sft}/ktransformers/operators/base_operator.py (100%) rename {KT-SFT => kt-sft}/ktransformers/operators/cpuinfer.py (100%) rename {KT-SFT => kt-sft}/ktransformers/operators/dynamic_attention.py (100%) rename {KT-SFT => kt-sft}/ktransformers/operators/experts.py (100%) rename {KT-SFT => kt-sft}/ktransformers/operators/flashinfer_batch_prefill_wrapper.py (100%) rename {KT-SFT => kt-sft}/ktransformers/operators/flashinfer_wrapper.py (100%) rename {KT-SFT => kt-sft}/ktransformers/operators/gate.py (100%) rename {KT-SFT => kt-sft}/ktransformers/operators/layernorm.py (100%) rename {KT-SFT => kt-sft}/ktransformers/operators/linear.py (100%) rename {KT-SFT => kt-sft}/ktransformers/operators/mlp.py (100%) rename {KT-SFT => kt-sft}/ktransformers/operators/models.py (100%) rename {KT-SFT => kt-sft}/ktransformers/operators/triton_attention.py (100%) rename {KT-SFT => kt-sft}/ktransformers/operators/triton_attention_prefill.py (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize.py (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/DeepSeek-V2-Chat-multi-gpu-4.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/DeepSeek-V2-Chat-multi-gpu.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/DeepSeek-V2-Chat-sft-amx.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/DeepSeek-V2-Chat.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat-multi-gpu.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat-sft-amx-multi-gpu.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat-sft-amx.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat-sft.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat-use-adapter.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-amx.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-fp8-linear-ggml-experts-serve-amx.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-fp8-linear-ggml-experts-serve.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-fp8-linear-ggml-experts.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-multi-gpu-4.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-multi-gpu-8.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-multi-gpu-fp8-linear-ggml-experts.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-multi-gpu-marlin.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-multi-gpu.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-serve.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-sft-amx-multi-gpu-4.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-sft-amx-multi-gpu.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-sft-amx.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/Internlm2_5-7b-Chat-1m.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/Mixtral.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/Moonlight-16B-A3B-serve.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/Moonlight-16B-A3B.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/Qwen2-57B-A14B-Instruct-multi-gpu.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/Qwen2-57B-A14B-Instruct.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/Qwen2-serve-amx.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/Qwen2-serve.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/Qwen3Moe-serve-amx.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/Qwen3Moe-serve.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/Qwen3Moe-sft-amx.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/rocm/DeepSeek-V3-Chat.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/xpu/DeepSeek-V2-Chat.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/xpu/DeepSeek-V3-Chat.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/optimize/optimize_rules/xpu/Qwen3Moe-Chat.yaml (100%) rename {KT-SFT => kt-sft}/ktransformers/server/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/api/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/api/ollama/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/api/ollama/completions.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/api/openai/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/api/openai/assistants/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/api/openai/assistants/assistants.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/api/openai/assistants/messages.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/api/openai/assistants/runs.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/api/openai/assistants/threads.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/api/openai/endpoints/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/api/openai/endpoints/chat.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/api/openai/legacy/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/api/openai/legacy/completions.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/api/web/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/api/web/system.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/args.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/backend/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/backend/args.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/backend/base.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/backend/context_manager.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/backend/interfaces/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/backend/interfaces/balance_serve.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/backend/interfaces/exllamav2.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/backend/interfaces/ktransformers.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/backend/interfaces/transformers.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/balance_serve/inference/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/balance_serve/inference/config.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/balance_serve/inference/distributed/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/balance_serve/inference/distributed/communication_op.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/balance_serve/inference/distributed/cuda_wrapper.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/balance_serve/inference/distributed/custom_all_reduce.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/balance_serve/inference/distributed/custom_all_reduce_utils.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/balance_serve/inference/distributed/parallel_state.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/balance_serve/inference/distributed/pynccl.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/balance_serve/inference/distributed/pynccl_wrapper.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/balance_serve/inference/distributed/utils.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/balance_serve/inference/forward_batch.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/balance_serve/inference/model_runner.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/balance_serve/inference/query_manager.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/balance_serve/inference/sampling/penaltylib/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/balance_serve/inference/sampling/penaltylib/orchestrator.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/balance_serve/inference/sampling/penaltylib/penalizers/frequency_penalty.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/balance_serve/inference/sampling/penaltylib/penalizers/min_new_tokens.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/balance_serve/inference/sampling/penaltylib/penalizers/presence_penalty.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/balance_serve/inference/sampling/penaltylib/penalizers/repetition_penalty.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/balance_serve/inference/sampling/sampler.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/balance_serve/sched_rpc.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/balance_serve/settings.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/config/config.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/config/log.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/config/singleton.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/crud/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/crud/assistants/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/crud/assistants/assistants.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/crud/assistants/messages.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/crud/assistants/runs.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/crud/assistants/threads.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/exceptions.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/main.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/models/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/models/assistants/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/models/assistants/assistants.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/models/assistants/messages.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/models/assistants/run_steps.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/models/assistants/runs.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/models/assistants/threads.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/schemas/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/schemas/assistants/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/schemas/assistants/assistants.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/schemas/assistants/messages.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/schemas/assistants/runs.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/schemas/assistants/streaming.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/schemas/assistants/threads.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/schemas/assistants/tool.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/schemas/base.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/schemas/conversation.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/schemas/endpoints/chat.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/schemas/legacy/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/schemas/legacy/completions.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/utils/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/utils/create_interface.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/utils/multi_timer.py (100%) rename {KT-SFT => kt-sft}/ktransformers/server/utils/sql_utils.py (100%) rename {KT-SFT => kt-sft}/ktransformers/sft/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/sft/flops_utils/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/sft/flops_utils/custom_profile.py (100%) rename {KT-SFT => kt-sft}/ktransformers/sft/flops_utils/lora_test_utils.py (99%) rename {KT-SFT => kt-sft}/ktransformers/sft/lora.py (100%) rename {KT-SFT => kt-sft}/ktransformers/sft/metrics.py (100%) rename {KT-SFT => kt-sft}/ktransformers/sft/metrics_utils/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/sft/metrics_utils/constants.py (100%) rename {KT-SFT => kt-sft}/ktransformers/sft/metrics_utils/env.py (100%) rename {KT-SFT => kt-sft}/ktransformers/sft/metrics_utils/logging.py (100%) rename {KT-SFT => kt-sft}/ktransformers/sft/metrics_utils/misc.py (100%) rename {KT-SFT => kt-sft}/ktransformers/sft/metrics_utils/packages.py (100%) rename {KT-SFT => kt-sft}/ktransformers/sft/metrics_utils/ploting.py (100%) rename {KT-SFT => kt-sft}/ktransformers/sft/monkey_patch_torch_module.py (100%) rename {KT-SFT => kt-sft}/ktransformers/sft/peft_utils/__init__.py (100%) rename {KT-SFT => kt-sft}/ktransformers/sft/peft_utils/lora_layer.py (100%) rename {KT-SFT => kt-sft}/ktransformers/sft/peft_utils/lora_model.py (100%) rename {KT-SFT => kt-sft}/ktransformers/sft/peft_utils/mapping.py (100%) rename {KT-SFT => kt-sft}/ktransformers/sft/peft_utils/peft_model.py (100%) rename {KT-SFT => kt-sft}/ktransformers/sft/torchviz_test.py (100%) rename {KT-SFT => kt-sft}/ktransformers/tests/.gitignore (100%) rename {KT-SFT => kt-sft}/ktransformers/tests/AIME_2024/eval_api.py (100%) rename {KT-SFT => kt-sft}/ktransformers/tests/AIME_2024/evaluation.py (100%) rename {KT-SFT => kt-sft}/ktransformers/tests/AIME_2024/prompts.py (100%) rename {KT-SFT => kt-sft}/ktransformers/tests/dequant_gpu.py (100%) rename {KT-SFT => kt-sft}/ktransformers/tests/dequant_gpu_t.py (100%) rename {KT-SFT => kt-sft}/ktransformers/tests/function_call_test.py (100%) rename {KT-SFT => kt-sft}/ktransformers/tests/humaneval/eval_api.py (100%) rename {KT-SFT => kt-sft}/ktransformers/tests/humaneval/evaluation.py (100%) rename {KT-SFT => kt-sft}/ktransformers/tests/humaneval/prompts.py (100%) rename {KT-SFT => kt-sft}/ktransformers/tests/mmlu_pro_test.py (100%) rename {KT-SFT => kt-sft}/ktransformers/tests/mmlu_test.py (100%) rename {KT-SFT => kt-sft}/ktransformers/tests/mmlu_test_multi.py (100%) rename {KT-SFT => kt-sft}/ktransformers/tests/score.py (100%) rename {KT-SFT => kt-sft}/ktransformers/tests/test_client.py (100%) rename {KT-SFT => kt-sft}/ktransformers/tests/test_pytorch_q8.py (100%) rename {KT-SFT => kt-sft}/ktransformers/tests/test_speed.py (100%) rename {KT-SFT => kt-sft}/ktransformers/tests/triton_fp8gemm_test.py (100%) rename {KT-SFT => kt-sft}/ktransformers/util/cuda_graph_runner.py (100%) rename {KT-SFT => kt-sft}/ktransformers/util/custom_gguf.py (100%) rename {KT-SFT => kt-sft}/ktransformers/util/custom_loader.py (100%) rename {KT-SFT => kt-sft}/ktransformers/util/globals.py (100%) rename {KT-SFT => kt-sft}/ktransformers/util/grad_wrapper.py (100%) rename {KT-SFT => kt-sft}/ktransformers/util/inference_state.py (100%) rename {KT-SFT => kt-sft}/ktransformers/util/modeling_rope_utils.py (100%) rename {KT-SFT => kt-sft}/ktransformers/util/textstream.py (100%) rename {KT-SFT => kt-sft}/ktransformers/util/utils.py (100%) rename {KT-SFT => kt-sft}/ktransformers/util/vendors.py (100%) rename {KT-SFT => kt-sft}/ktransformers/util/weight_loader.py (100%) rename {KT-SFT => kt-sft}/ktransformers/website/.browserslistrc (100%) rename {KT-SFT => kt-sft}/ktransformers/website/.eslintrc.js (100%) rename {KT-SFT => kt-sft}/ktransformers/website/.gitignore (100%) rename {KT-SFT => kt-sft}/ktransformers/website/README.md (100%) rename {KT-SFT => kt-sft}/ktransformers/website/config.d.ts (100%) rename {KT-SFT => kt-sft}/ktransformers/website/jest.config.js (100%) rename {KT-SFT => kt-sft}/ktransformers/website/package-lock.json (100%) rename {KT-SFT => kt-sft}/ktransformers/website/package.json (100%) rename {KT-SFT => kt-sft}/ktransformers/website/public/balck.ico (100%) rename {KT-SFT => kt-sft}/ktransformers/website/public/config.js (100%) rename {KT-SFT => kt-sft}/ktransformers/website/public/css/reset.css (100%) rename {KT-SFT => kt-sft}/ktransformers/website/public/images/assistant-avatar.png (100%) rename {KT-SFT => kt-sft}/ktransformers/website/public/images/avatar.png (100%) rename {KT-SFT => kt-sft}/ktransformers/website/public/images/bgbg.png (100%) rename {KT-SFT => kt-sft}/ktransformers/website/public/images/logo.ico (100%) rename {KT-SFT => kt-sft}/ktransformers/website/public/images/logo.png (100%) rename {KT-SFT => kt-sft}/ktransformers/website/public/images/three.png (100%) rename {KT-SFT => kt-sft}/ktransformers/website/public/images/user-filling.png (100%) rename {KT-SFT => kt-sft}/ktransformers/website/public/index.html (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/App.vue (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/api/api-client.ts (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/api/assistant.ts (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/api/message.ts (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/api/run.ts (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/api/thread.ts (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/assets/css/mixins.styl (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/assets/iconfont/demo.css (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/assets/iconfont/demo_index.html (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/assets/iconfont/iconfont.css (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/assets/iconfont/iconfont.js (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/assets/iconfont/iconfont.json (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/assets/iconfont/iconfont.ttf (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/assets/iconfont/iconfont.woff (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/assets/iconfont/iconfont.woff2 (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/components/chat/index.vue (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/conf/config.ts (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/locals/en.js (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/locals/index.js (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/locals/zh.js (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/main.ts (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/router/index.ts (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/shims-vue.d.ts (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/store/index.ts (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/utils/copy.ts (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/utils/types.ts (100%) rename {KT-SFT => kt-sft}/ktransformers/website/src/views/home.vue (100%) rename {KT-SFT => kt-sft}/ktransformers/website/tests/unit/example.spec.ts (100%) rename {KT-SFT => kt-sft}/ktransformers/website/tsconfig.json (100%) rename {KT-SFT => kt-sft}/ktransformers/website/vue.config.js (100%) rename {KT-SFT => kt-sft}/merge_tensors/merge_safetensor_gguf.py (100%) rename {KT-SFT => kt-sft}/pyproject.toml (100%) rename {KT-SFT => kt-sft}/requirements-sft.txt (100%) rename {KT-SFT => kt-sft}/setup.py (100%) rename {KT-SFT => kt-sft}/test_adapter/data_transfer.py (100%) rename {KT-SFT => kt-sft}/test_adapter/infer_with_adapter.py (100%) rename {KT-SFT => kt-sft}/test_adapter/inspect_adapter.py (100%) rename {KT-SFT => kt-sft}/test_adapter/pred2metrics.py (100%) rename {KT-SFT => kt-sft}/test_adapter/test_grad.py (90%) rename {KT-SFT => kt-sft}/test_adapter/time_test_lora_train.py (100%) rename {KT-SFT => kt-sft}/withoutKT_PEFT.py (100%) diff --git a/README.md b/README.md index 0d597e91..4b928228 100644 --- a/README.md +++ b/README.md @@ -8,12 +8,12 @@

A Flexible Framework for Experiencing Cutting-edge LLM Inference/Fine-tune Optimizations

- 🎯 Overview | 🚀 kt-kernel | 🎓 KT-SFT | 🔥 Citation | 🚀 Roadmap(2025Q4) + 🎯 Overview | 🚀 kt-kernel | 🎓 kt-sft | 🔥 Citation | 🚀 Roadmap(2025Q4) ## 🎯 Overview -KTransformers is a research project focused on efficient inference and fine-tuning of large language models through CPU-GPU heterogeneous computing. The project has evolved into **two core modules**: [kt-kernel](./kt-kernel/) and [KT-SFT](./KT-SFT/). +KTransformers is a research project focused on efficient inference and fine-tuning of large language models through CPU-GPU heterogeneous computing. The project has evolved into **two core modules**: [kt-kernel](./kt-kernel/) and [kt-sft](./kt-sft/). ## 🔥 Updates @@ -79,7 +79,7 @@ pip install . --- -### 🎓 [KT-SFT](./KT-SFT/) - Fine-Tuning Framework +### 🎓 [kt-sft](./kt-sft/) - Fine-Tuning Framework KTransformers × LLaMA-Factory integration for ultra-large MoE model fine-tuning. @@ -101,12 +101,12 @@ KTransformers × LLaMA-Factory integration for ultra-large MoE model fine-tuning **Quick Start:** ```bash -cd KT-SFT -# Install environment following KT-SFT/README.md +cd kt-sft +# Install environment following kt-sft/README.md USE_KT=1 llamafactory-cli train examples/train_lora/deepseek3_lora_sft_kt.yaml ``` -👉 **[Full Documentation →](./KT-SFT/README.md)** +👉 **[Full Documentation →](./kt-sft/README.md)** --- diff --git a/README_ZH.md b/README_ZH.md index 20ddd721..0f0c7971 100644 --- a/README_ZH.md +++ b/README_ZH.md @@ -8,12 +8,12 @@

一个用于体验尖端 LLM 推理/微调优化的灵活框架

- 🎯 概览 | 🚀 kt-kernel | 🎓 KT-SFT | 🔥 引用 + 🎯 概览 | 🚀 kt-kernel | 🎓 kt-sft | 🔥 引用 ## 🎯 概览 -KTransformers 是一个专注于通过 CPU-GPU 异构计算实现大语言模型高效推理和微调的研究项目。该项目已发展为**两个核心模块**:[kt-kernel](./kt-kernel/) 和 [KT-SFT](./KT-SFT/)。 +KTransformers 是一个专注于通过 CPU-GPU 异构计算实现大语言模型高效推理和微调的研究项目。该项目已发展为**两个核心模块**:[kt-kernel](./kt-kernel/) 和 [kt-sft](./kt-sft/)。 ## 🔥 更新 @@ -78,7 +78,7 @@ pip install . --- -### 🎓 [KT-SFT](./KT-SFT/) - 微调框架 +### 🎓 [kt-sft](./kt-sft/) - 微调框架 KTransformers × LLaMA-Factory 集成,用于超大型 MoE 模型微调。 @@ -100,12 +100,12 @@ KTransformers × LLaMA-Factory 集成,用于超大型 MoE 模型微调。 **快速开始:** ```bash -cd KT-SFT -# 按照 KT-SFT/README.md 安装环境 +cd kt-sft +# 按照 kt-sft/README.md 安装环境 USE_KT=1 llamafactory-cli train examples/train_lora/deepseek3_lora_sft_kt.yaml ``` -👉 **[完整文档 →](./KT-SFT/README.md)** +👉 **[完整文档 →](./kt-sft/README.md)** --- diff --git a/archive/README.md b/archive/README.md index 56cb4d80..25de7841 100644 --- a/archive/README.md +++ b/archive/README.md @@ -9,7 +9,7 @@ ## 🎯 Overview -KTransformers is a research project focused on efficient inference and fine-tuning of large language models through CPU-GPU heterogeneous computing. The project has evolved into **two core modules**: [kt-kernel](./kt-kernel/) and [KT-SFT](./KT-SFT/). +KTransformers is a research project focused on efficient inference and fine-tuning of large language models through CPU-GPU heterogeneous computing. The project has evolved into **two core modules**: [kt-kernel](./kt-kernel/) and [kt-sft](./kt-sft/). ## 🔥 Updates @@ -67,7 +67,7 @@ pip install . --- -### 🎓 [KT-SFT](./KT-SFT/) - Fine-Tuning Framework +### 🎓 [kt-sft](./kt-sft/) - Fine-Tuning Framework KTransformers × LLaMA-Factory integration for ultra-large MoE model fine-tuning. @@ -89,12 +89,12 @@ KTransformers × LLaMA-Factory integration for ultra-large MoE model fine-tuning **Quick Start:** ```bash -cd KT-SFT -# Install environment following KT-SFT/README.md +cd kt-sft +# Install environment following kt-sft/README.md USE_KT=1 llamafactory-cli train examples/train_lora/deepseek3_lora_sft_kt.yaml ``` -👉 **[Full Documentation →](./KT-SFT/README.md)** +👉 **[Full Documentation →](./kt-sft/README.md)** --- diff --git a/archive/README_ZH.md b/archive/README_ZH.md index d91ee804..4993f860 100644 --- a/archive/README_ZH.md +++ b/archive/README_ZH.md @@ -9,7 +9,7 @@ ## 🎯 项目概述 -KTransformers 是一个专注于大语言模型高效推理和微调的研究项目,通过 CPU-GPU 异构计算实现资源受限环境下的模型部署。项目已演进为**两个核心模块**:[kt-kernel](./kt-kernel/) 和 [KT-SFT](./KT-SFT/)。 +KTransformers 是一个专注于大语言模型高效推理和微调的研究项目,通过 CPU-GPU 异构计算实现资源受限环境下的模型部署。项目已演进为**两个核心模块**:[kt-kernel](./kt-kernel/) 和 [kt-sft](./kt-sft/)。 ## 🔥 更新 @@ -66,7 +66,7 @@ pip install . --- -### 🎓 [KT-SFT](./KT-SFT/) - 微调框架 +### 🎓 [kt-sft](./kt-sft/) - 微调框架 KTransformers × LLaMA-Factory 集成,支持超大 MoE 模型微调。 @@ -86,12 +86,12 @@ KTransformers × LLaMA-Factory 集成,支持超大 MoE 模型微调。 **快速开始:** ```bash -cd KT-SFT -# 按照 KT-SFT/README.md 安装环境 +cd kt-sft +# 按照 kt-sft/README.md 安装环境 USE_KT=1 llamafactory-cli train examples/train_lora/deepseek3_lora_sft_kt.yaml ``` -👉 **[完整文档 →](./KT-SFT/README.md)** +👉 **[完整文档 →](./kt-sft/README.md)** --- diff --git a/doc/SUMMARY.md b/doc/SUMMARY.md index f9e62328..af806727 100644 --- a/doc/SUMMARY.md +++ b/doc/SUMMARY.md @@ -3,11 +3,11 @@ [Introduction](./README.md) # Install & Usage - [For kt-kernel](en/kt-kernel/kt-kernel_intro.md) -- [For SFT](en/SFT/KTransformers-Fine-Tuning_User-Guide.md) +- [For kt-sft](en/SFT/KTransformers-Fine-Tuning_User-Guide.md) # Tutorial -- [SFT part](en/SFT/README.md) - - [SFT developer tech notes](en/SFT/KTransformers-Fine-Tuning_Developer-Technical-Notes.md) +- [kt-sft part](en/SFT/README.md) + - [kt-sft developer tech notes](en/SFT/KTransformers-Fine-Tuning_Developer-Technical-Notes.md) - [Injection Tutorial](en/SFT/injection_tutorial.md) diff --git a/doc/en/SFT/README.md b/doc/en/SFT/README.md index fc3a5f56..174cb402 100644 --- a/doc/en/SFT/README.md +++ b/doc/en/SFT/README.md @@ -1 +1 @@ -# SFT Docs \ No newline at end of file +# kt-sft Docs \ No newline at end of file diff --git a/KT-SFT/.flake8 b/kt-sft/.flake8 similarity index 100% rename from KT-SFT/.flake8 rename to kt-sft/.flake8 diff --git a/KT-SFT/.gitignore b/kt-sft/.gitignore similarity index 100% rename from KT-SFT/.gitignore rename to kt-sft/.gitignore diff --git a/KT-SFT/.gitmodules b/kt-sft/.gitmodules similarity index 100% rename from KT-SFT/.gitmodules rename to kt-sft/.gitmodules diff --git a/KT-SFT/.pylintrc b/kt-sft/.pylintrc similarity index 100% rename from KT-SFT/.pylintrc rename to kt-sft/.pylintrc diff --git a/KT-SFT/Dockerfile b/kt-sft/Dockerfile similarity index 100% rename from KT-SFT/Dockerfile rename to kt-sft/Dockerfile diff --git a/KT-SFT/Dockerfile.xpu b/kt-sft/Dockerfile.xpu similarity index 100% rename from KT-SFT/Dockerfile.xpu rename to kt-sft/Dockerfile.xpu diff --git a/KT-SFT/LICENSE b/kt-sft/LICENSE similarity index 100% rename from KT-SFT/LICENSE rename to kt-sft/LICENSE diff --git a/KT-SFT/MANIFEST.in b/kt-sft/MANIFEST.in similarity index 100% rename from KT-SFT/MANIFEST.in rename to kt-sft/MANIFEST.in diff --git a/KT-SFT/Makefile b/kt-sft/Makefile similarity index 100% rename from KT-SFT/Makefile rename to kt-sft/Makefile diff --git a/KT-SFT/README.md b/kt-sft/README.md similarity index 100% rename from KT-SFT/README.md rename to kt-sft/README.md diff --git a/KT-SFT/SECURITY.md b/kt-sft/SECURITY.md similarity index 100% rename from KT-SFT/SECURITY.md rename to kt-sft/SECURITY.md diff --git a/KT-SFT/WeChatGroup.png b/kt-sft/WeChatGroup.png similarity index 100% rename from KT-SFT/WeChatGroup.png rename to kt-sft/WeChatGroup.png diff --git a/KT-SFT/autosetup.sh b/kt-sft/autosetup.sh similarity index 100% rename from KT-SFT/autosetup.sh rename to kt-sft/autosetup.sh diff --git a/KT-SFT/book.toml b/kt-sft/book.toml similarity index 100% rename from KT-SFT/book.toml rename to kt-sft/book.toml diff --git a/KT-SFT/csrc/custom_marlin/__init__.py b/kt-sft/csrc/custom_marlin/__init__.py similarity index 100% rename from KT-SFT/csrc/custom_marlin/__init__.py rename to kt-sft/csrc/custom_marlin/__init__.py diff --git a/KT-SFT/csrc/custom_marlin/binding.cpp b/kt-sft/csrc/custom_marlin/binding.cpp similarity index 100% rename from KT-SFT/csrc/custom_marlin/binding.cpp rename to kt-sft/csrc/custom_marlin/binding.cpp diff --git a/KT-SFT/csrc/custom_marlin/gptq_marlin/gptq_marlin.cu b/kt-sft/csrc/custom_marlin/gptq_marlin/gptq_marlin.cu similarity index 100% rename from KT-SFT/csrc/custom_marlin/gptq_marlin/gptq_marlin.cu rename to kt-sft/csrc/custom_marlin/gptq_marlin/gptq_marlin.cu diff --git a/KT-SFT/csrc/custom_marlin/gptq_marlin/gptq_marlin.cuh b/kt-sft/csrc/custom_marlin/gptq_marlin/gptq_marlin.cuh similarity index 100% rename from KT-SFT/csrc/custom_marlin/gptq_marlin/gptq_marlin.cuh rename to kt-sft/csrc/custom_marlin/gptq_marlin/gptq_marlin.cuh diff --git a/KT-SFT/csrc/custom_marlin/gptq_marlin/gptq_marlin_dtypes.cuh b/kt-sft/csrc/custom_marlin/gptq_marlin/gptq_marlin_dtypes.cuh similarity index 100% rename from KT-SFT/csrc/custom_marlin/gptq_marlin/gptq_marlin_dtypes.cuh rename to kt-sft/csrc/custom_marlin/gptq_marlin/gptq_marlin_dtypes.cuh diff --git a/KT-SFT/csrc/custom_marlin/gptq_marlin/gptq_marlin_repack.cu b/kt-sft/csrc/custom_marlin/gptq_marlin/gptq_marlin_repack.cu similarity index 100% rename from KT-SFT/csrc/custom_marlin/gptq_marlin/gptq_marlin_repack.cu rename to kt-sft/csrc/custom_marlin/gptq_marlin/gptq_marlin_repack.cu diff --git a/KT-SFT/csrc/custom_marlin/gptq_marlin/ops.h b/kt-sft/csrc/custom_marlin/gptq_marlin/ops.h similarity index 100% rename from KT-SFT/csrc/custom_marlin/gptq_marlin/ops.h rename to kt-sft/csrc/custom_marlin/gptq_marlin/ops.h diff --git a/KT-SFT/csrc/custom_marlin/setup.py b/kt-sft/csrc/custom_marlin/setup.py similarity index 100% rename from KT-SFT/csrc/custom_marlin/setup.py rename to kt-sft/csrc/custom_marlin/setup.py diff --git a/KT-SFT/csrc/custom_marlin/test_cuda_graph.py b/kt-sft/csrc/custom_marlin/test_cuda_graph.py similarity index 100% rename from KT-SFT/csrc/custom_marlin/test_cuda_graph.py rename to kt-sft/csrc/custom_marlin/test_cuda_graph.py diff --git a/KT-SFT/csrc/custom_marlin/utils/__init__.py b/kt-sft/csrc/custom_marlin/utils/__init__.py similarity index 100% rename from KT-SFT/csrc/custom_marlin/utils/__init__.py rename to kt-sft/csrc/custom_marlin/utils/__init__.py diff --git a/KT-SFT/csrc/custom_marlin/utils/format24.py b/kt-sft/csrc/custom_marlin/utils/format24.py similarity index 100% rename from KT-SFT/csrc/custom_marlin/utils/format24.py rename to kt-sft/csrc/custom_marlin/utils/format24.py diff --git a/KT-SFT/csrc/custom_marlin/utils/marlin_24_perms.py b/kt-sft/csrc/custom_marlin/utils/marlin_24_perms.py similarity index 100% rename from KT-SFT/csrc/custom_marlin/utils/marlin_24_perms.py rename to kt-sft/csrc/custom_marlin/utils/marlin_24_perms.py diff --git a/KT-SFT/csrc/custom_marlin/utils/marlin_perms.py b/kt-sft/csrc/custom_marlin/utils/marlin_perms.py similarity index 100% rename from KT-SFT/csrc/custom_marlin/utils/marlin_perms.py rename to kt-sft/csrc/custom_marlin/utils/marlin_perms.py diff --git a/KT-SFT/csrc/custom_marlin/utils/marlin_utils.py b/kt-sft/csrc/custom_marlin/utils/marlin_utils.py similarity index 100% rename from KT-SFT/csrc/custom_marlin/utils/marlin_utils.py rename to kt-sft/csrc/custom_marlin/utils/marlin_utils.py diff --git a/KT-SFT/csrc/custom_marlin/utils/quant_utils.py b/kt-sft/csrc/custom_marlin/utils/quant_utils.py similarity index 100% rename from KT-SFT/csrc/custom_marlin/utils/quant_utils.py rename to kt-sft/csrc/custom_marlin/utils/quant_utils.py diff --git a/KT-SFT/csrc/ktransformers_ext/CMakeLists.txt b/kt-sft/csrc/ktransformers_ext/CMakeLists.txt similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/CMakeLists.txt rename to kt-sft/csrc/ktransformers_ext/CMakeLists.txt diff --git a/KT-SFT/csrc/ktransformers_ext/bench/bench_attention.py b/kt-sft/csrc/ktransformers_ext/bench/bench_attention.py similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/bench/bench_attention.py rename to kt-sft/csrc/ktransformers_ext/bench/bench_attention.py diff --git a/KT-SFT/csrc/ktransformers_ext/bench/bench_attention_torch.py b/kt-sft/csrc/ktransformers_ext/bench/bench_attention_torch.py similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/bench/bench_attention_torch.py rename to kt-sft/csrc/ktransformers_ext/bench/bench_attention_torch.py diff --git a/KT-SFT/csrc/ktransformers_ext/bench/bench_linear.py b/kt-sft/csrc/ktransformers_ext/bench/bench_linear.py similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/bench/bench_linear.py rename to kt-sft/csrc/ktransformers_ext/bench/bench_linear.py diff --git a/KT-SFT/csrc/ktransformers_ext/bench/bench_linear_torch.py b/kt-sft/csrc/ktransformers_ext/bench/bench_linear_torch.py similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/bench/bench_linear_torch.py rename to kt-sft/csrc/ktransformers_ext/bench/bench_linear_torch.py diff --git a/KT-SFT/csrc/ktransformers_ext/bench/bench_mlp.py b/kt-sft/csrc/ktransformers_ext/bench/bench_mlp.py similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/bench/bench_mlp.py rename to kt-sft/csrc/ktransformers_ext/bench/bench_mlp.py diff --git a/KT-SFT/csrc/ktransformers_ext/bench/bench_mlp_torch.py b/kt-sft/csrc/ktransformers_ext/bench/bench_mlp_torch.py similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/bench/bench_mlp_torch.py rename to kt-sft/csrc/ktransformers_ext/bench/bench_mlp_torch.py diff --git a/KT-SFT/csrc/ktransformers_ext/bench/bench_moe.py b/kt-sft/csrc/ktransformers_ext/bench/bench_moe.py similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/bench/bench_moe.py rename to kt-sft/csrc/ktransformers_ext/bench/bench_moe.py diff --git a/KT-SFT/csrc/ktransformers_ext/bench/bench_moe_amx.py b/kt-sft/csrc/ktransformers_ext/bench/bench_moe_amx.py similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/bench/bench_moe_amx.py rename to kt-sft/csrc/ktransformers_ext/bench/bench_moe_amx.py diff --git a/KT-SFT/csrc/ktransformers_ext/bench/bench_moe_torch.py b/kt-sft/csrc/ktransformers_ext/bench/bench_moe_torch.py similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/bench/bench_moe_torch.py rename to kt-sft/csrc/ktransformers_ext/bench/bench_moe_torch.py diff --git a/KT-SFT/csrc/ktransformers_ext/cmake/FindSIMD.cmake b/kt-sft/csrc/ktransformers_ext/cmake/FindSIMD.cmake similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/cmake/FindSIMD.cmake rename to kt-sft/csrc/ktransformers_ext/cmake/FindSIMD.cmake diff --git a/KT-SFT/csrc/ktransformers_ext/cpu_backend/backend.cpp b/kt-sft/csrc/ktransformers_ext/cpu_backend/backend.cpp similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/cpu_backend/backend.cpp rename to kt-sft/csrc/ktransformers_ext/cpu_backend/backend.cpp diff --git a/KT-SFT/csrc/ktransformers_ext/cpu_backend/backend.h b/kt-sft/csrc/ktransformers_ext/cpu_backend/backend.h similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/cpu_backend/backend.h rename to kt-sft/csrc/ktransformers_ext/cpu_backend/backend.h diff --git a/KT-SFT/csrc/ktransformers_ext/cpu_backend/cpuinfer.h b/kt-sft/csrc/ktransformers_ext/cpu_backend/cpuinfer.h similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/cpu_backend/cpuinfer.h rename to kt-sft/csrc/ktransformers_ext/cpu_backend/cpuinfer.h diff --git a/KT-SFT/csrc/ktransformers_ext/cpu_backend/shared_mem_buffer.cpp b/kt-sft/csrc/ktransformers_ext/cpu_backend/shared_mem_buffer.cpp similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/cpu_backend/shared_mem_buffer.cpp rename to kt-sft/csrc/ktransformers_ext/cpu_backend/shared_mem_buffer.cpp diff --git a/KT-SFT/csrc/ktransformers_ext/cpu_backend/shared_mem_buffer.h b/kt-sft/csrc/ktransformers_ext/cpu_backend/shared_mem_buffer.h similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/cpu_backend/shared_mem_buffer.h rename to kt-sft/csrc/ktransformers_ext/cpu_backend/shared_mem_buffer.h diff --git a/KT-SFT/csrc/ktransformers_ext/cpu_backend/task_queue.cpp b/kt-sft/csrc/ktransformers_ext/cpu_backend/task_queue.cpp similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/cpu_backend/task_queue.cpp rename to kt-sft/csrc/ktransformers_ext/cpu_backend/task_queue.cpp diff --git a/KT-SFT/csrc/ktransformers_ext/cpu_backend/task_queue.h b/kt-sft/csrc/ktransformers_ext/cpu_backend/task_queue.h similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/cpu_backend/task_queue.h rename to kt-sft/csrc/ktransformers_ext/cpu_backend/task_queue.h diff --git a/KT-SFT/csrc/ktransformers_ext/cpu_backend/vendors/README.md b/kt-sft/csrc/ktransformers_ext/cpu_backend/vendors/README.md similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/cpu_backend/vendors/README.md rename to kt-sft/csrc/ktransformers_ext/cpu_backend/vendors/README.md diff --git a/KT-SFT/csrc/ktransformers_ext/cpu_backend/vendors/cuda.h b/kt-sft/csrc/ktransformers_ext/cpu_backend/vendors/cuda.h similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/cpu_backend/vendors/cuda.h rename to kt-sft/csrc/ktransformers_ext/cpu_backend/vendors/cuda.h diff --git a/KT-SFT/csrc/ktransformers_ext/cpu_backend/vendors/hip.h b/kt-sft/csrc/ktransformers_ext/cpu_backend/vendors/hip.h similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/cpu_backend/vendors/hip.h rename to kt-sft/csrc/ktransformers_ext/cpu_backend/vendors/hip.h diff --git a/KT-SFT/csrc/ktransformers_ext/cpu_backend/vendors/musa.h b/kt-sft/csrc/ktransformers_ext/cpu_backend/vendors/musa.h similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/cpu_backend/vendors/musa.h rename to kt-sft/csrc/ktransformers_ext/cpu_backend/vendors/musa.h diff --git a/KT-SFT/csrc/ktransformers_ext/cpu_backend/vendors/vendor.h b/kt-sft/csrc/ktransformers_ext/cpu_backend/vendors/vendor.h similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/cpu_backend/vendors/vendor.h rename to kt-sft/csrc/ktransformers_ext/cpu_backend/vendors/vendor.h diff --git a/KT-SFT/csrc/ktransformers_ext/cuda/binding.cpp b/kt-sft/csrc/ktransformers_ext/cuda/binding.cpp similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/cuda/binding.cpp rename to kt-sft/csrc/ktransformers_ext/cuda/binding.cpp diff --git a/KT-SFT/csrc/ktransformers_ext/cuda/custom_gguf/dequant.cu b/kt-sft/csrc/ktransformers_ext/cuda/custom_gguf/dequant.cu similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/cuda/custom_gguf/dequant.cu rename to kt-sft/csrc/ktransformers_ext/cuda/custom_gguf/dequant.cu diff --git a/KT-SFT/csrc/ktransformers_ext/cuda/custom_gguf/ops.h b/kt-sft/csrc/ktransformers_ext/cuda/custom_gguf/ops.h similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/cuda/custom_gguf/ops.h rename to kt-sft/csrc/ktransformers_ext/cuda/custom_gguf/ops.h diff --git a/KT-SFT/csrc/ktransformers_ext/cuda/gptq_marlin/gptq_marlin.cu b/kt-sft/csrc/ktransformers_ext/cuda/gptq_marlin/gptq_marlin.cu similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/cuda/gptq_marlin/gptq_marlin.cu rename to kt-sft/csrc/ktransformers_ext/cuda/gptq_marlin/gptq_marlin.cu diff --git a/KT-SFT/csrc/ktransformers_ext/cuda/gptq_marlin/gptq_marlin.cuh b/kt-sft/csrc/ktransformers_ext/cuda/gptq_marlin/gptq_marlin.cuh similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/cuda/gptq_marlin/gptq_marlin.cuh rename to kt-sft/csrc/ktransformers_ext/cuda/gptq_marlin/gptq_marlin.cuh diff --git a/KT-SFT/csrc/ktransformers_ext/cuda/gptq_marlin/gptq_marlin_dtypes.cuh b/kt-sft/csrc/ktransformers_ext/cuda/gptq_marlin/gptq_marlin_dtypes.cuh similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/cuda/gptq_marlin/gptq_marlin_dtypes.cuh rename to kt-sft/csrc/ktransformers_ext/cuda/gptq_marlin/gptq_marlin_dtypes.cuh diff --git a/KT-SFT/csrc/ktransformers_ext/cuda/gptq_marlin/ops.h b/kt-sft/csrc/ktransformers_ext/cuda/gptq_marlin/ops.h similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/cuda/gptq_marlin/ops.h rename to kt-sft/csrc/ktransformers_ext/cuda/gptq_marlin/ops.h diff --git a/KT-SFT/csrc/ktransformers_ext/cuda/setup.py b/kt-sft/csrc/ktransformers_ext/cuda/setup.py similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/cuda/setup.py rename to kt-sft/csrc/ktransformers_ext/cuda/setup.py diff --git a/KT-SFT/csrc/ktransformers_ext/cuda/test_dequant.py b/kt-sft/csrc/ktransformers_ext/cuda/test_dequant.py similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/cuda/test_dequant.py rename to kt-sft/csrc/ktransformers_ext/cuda/test_dequant.py diff --git a/KT-SFT/csrc/ktransformers_ext/examples/test_attention.py b/kt-sft/csrc/ktransformers_ext/examples/test_attention.py similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/examples/test_attention.py rename to kt-sft/csrc/ktransformers_ext/examples/test_attention.py diff --git a/KT-SFT/csrc/ktransformers_ext/examples/test_linear.py b/kt-sft/csrc/ktransformers_ext/examples/test_linear.py similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/examples/test_linear.py rename to kt-sft/csrc/ktransformers_ext/examples/test_linear.py diff --git a/KT-SFT/csrc/ktransformers_ext/examples/test_mlp.py b/kt-sft/csrc/ktransformers_ext/examples/test_mlp.py similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/examples/test_mlp.py rename to kt-sft/csrc/ktransformers_ext/examples/test_mlp.py diff --git a/KT-SFT/csrc/ktransformers_ext/examples/test_moe.py b/kt-sft/csrc/ktransformers_ext/examples/test_moe.py similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/examples/test_moe.py rename to kt-sft/csrc/ktransformers_ext/examples/test_moe.py diff --git a/KT-SFT/csrc/ktransformers_ext/examples/test_sft_amx_moe.py b/kt-sft/csrc/ktransformers_ext/examples/test_sft_amx_moe.py similarity index 98% rename from KT-SFT/csrc/ktransformers_ext/examples/test_sft_amx_moe.py rename to kt-sft/csrc/ktransformers_ext/examples/test_sft_amx_moe.py index 3d541853..d59be12f 100644 --- a/KT-SFT/csrc/ktransformers_ext/examples/test_sft_amx_moe.py +++ b/kt-sft/csrc/ktransformers_ext/examples/test_sft_amx_moe.py @@ -35,7 +35,7 @@ gradtype = torch.bfloat16 # torch.backends.cuda.matmul.allow_tf32 = False import shutil -folder_path = "/home/lpl/KT-SFT/debug" +folder_path = "/home/lpl/kt-sft/debug" if os.path.exists(folder_path): shutil.rmtree(folder_path) os.makedirs(folder_path) @@ -650,13 +650,13 @@ def manual_check(experts_ids): down_ba_ori = get_tensor(f"cpp_layer0_E_End{experts_idx}_down_ba_ori_", (expert_token_counts[experts_idx], intermediate_size)) - # with open(f"/home/lpl/KT-SFT/debug/cpp_{experts_idx}_down_ba_ori_view.txt", "w") as f: + # with open(f"/home/lpl/kt-sft/debug/cpp_{experts_idx}_down_ba_ori_view.txt", "w") as f: # f.write(str(down_ba_ori)) down_output_grad = get_tensor(f"cpp_layer0_E_End{experts_idx}_down_output_grad_", (expert_token_counts[experts_idx], hidden_size)) - # with open(f"/home/lpl/KT-SFT/debug/cpp_{experts_idx}_down_t_ba_ori_view.txt", "w") as f: + # with open(f"/home/lpl/kt-sft/debug/cpp_{experts_idx}_down_t_ba_ori_view.txt", "w") as f: # f.write(str(down_output_grad)) @@ -674,10 +674,10 @@ def manual_check(experts_ids): py_down_t_ba = torch.load(f"debug/py_layer0_E_End{experts_idx}_down_output_grad_.pt") py_down_ba = torch.load(f"debug/py_layer0_E_End{experts_idx}_gate_output_.pt") - # with open(f"/home/lpl/KT-SFT/debug/py_{experts_idx}_down_t_ba_ori_view.txt", "w") as f: + # with open(f"/home/lpl/kt-sft/debug/py_{experts_idx}_down_t_ba_ori_view.txt", "w") as f: # f.write(str(py_down_t_ba)) - # with open(f"/home/lpl/KT-SFT/debug/py_{experts_idx}_down_ba_ori_view.txt", "w") as f: + # with open(f"/home/lpl/kt-sft/debug/py_{experts_idx}_down_ba_ori_view.txt", "w") as f: # f.write(str(py_down_ba)) print(f"cpp_{experts_idx}_down_ba_ori_:{down_ba_ori}") diff --git a/KT-SFT/csrc/ktransformers_ext/examples/test_sft_moe.py b/kt-sft/csrc/ktransformers_ext/examples/test_sft_moe.py similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/examples/test_sft_moe.py rename to kt-sft/csrc/ktransformers_ext/examples/test_sft_moe.py diff --git a/KT-SFT/csrc/ktransformers_ext/ext_bindings.cpp b/kt-sft/csrc/ktransformers_ext/ext_bindings.cpp similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/ext_bindings.cpp rename to kt-sft/csrc/ktransformers_ext/ext_bindings.cpp diff --git a/KT-SFT/csrc/ktransformers_ext/operators/amx/debug_sft_moe.hpp b/kt-sft/csrc/ktransformers_ext/operators/amx/debug_sft_moe.hpp similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/operators/amx/debug_sft_moe.hpp rename to kt-sft/csrc/ktransformers_ext/operators/amx/debug_sft_moe.hpp diff --git a/KT-SFT/csrc/ktransformers_ext/operators/amx/debug_tools_sft_moe.hpp b/kt-sft/csrc/ktransformers_ext/operators/amx/debug_tools_sft_moe.hpp similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/operators/amx/debug_tools_sft_moe.hpp rename to kt-sft/csrc/ktransformers_ext/operators/amx/debug_tools_sft_moe.hpp diff --git a/KT-SFT/csrc/ktransformers_ext/operators/amx/la/amx.hpp b/kt-sft/csrc/ktransformers_ext/operators/amx/la/amx.hpp similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/operators/amx/la/amx.hpp rename to kt-sft/csrc/ktransformers_ext/operators/amx/la/amx.hpp diff --git a/KT-SFT/csrc/ktransformers_ext/operators/amx/la/utils.hpp b/kt-sft/csrc/ktransformers_ext/operators/amx/la/utils.hpp similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/operators/amx/la/utils.hpp rename to kt-sft/csrc/ktransformers_ext/operators/amx/la/utils.hpp diff --git a/KT-SFT/csrc/ktransformers_ext/operators/amx/moe.hpp b/kt-sft/csrc/ktransformers_ext/operators/amx/moe.hpp similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/operators/amx/moe.hpp rename to kt-sft/csrc/ktransformers_ext/operators/amx/moe.hpp diff --git a/KT-SFT/csrc/ktransformers_ext/operators/amx/sft_moe.hpp b/kt-sft/csrc/ktransformers_ext/operators/amx/sft_moe.hpp similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/operators/amx/sft_moe.hpp rename to kt-sft/csrc/ktransformers_ext/operators/amx/sft_moe.hpp diff --git a/KT-SFT/csrc/ktransformers_ext/operators/kvcache/kvcache.h b/kt-sft/csrc/ktransformers_ext/operators/kvcache/kvcache.h similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/operators/kvcache/kvcache.h rename to kt-sft/csrc/ktransformers_ext/operators/kvcache/kvcache.h diff --git a/KT-SFT/csrc/ktransformers_ext/operators/kvcache/kvcache_attn.cpp b/kt-sft/csrc/ktransformers_ext/operators/kvcache/kvcache_attn.cpp similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/operators/kvcache/kvcache_attn.cpp rename to kt-sft/csrc/ktransformers_ext/operators/kvcache/kvcache_attn.cpp diff --git a/KT-SFT/csrc/ktransformers_ext/operators/kvcache/kvcache_load_dump.cpp b/kt-sft/csrc/ktransformers_ext/operators/kvcache/kvcache_load_dump.cpp similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/operators/kvcache/kvcache_load_dump.cpp rename to kt-sft/csrc/ktransformers_ext/operators/kvcache/kvcache_load_dump.cpp diff --git a/KT-SFT/csrc/ktransformers_ext/operators/kvcache/kvcache_read_write.cpp b/kt-sft/csrc/ktransformers_ext/operators/kvcache/kvcache_read_write.cpp similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/operators/kvcache/kvcache_read_write.cpp rename to kt-sft/csrc/ktransformers_ext/operators/kvcache/kvcache_read_write.cpp diff --git a/KT-SFT/csrc/ktransformers_ext/operators/kvcache/kvcache_utils.cpp b/kt-sft/csrc/ktransformers_ext/operators/kvcache/kvcache_utils.cpp similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/operators/kvcache/kvcache_utils.cpp rename to kt-sft/csrc/ktransformers_ext/operators/kvcache/kvcache_utils.cpp diff --git a/KT-SFT/csrc/ktransformers_ext/operators/llamafile/conversion.h b/kt-sft/csrc/ktransformers_ext/operators/llamafile/conversion.h similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/operators/llamafile/conversion.h rename to kt-sft/csrc/ktransformers_ext/operators/llamafile/conversion.h diff --git a/KT-SFT/csrc/ktransformers_ext/operators/llamafile/linear.cpp b/kt-sft/csrc/ktransformers_ext/operators/llamafile/linear.cpp similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/operators/llamafile/linear.cpp rename to kt-sft/csrc/ktransformers_ext/operators/llamafile/linear.cpp diff --git a/KT-SFT/csrc/ktransformers_ext/operators/llamafile/linear.h b/kt-sft/csrc/ktransformers_ext/operators/llamafile/linear.h similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/operators/llamafile/linear.h rename to kt-sft/csrc/ktransformers_ext/operators/llamafile/linear.h diff --git a/KT-SFT/csrc/ktransformers_ext/operators/llamafile/mlp.cpp b/kt-sft/csrc/ktransformers_ext/operators/llamafile/mlp.cpp similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/operators/llamafile/mlp.cpp rename to kt-sft/csrc/ktransformers_ext/operators/llamafile/mlp.cpp diff --git a/KT-SFT/csrc/ktransformers_ext/operators/llamafile/mlp.h b/kt-sft/csrc/ktransformers_ext/operators/llamafile/mlp.h similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/operators/llamafile/mlp.h rename to kt-sft/csrc/ktransformers_ext/operators/llamafile/mlp.h diff --git a/KT-SFT/csrc/ktransformers_ext/operators/llamafile/moe.cpp b/kt-sft/csrc/ktransformers_ext/operators/llamafile/moe.cpp similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/operators/llamafile/moe.cpp rename to kt-sft/csrc/ktransformers_ext/operators/llamafile/moe.cpp diff --git a/KT-SFT/csrc/ktransformers_ext/operators/llamafile/moe.h b/kt-sft/csrc/ktransformers_ext/operators/llamafile/moe.h similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/operators/llamafile/moe.h rename to kt-sft/csrc/ktransformers_ext/operators/llamafile/moe.h diff --git a/KT-SFT/csrc/ktransformers_ext/operators/llamafile/sft_moe.cpp b/kt-sft/csrc/ktransformers_ext/operators/llamafile/sft_moe.cpp similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/operators/llamafile/sft_moe.cpp rename to kt-sft/csrc/ktransformers_ext/operators/llamafile/sft_moe.cpp diff --git a/KT-SFT/csrc/ktransformers_ext/operators/llamafile/sft_moe.h b/kt-sft/csrc/ktransformers_ext/operators/llamafile/sft_moe.h similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/operators/llamafile/sft_moe.h rename to kt-sft/csrc/ktransformers_ext/operators/llamafile/sft_moe.h diff --git a/KT-SFT/csrc/ktransformers_ext/operators/llamafile/sft_moe_forward_cache.h b/kt-sft/csrc/ktransformers_ext/operators/llamafile/sft_moe_forward_cache.h similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/operators/llamafile/sft_moe_forward_cache.h rename to kt-sft/csrc/ktransformers_ext/operators/llamafile/sft_moe_forward_cache.h diff --git a/KT-SFT/csrc/ktransformers_ext/vendors/cuda.h b/kt-sft/csrc/ktransformers_ext/vendors/cuda.h similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/vendors/cuda.h rename to kt-sft/csrc/ktransformers_ext/vendors/cuda.h diff --git a/KT-SFT/csrc/ktransformers_ext/vendors/hip.h b/kt-sft/csrc/ktransformers_ext/vendors/hip.h similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/vendors/hip.h rename to kt-sft/csrc/ktransformers_ext/vendors/hip.h diff --git a/KT-SFT/csrc/ktransformers_ext/vendors/musa.h b/kt-sft/csrc/ktransformers_ext/vendors/musa.h similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/vendors/musa.h rename to kt-sft/csrc/ktransformers_ext/vendors/musa.h diff --git a/KT-SFT/csrc/ktransformers_ext/vendors/vendor.h b/kt-sft/csrc/ktransformers_ext/vendors/vendor.h similarity index 100% rename from KT-SFT/csrc/ktransformers_ext/vendors/vendor.h rename to kt-sft/csrc/ktransformers_ext/vendors/vendor.h diff --git a/KT-SFT/install-with-cache.sh b/kt-sft/install-with-cache.sh similarity index 100% rename from KT-SFT/install-with-cache.sh rename to kt-sft/install-with-cache.sh diff --git a/KT-SFT/install.bat b/kt-sft/install.bat similarity index 100% rename from KT-SFT/install.bat rename to kt-sft/install.bat diff --git a/KT-SFT/install.sh b/kt-sft/install.sh similarity index 100% rename from KT-SFT/install.sh rename to kt-sft/install.sh diff --git a/KT-SFT/ktransformers/__init__.py b/kt-sft/ktransformers/__init__.py similarity index 100% rename from KT-SFT/ktransformers/__init__.py rename to kt-sft/ktransformers/__init__.py diff --git a/KT-SFT/ktransformers/configs/config.yaml b/kt-sft/ktransformers/configs/config.yaml similarity index 100% rename from KT-SFT/ktransformers/configs/config.yaml rename to kt-sft/ktransformers/configs/config.yaml diff --git a/KT-SFT/ktransformers/configs/log_config.ini b/kt-sft/ktransformers/configs/log_config.ini similarity index 100% rename from KT-SFT/ktransformers/configs/log_config.ini rename to kt-sft/ktransformers/configs/log_config.ini diff --git a/KT-SFT/ktransformers/configs/model_config/config.json b/kt-sft/ktransformers/configs/model_config/config.json similarity index 100% rename from KT-SFT/ktransformers/configs/model_config/config.json rename to kt-sft/ktransformers/configs/model_config/config.json diff --git a/KT-SFT/ktransformers/configs/model_config/configuration_deepseek.py b/kt-sft/ktransformers/configs/model_config/configuration_deepseek.py similarity index 100% rename from KT-SFT/ktransformers/configs/model_config/configuration_deepseek.py rename to kt-sft/ktransformers/configs/model_config/configuration_deepseek.py diff --git a/KT-SFT/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/__init__.py b/kt-sft/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/__init__.py similarity index 100% rename from KT-SFT/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/__init__.py rename to kt-sft/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/__init__.py diff --git a/KT-SFT/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/format_24.py b/kt-sft/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/format_24.py similarity index 100% rename from KT-SFT/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/format_24.py rename to kt-sft/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/format_24.py diff --git a/KT-SFT/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/marlin_24_perms.py b/kt-sft/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/marlin_24_perms.py similarity index 100% rename from KT-SFT/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/marlin_24_perms.py rename to kt-sft/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/marlin_24_perms.py diff --git a/KT-SFT/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/marlin_perms.py b/kt-sft/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/marlin_perms.py similarity index 100% rename from KT-SFT/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/marlin_perms.py rename to kt-sft/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/marlin_perms.py diff --git a/KT-SFT/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/marlin_utils.py b/kt-sft/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/marlin_utils.py similarity index 100% rename from KT-SFT/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/marlin_utils.py rename to kt-sft/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/marlin_utils.py diff --git a/KT-SFT/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/quant_utils.py b/kt-sft/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/quant_utils.py similarity index 100% rename from KT-SFT/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/quant_utils.py rename to kt-sft/ktransformers/ktransformers_ext/operators/custom_marlin/quantize/utils/quant_utils.py diff --git a/KT-SFT/ktransformers/ktransformers_ext/triton/fp8gemm.py b/kt-sft/ktransformers/ktransformers_ext/triton/fp8gemm.py similarity index 100% rename from KT-SFT/ktransformers/ktransformers_ext/triton/fp8gemm.py rename to kt-sft/ktransformers/ktransformers_ext/triton/fp8gemm.py diff --git a/KT-SFT/ktransformers/local_chat.py b/kt-sft/ktransformers/local_chat.py similarity index 100% rename from KT-SFT/ktransformers/local_chat.py rename to kt-sft/ktransformers/local_chat.py diff --git a/KT-SFT/ktransformers/local_chat.sh b/kt-sft/ktransformers/local_chat.sh similarity index 100% rename from KT-SFT/ktransformers/local_chat.sh rename to kt-sft/ktransformers/local_chat.sh diff --git a/KT-SFT/ktransformers/lora_test_module.py b/kt-sft/ktransformers/lora_test_module.py similarity index 100% rename from KT-SFT/ktransformers/lora_test_module.py rename to kt-sft/ktransformers/lora_test_module.py diff --git a/KT-SFT/ktransformers/models/__init__.py b/kt-sft/ktransformers/models/__init__.py similarity index 100% rename from KT-SFT/ktransformers/models/__init__.py rename to kt-sft/ktransformers/models/__init__.py diff --git a/KT-SFT/ktransformers/models/configuration_deepseek.py b/kt-sft/ktransformers/models/configuration_deepseek.py similarity index 100% rename from KT-SFT/ktransformers/models/configuration_deepseek.py rename to kt-sft/ktransformers/models/configuration_deepseek.py diff --git a/KT-SFT/ktransformers/models/configuration_deepseek_v3.py b/kt-sft/ktransformers/models/configuration_deepseek_v3.py similarity index 100% rename from KT-SFT/ktransformers/models/configuration_deepseek_v3.py rename to kt-sft/ktransformers/models/configuration_deepseek_v3.py diff --git a/KT-SFT/ktransformers/models/configuration_llama.py b/kt-sft/ktransformers/models/configuration_llama.py similarity index 100% rename from KT-SFT/ktransformers/models/configuration_llama.py rename to kt-sft/ktransformers/models/configuration_llama.py diff --git a/KT-SFT/ktransformers/models/configuration_qwen2_moe.py b/kt-sft/ktransformers/models/configuration_qwen2_moe.py similarity index 100% rename from KT-SFT/ktransformers/models/configuration_qwen2_moe.py rename to kt-sft/ktransformers/models/configuration_qwen2_moe.py diff --git a/KT-SFT/ktransformers/models/configuration_qwen3_moe.py b/kt-sft/ktransformers/models/configuration_qwen3_moe.py similarity index 100% rename from KT-SFT/ktransformers/models/configuration_qwen3_moe.py rename to kt-sft/ktransformers/models/configuration_qwen3_moe.py diff --git a/KT-SFT/ktransformers/models/custom_cache.py b/kt-sft/ktransformers/models/custom_cache.py similarity index 100% rename from KT-SFT/ktransformers/models/custom_cache.py rename to kt-sft/ktransformers/models/custom_cache.py diff --git a/KT-SFT/ktransformers/models/custom_modeling_deepseek_v2.py b/kt-sft/ktransformers/models/custom_modeling_deepseek_v2.py similarity index 100% rename from KT-SFT/ktransformers/models/custom_modeling_deepseek_v2.py rename to kt-sft/ktransformers/models/custom_modeling_deepseek_v2.py diff --git a/KT-SFT/ktransformers/models/custom_modeling_deepseek_v3.py b/kt-sft/ktransformers/models/custom_modeling_deepseek_v3.py similarity index 100% rename from KT-SFT/ktransformers/models/custom_modeling_deepseek_v3.py rename to kt-sft/ktransformers/models/custom_modeling_deepseek_v3.py diff --git a/KT-SFT/ktransformers/models/custom_modeling_qwen2_moe.py b/kt-sft/ktransformers/models/custom_modeling_qwen2_moe.py similarity index 100% rename from KT-SFT/ktransformers/models/custom_modeling_qwen2_moe.py rename to kt-sft/ktransformers/models/custom_modeling_qwen2_moe.py diff --git a/KT-SFT/ktransformers/models/custom_modeling_qwen3_moe.py b/kt-sft/ktransformers/models/custom_modeling_qwen3_moe.py similarity index 100% rename from KT-SFT/ktransformers/models/custom_modeling_qwen3_moe.py rename to kt-sft/ktransformers/models/custom_modeling_qwen3_moe.py diff --git a/KT-SFT/ktransformers/models/modeling_deepseek.py b/kt-sft/ktransformers/models/modeling_deepseek.py similarity index 100% rename from KT-SFT/ktransformers/models/modeling_deepseek.py rename to kt-sft/ktransformers/models/modeling_deepseek.py diff --git a/KT-SFT/ktransformers/models/modeling_deepseek_v3.py b/kt-sft/ktransformers/models/modeling_deepseek_v3.py similarity index 100% rename from KT-SFT/ktransformers/models/modeling_deepseek_v3.py rename to kt-sft/ktransformers/models/modeling_deepseek_v3.py diff --git a/KT-SFT/ktransformers/models/modeling_llama.py b/kt-sft/ktransformers/models/modeling_llama.py similarity index 100% rename from KT-SFT/ktransformers/models/modeling_llama.py rename to kt-sft/ktransformers/models/modeling_llama.py diff --git a/KT-SFT/ktransformers/models/modeling_mixtral.py b/kt-sft/ktransformers/models/modeling_mixtral.py similarity index 100% rename from KT-SFT/ktransformers/models/modeling_mixtral.py rename to kt-sft/ktransformers/models/modeling_mixtral.py diff --git a/KT-SFT/ktransformers/models/modeling_qwen2_moe.py b/kt-sft/ktransformers/models/modeling_qwen2_moe.py similarity index 100% rename from KT-SFT/ktransformers/models/modeling_qwen2_moe.py rename to kt-sft/ktransformers/models/modeling_qwen2_moe.py diff --git a/KT-SFT/ktransformers/models/modeling_qwen3_moe.py b/kt-sft/ktransformers/models/modeling_qwen3_moe.py similarity index 100% rename from KT-SFT/ktransformers/models/modeling_qwen3_moe.py rename to kt-sft/ktransformers/models/modeling_qwen3_moe.py diff --git a/KT-SFT/ktransformers/moe_test_module.py b/kt-sft/ktransformers/moe_test_module.py similarity index 100% rename from KT-SFT/ktransformers/moe_test_module.py rename to kt-sft/ktransformers/moe_test_module.py diff --git a/KT-SFT/ktransformers/moe_test_module_old.py b/kt-sft/ktransformers/moe_test_module_old.py similarity index 100% rename from KT-SFT/ktransformers/moe_test_module_old.py rename to kt-sft/ktransformers/moe_test_module_old.py diff --git a/KT-SFT/ktransformers/operators/RoPE.py b/kt-sft/ktransformers/operators/RoPE.py similarity index 100% rename from KT-SFT/ktransformers/operators/RoPE.py rename to kt-sft/ktransformers/operators/RoPE.py diff --git a/KT-SFT/ktransformers/operators/__init__.py b/kt-sft/ktransformers/operators/__init__.py similarity index 100% rename from KT-SFT/ktransformers/operators/__init__.py rename to kt-sft/ktransformers/operators/__init__.py diff --git a/KT-SFT/ktransformers/operators/attention.py b/kt-sft/ktransformers/operators/attention.py similarity index 100% rename from KT-SFT/ktransformers/operators/attention.py rename to kt-sft/ktransformers/operators/attention.py diff --git a/KT-SFT/ktransformers/operators/balance_serve_attention.py b/kt-sft/ktransformers/operators/balance_serve_attention.py similarity index 100% rename from KT-SFT/ktransformers/operators/balance_serve_attention.py rename to kt-sft/ktransformers/operators/balance_serve_attention.py diff --git a/KT-SFT/ktransformers/operators/base_operator.py b/kt-sft/ktransformers/operators/base_operator.py similarity index 100% rename from KT-SFT/ktransformers/operators/base_operator.py rename to kt-sft/ktransformers/operators/base_operator.py diff --git a/KT-SFT/ktransformers/operators/cpuinfer.py b/kt-sft/ktransformers/operators/cpuinfer.py similarity index 100% rename from KT-SFT/ktransformers/operators/cpuinfer.py rename to kt-sft/ktransformers/operators/cpuinfer.py diff --git a/KT-SFT/ktransformers/operators/dynamic_attention.py b/kt-sft/ktransformers/operators/dynamic_attention.py similarity index 100% rename from KT-SFT/ktransformers/operators/dynamic_attention.py rename to kt-sft/ktransformers/operators/dynamic_attention.py diff --git a/KT-SFT/ktransformers/operators/experts.py b/kt-sft/ktransformers/operators/experts.py similarity index 100% rename from KT-SFT/ktransformers/operators/experts.py rename to kt-sft/ktransformers/operators/experts.py diff --git a/KT-SFT/ktransformers/operators/flashinfer_batch_prefill_wrapper.py b/kt-sft/ktransformers/operators/flashinfer_batch_prefill_wrapper.py similarity index 100% rename from KT-SFT/ktransformers/operators/flashinfer_batch_prefill_wrapper.py rename to kt-sft/ktransformers/operators/flashinfer_batch_prefill_wrapper.py diff --git a/KT-SFT/ktransformers/operators/flashinfer_wrapper.py b/kt-sft/ktransformers/operators/flashinfer_wrapper.py similarity index 100% rename from KT-SFT/ktransformers/operators/flashinfer_wrapper.py rename to kt-sft/ktransformers/operators/flashinfer_wrapper.py diff --git a/KT-SFT/ktransformers/operators/gate.py b/kt-sft/ktransformers/operators/gate.py similarity index 100% rename from KT-SFT/ktransformers/operators/gate.py rename to kt-sft/ktransformers/operators/gate.py diff --git a/KT-SFT/ktransformers/operators/layernorm.py b/kt-sft/ktransformers/operators/layernorm.py similarity index 100% rename from KT-SFT/ktransformers/operators/layernorm.py rename to kt-sft/ktransformers/operators/layernorm.py diff --git a/KT-SFT/ktransformers/operators/linear.py b/kt-sft/ktransformers/operators/linear.py similarity index 100% rename from KT-SFT/ktransformers/operators/linear.py rename to kt-sft/ktransformers/operators/linear.py diff --git a/KT-SFT/ktransformers/operators/mlp.py b/kt-sft/ktransformers/operators/mlp.py similarity index 100% rename from KT-SFT/ktransformers/operators/mlp.py rename to kt-sft/ktransformers/operators/mlp.py diff --git a/KT-SFT/ktransformers/operators/models.py b/kt-sft/ktransformers/operators/models.py similarity index 100% rename from KT-SFT/ktransformers/operators/models.py rename to kt-sft/ktransformers/operators/models.py diff --git a/KT-SFT/ktransformers/operators/triton_attention.py b/kt-sft/ktransformers/operators/triton_attention.py similarity index 100% rename from KT-SFT/ktransformers/operators/triton_attention.py rename to kt-sft/ktransformers/operators/triton_attention.py diff --git a/KT-SFT/ktransformers/operators/triton_attention_prefill.py b/kt-sft/ktransformers/operators/triton_attention_prefill.py similarity index 100% rename from KT-SFT/ktransformers/operators/triton_attention_prefill.py rename to kt-sft/ktransformers/operators/triton_attention_prefill.py diff --git a/KT-SFT/ktransformers/optimize/optimize.py b/kt-sft/ktransformers/optimize/optimize.py similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize.py rename to kt-sft/ktransformers/optimize/optimize.py diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V2-Chat-multi-gpu-4.yaml b/kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V2-Chat-multi-gpu-4.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V2-Chat-multi-gpu-4.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V2-Chat-multi-gpu-4.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V2-Chat-multi-gpu.yaml b/kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V2-Chat-multi-gpu.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V2-Chat-multi-gpu.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V2-Chat-multi-gpu.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V2-Chat-sft-amx.yaml b/kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V2-Chat-sft-amx.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V2-Chat-sft-amx.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V2-Chat-sft-amx.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V2-Chat.yaml b/kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V2-Chat.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V2-Chat.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V2-Chat.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat-multi-gpu.yaml b/kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat-multi-gpu.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat-multi-gpu.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat-multi-gpu.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat-sft-amx-multi-gpu.yaml b/kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat-sft-amx-multi-gpu.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat-sft-amx-multi-gpu.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat-sft-amx-multi-gpu.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat-sft-amx.yaml b/kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat-sft-amx.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat-sft-amx.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat-sft-amx.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat-sft.yaml b/kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat-sft.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat-sft.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat-sft.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat-use-adapter.yaml b/kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat-use-adapter.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat-use-adapter.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat-use-adapter.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat.yaml b/kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V2-Lite-Chat.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-amx.yaml b/kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-amx.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-amx.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-amx.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-fp8-linear-ggml-experts-serve-amx.yaml b/kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-fp8-linear-ggml-experts-serve-amx.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-fp8-linear-ggml-experts-serve-amx.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-fp8-linear-ggml-experts-serve-amx.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-fp8-linear-ggml-experts-serve.yaml b/kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-fp8-linear-ggml-experts-serve.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-fp8-linear-ggml-experts-serve.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-fp8-linear-ggml-experts-serve.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-fp8-linear-ggml-experts.yaml b/kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-fp8-linear-ggml-experts.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-fp8-linear-ggml-experts.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-fp8-linear-ggml-experts.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-multi-gpu-4.yaml b/kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-multi-gpu-4.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-multi-gpu-4.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-multi-gpu-4.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-multi-gpu-8.yaml b/kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-multi-gpu-8.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-multi-gpu-8.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-multi-gpu-8.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-multi-gpu-fp8-linear-ggml-experts.yaml b/kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-multi-gpu-fp8-linear-ggml-experts.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-multi-gpu-fp8-linear-ggml-experts.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-multi-gpu-fp8-linear-ggml-experts.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-multi-gpu-marlin.yaml b/kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-multi-gpu-marlin.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-multi-gpu-marlin.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-multi-gpu-marlin.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-multi-gpu.yaml b/kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-multi-gpu.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-multi-gpu.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-multi-gpu.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-serve.yaml b/kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-serve.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-serve.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-serve.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-sft-amx-multi-gpu-4.yaml b/kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-sft-amx-multi-gpu-4.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-sft-amx-multi-gpu-4.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-sft-amx-multi-gpu-4.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-sft-amx-multi-gpu.yaml b/kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-sft-amx-multi-gpu.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-sft-amx-multi-gpu.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-sft-amx-multi-gpu.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-sft-amx.yaml b/kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-sft-amx.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-sft-amx.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat-sft-amx.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat.yaml b/kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/DeepSeek-V3-Chat.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/Internlm2_5-7b-Chat-1m.yaml b/kt-sft/ktransformers/optimize/optimize_rules/Internlm2_5-7b-Chat-1m.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/Internlm2_5-7b-Chat-1m.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/Internlm2_5-7b-Chat-1m.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/Mixtral.yaml b/kt-sft/ktransformers/optimize/optimize_rules/Mixtral.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/Mixtral.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/Mixtral.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/Moonlight-16B-A3B-serve.yaml b/kt-sft/ktransformers/optimize/optimize_rules/Moonlight-16B-A3B-serve.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/Moonlight-16B-A3B-serve.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/Moonlight-16B-A3B-serve.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/Moonlight-16B-A3B.yaml b/kt-sft/ktransformers/optimize/optimize_rules/Moonlight-16B-A3B.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/Moonlight-16B-A3B.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/Moonlight-16B-A3B.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/Qwen2-57B-A14B-Instruct-multi-gpu.yaml b/kt-sft/ktransformers/optimize/optimize_rules/Qwen2-57B-A14B-Instruct-multi-gpu.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/Qwen2-57B-A14B-Instruct-multi-gpu.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/Qwen2-57B-A14B-Instruct-multi-gpu.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/Qwen2-57B-A14B-Instruct.yaml b/kt-sft/ktransformers/optimize/optimize_rules/Qwen2-57B-A14B-Instruct.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/Qwen2-57B-A14B-Instruct.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/Qwen2-57B-A14B-Instruct.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/Qwen2-serve-amx.yaml b/kt-sft/ktransformers/optimize/optimize_rules/Qwen2-serve-amx.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/Qwen2-serve-amx.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/Qwen2-serve-amx.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/Qwen2-serve.yaml b/kt-sft/ktransformers/optimize/optimize_rules/Qwen2-serve.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/Qwen2-serve.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/Qwen2-serve.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/Qwen3Moe-serve-amx.yaml b/kt-sft/ktransformers/optimize/optimize_rules/Qwen3Moe-serve-amx.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/Qwen3Moe-serve-amx.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/Qwen3Moe-serve-amx.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/Qwen3Moe-serve.yaml b/kt-sft/ktransformers/optimize/optimize_rules/Qwen3Moe-serve.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/Qwen3Moe-serve.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/Qwen3Moe-serve.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/Qwen3Moe-sft-amx.yaml b/kt-sft/ktransformers/optimize/optimize_rules/Qwen3Moe-sft-amx.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/Qwen3Moe-sft-amx.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/Qwen3Moe-sft-amx.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/rocm/DeepSeek-V3-Chat.yaml b/kt-sft/ktransformers/optimize/optimize_rules/rocm/DeepSeek-V3-Chat.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/rocm/DeepSeek-V3-Chat.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/rocm/DeepSeek-V3-Chat.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/xpu/DeepSeek-V2-Chat.yaml b/kt-sft/ktransformers/optimize/optimize_rules/xpu/DeepSeek-V2-Chat.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/xpu/DeepSeek-V2-Chat.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/xpu/DeepSeek-V2-Chat.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/xpu/DeepSeek-V3-Chat.yaml b/kt-sft/ktransformers/optimize/optimize_rules/xpu/DeepSeek-V3-Chat.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/xpu/DeepSeek-V3-Chat.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/xpu/DeepSeek-V3-Chat.yaml diff --git a/KT-SFT/ktransformers/optimize/optimize_rules/xpu/Qwen3Moe-Chat.yaml b/kt-sft/ktransformers/optimize/optimize_rules/xpu/Qwen3Moe-Chat.yaml similarity index 100% rename from KT-SFT/ktransformers/optimize/optimize_rules/xpu/Qwen3Moe-Chat.yaml rename to kt-sft/ktransformers/optimize/optimize_rules/xpu/Qwen3Moe-Chat.yaml diff --git a/KT-SFT/ktransformers/server/__init__.py b/kt-sft/ktransformers/server/__init__.py similarity index 100% rename from KT-SFT/ktransformers/server/__init__.py rename to kt-sft/ktransformers/server/__init__.py diff --git a/KT-SFT/ktransformers/server/api/__init__.py b/kt-sft/ktransformers/server/api/__init__.py similarity index 100% rename from KT-SFT/ktransformers/server/api/__init__.py rename to kt-sft/ktransformers/server/api/__init__.py diff --git a/KT-SFT/ktransformers/server/api/ollama/__init__.py b/kt-sft/ktransformers/server/api/ollama/__init__.py similarity index 100% rename from KT-SFT/ktransformers/server/api/ollama/__init__.py rename to kt-sft/ktransformers/server/api/ollama/__init__.py diff --git a/KT-SFT/ktransformers/server/api/ollama/completions.py b/kt-sft/ktransformers/server/api/ollama/completions.py similarity index 100% rename from KT-SFT/ktransformers/server/api/ollama/completions.py rename to kt-sft/ktransformers/server/api/ollama/completions.py diff --git a/KT-SFT/ktransformers/server/api/openai/__init__.py b/kt-sft/ktransformers/server/api/openai/__init__.py similarity index 100% rename from KT-SFT/ktransformers/server/api/openai/__init__.py rename to kt-sft/ktransformers/server/api/openai/__init__.py diff --git a/KT-SFT/ktransformers/server/api/openai/assistants/__init__.py b/kt-sft/ktransformers/server/api/openai/assistants/__init__.py similarity index 100% rename from KT-SFT/ktransformers/server/api/openai/assistants/__init__.py rename to kt-sft/ktransformers/server/api/openai/assistants/__init__.py diff --git a/KT-SFT/ktransformers/server/api/openai/assistants/assistants.py b/kt-sft/ktransformers/server/api/openai/assistants/assistants.py similarity index 100% rename from KT-SFT/ktransformers/server/api/openai/assistants/assistants.py rename to kt-sft/ktransformers/server/api/openai/assistants/assistants.py diff --git a/KT-SFT/ktransformers/server/api/openai/assistants/messages.py b/kt-sft/ktransformers/server/api/openai/assistants/messages.py similarity index 100% rename from KT-SFT/ktransformers/server/api/openai/assistants/messages.py rename to kt-sft/ktransformers/server/api/openai/assistants/messages.py diff --git a/KT-SFT/ktransformers/server/api/openai/assistants/runs.py b/kt-sft/ktransformers/server/api/openai/assistants/runs.py similarity index 100% rename from KT-SFT/ktransformers/server/api/openai/assistants/runs.py rename to kt-sft/ktransformers/server/api/openai/assistants/runs.py diff --git a/KT-SFT/ktransformers/server/api/openai/assistants/threads.py b/kt-sft/ktransformers/server/api/openai/assistants/threads.py similarity index 100% rename from KT-SFT/ktransformers/server/api/openai/assistants/threads.py rename to kt-sft/ktransformers/server/api/openai/assistants/threads.py diff --git a/KT-SFT/ktransformers/server/api/openai/endpoints/__init__.py b/kt-sft/ktransformers/server/api/openai/endpoints/__init__.py similarity index 100% rename from KT-SFT/ktransformers/server/api/openai/endpoints/__init__.py rename to kt-sft/ktransformers/server/api/openai/endpoints/__init__.py diff --git a/KT-SFT/ktransformers/server/api/openai/endpoints/chat.py b/kt-sft/ktransformers/server/api/openai/endpoints/chat.py similarity index 100% rename from KT-SFT/ktransformers/server/api/openai/endpoints/chat.py rename to kt-sft/ktransformers/server/api/openai/endpoints/chat.py diff --git a/KT-SFT/ktransformers/server/api/openai/legacy/__init__.py b/kt-sft/ktransformers/server/api/openai/legacy/__init__.py similarity index 100% rename from KT-SFT/ktransformers/server/api/openai/legacy/__init__.py rename to kt-sft/ktransformers/server/api/openai/legacy/__init__.py diff --git a/KT-SFT/ktransformers/server/api/openai/legacy/completions.py b/kt-sft/ktransformers/server/api/openai/legacy/completions.py similarity index 100% rename from KT-SFT/ktransformers/server/api/openai/legacy/completions.py rename to kt-sft/ktransformers/server/api/openai/legacy/completions.py diff --git a/KT-SFT/ktransformers/server/api/web/__init__.py b/kt-sft/ktransformers/server/api/web/__init__.py similarity index 100% rename from KT-SFT/ktransformers/server/api/web/__init__.py rename to kt-sft/ktransformers/server/api/web/__init__.py diff --git a/KT-SFT/ktransformers/server/api/web/system.py b/kt-sft/ktransformers/server/api/web/system.py similarity index 100% rename from KT-SFT/ktransformers/server/api/web/system.py rename to kt-sft/ktransformers/server/api/web/system.py diff --git a/KT-SFT/ktransformers/server/args.py b/kt-sft/ktransformers/server/args.py similarity index 100% rename from KT-SFT/ktransformers/server/args.py rename to kt-sft/ktransformers/server/args.py diff --git a/KT-SFT/ktransformers/server/backend/__init__.py b/kt-sft/ktransformers/server/backend/__init__.py similarity index 100% rename from KT-SFT/ktransformers/server/backend/__init__.py rename to kt-sft/ktransformers/server/backend/__init__.py diff --git a/KT-SFT/ktransformers/server/backend/args.py b/kt-sft/ktransformers/server/backend/args.py similarity index 100% rename from KT-SFT/ktransformers/server/backend/args.py rename to kt-sft/ktransformers/server/backend/args.py diff --git a/KT-SFT/ktransformers/server/backend/base.py b/kt-sft/ktransformers/server/backend/base.py similarity index 100% rename from KT-SFT/ktransformers/server/backend/base.py rename to kt-sft/ktransformers/server/backend/base.py diff --git a/KT-SFT/ktransformers/server/backend/context_manager.py b/kt-sft/ktransformers/server/backend/context_manager.py similarity index 100% rename from KT-SFT/ktransformers/server/backend/context_manager.py rename to kt-sft/ktransformers/server/backend/context_manager.py diff --git a/KT-SFT/ktransformers/server/backend/interfaces/__init__.py b/kt-sft/ktransformers/server/backend/interfaces/__init__.py similarity index 100% rename from KT-SFT/ktransformers/server/backend/interfaces/__init__.py rename to kt-sft/ktransformers/server/backend/interfaces/__init__.py diff --git a/KT-SFT/ktransformers/server/backend/interfaces/balance_serve.py b/kt-sft/ktransformers/server/backend/interfaces/balance_serve.py similarity index 100% rename from KT-SFT/ktransformers/server/backend/interfaces/balance_serve.py rename to kt-sft/ktransformers/server/backend/interfaces/balance_serve.py diff --git a/KT-SFT/ktransformers/server/backend/interfaces/exllamav2.py b/kt-sft/ktransformers/server/backend/interfaces/exllamav2.py similarity index 100% rename from KT-SFT/ktransformers/server/backend/interfaces/exllamav2.py rename to kt-sft/ktransformers/server/backend/interfaces/exllamav2.py diff --git a/KT-SFT/ktransformers/server/backend/interfaces/ktransformers.py b/kt-sft/ktransformers/server/backend/interfaces/ktransformers.py similarity index 100% rename from KT-SFT/ktransformers/server/backend/interfaces/ktransformers.py rename to kt-sft/ktransformers/server/backend/interfaces/ktransformers.py diff --git a/KT-SFT/ktransformers/server/backend/interfaces/transformers.py b/kt-sft/ktransformers/server/backend/interfaces/transformers.py similarity index 100% rename from KT-SFT/ktransformers/server/backend/interfaces/transformers.py rename to kt-sft/ktransformers/server/backend/interfaces/transformers.py diff --git a/KT-SFT/ktransformers/server/balance_serve/inference/__init__.py b/kt-sft/ktransformers/server/balance_serve/inference/__init__.py similarity index 100% rename from KT-SFT/ktransformers/server/balance_serve/inference/__init__.py rename to kt-sft/ktransformers/server/balance_serve/inference/__init__.py diff --git a/KT-SFT/ktransformers/server/balance_serve/inference/config.py b/kt-sft/ktransformers/server/balance_serve/inference/config.py similarity index 100% rename from KT-SFT/ktransformers/server/balance_serve/inference/config.py rename to kt-sft/ktransformers/server/balance_serve/inference/config.py diff --git a/KT-SFT/ktransformers/server/balance_serve/inference/distributed/__init__.py b/kt-sft/ktransformers/server/balance_serve/inference/distributed/__init__.py similarity index 100% rename from KT-SFT/ktransformers/server/balance_serve/inference/distributed/__init__.py rename to kt-sft/ktransformers/server/balance_serve/inference/distributed/__init__.py diff --git a/KT-SFT/ktransformers/server/balance_serve/inference/distributed/communication_op.py b/kt-sft/ktransformers/server/balance_serve/inference/distributed/communication_op.py similarity index 100% rename from KT-SFT/ktransformers/server/balance_serve/inference/distributed/communication_op.py rename to kt-sft/ktransformers/server/balance_serve/inference/distributed/communication_op.py diff --git a/KT-SFT/ktransformers/server/balance_serve/inference/distributed/cuda_wrapper.py b/kt-sft/ktransformers/server/balance_serve/inference/distributed/cuda_wrapper.py similarity index 100% rename from KT-SFT/ktransformers/server/balance_serve/inference/distributed/cuda_wrapper.py rename to kt-sft/ktransformers/server/balance_serve/inference/distributed/cuda_wrapper.py diff --git a/KT-SFT/ktransformers/server/balance_serve/inference/distributed/custom_all_reduce.py b/kt-sft/ktransformers/server/balance_serve/inference/distributed/custom_all_reduce.py similarity index 100% rename from KT-SFT/ktransformers/server/balance_serve/inference/distributed/custom_all_reduce.py rename to kt-sft/ktransformers/server/balance_serve/inference/distributed/custom_all_reduce.py diff --git a/KT-SFT/ktransformers/server/balance_serve/inference/distributed/custom_all_reduce_utils.py b/kt-sft/ktransformers/server/balance_serve/inference/distributed/custom_all_reduce_utils.py similarity index 100% rename from KT-SFT/ktransformers/server/balance_serve/inference/distributed/custom_all_reduce_utils.py rename to kt-sft/ktransformers/server/balance_serve/inference/distributed/custom_all_reduce_utils.py diff --git a/KT-SFT/ktransformers/server/balance_serve/inference/distributed/parallel_state.py b/kt-sft/ktransformers/server/balance_serve/inference/distributed/parallel_state.py similarity index 100% rename from KT-SFT/ktransformers/server/balance_serve/inference/distributed/parallel_state.py rename to kt-sft/ktransformers/server/balance_serve/inference/distributed/parallel_state.py diff --git a/KT-SFT/ktransformers/server/balance_serve/inference/distributed/pynccl.py b/kt-sft/ktransformers/server/balance_serve/inference/distributed/pynccl.py similarity index 100% rename from KT-SFT/ktransformers/server/balance_serve/inference/distributed/pynccl.py rename to kt-sft/ktransformers/server/balance_serve/inference/distributed/pynccl.py diff --git a/KT-SFT/ktransformers/server/balance_serve/inference/distributed/pynccl_wrapper.py b/kt-sft/ktransformers/server/balance_serve/inference/distributed/pynccl_wrapper.py similarity index 100% rename from KT-SFT/ktransformers/server/balance_serve/inference/distributed/pynccl_wrapper.py rename to kt-sft/ktransformers/server/balance_serve/inference/distributed/pynccl_wrapper.py diff --git a/KT-SFT/ktransformers/server/balance_serve/inference/distributed/utils.py b/kt-sft/ktransformers/server/balance_serve/inference/distributed/utils.py similarity index 100% rename from KT-SFT/ktransformers/server/balance_serve/inference/distributed/utils.py rename to kt-sft/ktransformers/server/balance_serve/inference/distributed/utils.py diff --git a/KT-SFT/ktransformers/server/balance_serve/inference/forward_batch.py b/kt-sft/ktransformers/server/balance_serve/inference/forward_batch.py similarity index 100% rename from KT-SFT/ktransformers/server/balance_serve/inference/forward_batch.py rename to kt-sft/ktransformers/server/balance_serve/inference/forward_batch.py diff --git a/KT-SFT/ktransformers/server/balance_serve/inference/model_runner.py b/kt-sft/ktransformers/server/balance_serve/inference/model_runner.py similarity index 100% rename from KT-SFT/ktransformers/server/balance_serve/inference/model_runner.py rename to kt-sft/ktransformers/server/balance_serve/inference/model_runner.py diff --git a/KT-SFT/ktransformers/server/balance_serve/inference/query_manager.py b/kt-sft/ktransformers/server/balance_serve/inference/query_manager.py similarity index 100% rename from KT-SFT/ktransformers/server/balance_serve/inference/query_manager.py rename to kt-sft/ktransformers/server/balance_serve/inference/query_manager.py diff --git a/KT-SFT/ktransformers/server/balance_serve/inference/sampling/penaltylib/__init__.py b/kt-sft/ktransformers/server/balance_serve/inference/sampling/penaltylib/__init__.py similarity index 100% rename from KT-SFT/ktransformers/server/balance_serve/inference/sampling/penaltylib/__init__.py rename to kt-sft/ktransformers/server/balance_serve/inference/sampling/penaltylib/__init__.py diff --git a/KT-SFT/ktransformers/server/balance_serve/inference/sampling/penaltylib/orchestrator.py b/kt-sft/ktransformers/server/balance_serve/inference/sampling/penaltylib/orchestrator.py similarity index 100% rename from KT-SFT/ktransformers/server/balance_serve/inference/sampling/penaltylib/orchestrator.py rename to kt-sft/ktransformers/server/balance_serve/inference/sampling/penaltylib/orchestrator.py diff --git a/KT-SFT/ktransformers/server/balance_serve/inference/sampling/penaltylib/penalizers/frequency_penalty.py b/kt-sft/ktransformers/server/balance_serve/inference/sampling/penaltylib/penalizers/frequency_penalty.py similarity index 100% rename from KT-SFT/ktransformers/server/balance_serve/inference/sampling/penaltylib/penalizers/frequency_penalty.py rename to kt-sft/ktransformers/server/balance_serve/inference/sampling/penaltylib/penalizers/frequency_penalty.py diff --git a/KT-SFT/ktransformers/server/balance_serve/inference/sampling/penaltylib/penalizers/min_new_tokens.py b/kt-sft/ktransformers/server/balance_serve/inference/sampling/penaltylib/penalizers/min_new_tokens.py similarity index 100% rename from KT-SFT/ktransformers/server/balance_serve/inference/sampling/penaltylib/penalizers/min_new_tokens.py rename to kt-sft/ktransformers/server/balance_serve/inference/sampling/penaltylib/penalizers/min_new_tokens.py diff --git a/KT-SFT/ktransformers/server/balance_serve/inference/sampling/penaltylib/penalizers/presence_penalty.py b/kt-sft/ktransformers/server/balance_serve/inference/sampling/penaltylib/penalizers/presence_penalty.py similarity index 100% rename from KT-SFT/ktransformers/server/balance_serve/inference/sampling/penaltylib/penalizers/presence_penalty.py rename to kt-sft/ktransformers/server/balance_serve/inference/sampling/penaltylib/penalizers/presence_penalty.py diff --git a/KT-SFT/ktransformers/server/balance_serve/inference/sampling/penaltylib/penalizers/repetition_penalty.py b/kt-sft/ktransformers/server/balance_serve/inference/sampling/penaltylib/penalizers/repetition_penalty.py similarity index 100% rename from KT-SFT/ktransformers/server/balance_serve/inference/sampling/penaltylib/penalizers/repetition_penalty.py rename to kt-sft/ktransformers/server/balance_serve/inference/sampling/penaltylib/penalizers/repetition_penalty.py diff --git a/KT-SFT/ktransformers/server/balance_serve/inference/sampling/sampler.py b/kt-sft/ktransformers/server/balance_serve/inference/sampling/sampler.py similarity index 100% rename from KT-SFT/ktransformers/server/balance_serve/inference/sampling/sampler.py rename to kt-sft/ktransformers/server/balance_serve/inference/sampling/sampler.py diff --git a/KT-SFT/ktransformers/server/balance_serve/sched_rpc.py b/kt-sft/ktransformers/server/balance_serve/sched_rpc.py similarity index 100% rename from KT-SFT/ktransformers/server/balance_serve/sched_rpc.py rename to kt-sft/ktransformers/server/balance_serve/sched_rpc.py diff --git a/KT-SFT/ktransformers/server/balance_serve/settings.py b/kt-sft/ktransformers/server/balance_serve/settings.py similarity index 100% rename from KT-SFT/ktransformers/server/balance_serve/settings.py rename to kt-sft/ktransformers/server/balance_serve/settings.py diff --git a/KT-SFT/ktransformers/server/config/config.py b/kt-sft/ktransformers/server/config/config.py similarity index 100% rename from KT-SFT/ktransformers/server/config/config.py rename to kt-sft/ktransformers/server/config/config.py diff --git a/KT-SFT/ktransformers/server/config/log.py b/kt-sft/ktransformers/server/config/log.py similarity index 100% rename from KT-SFT/ktransformers/server/config/log.py rename to kt-sft/ktransformers/server/config/log.py diff --git a/KT-SFT/ktransformers/server/config/singleton.py b/kt-sft/ktransformers/server/config/singleton.py similarity index 100% rename from KT-SFT/ktransformers/server/config/singleton.py rename to kt-sft/ktransformers/server/config/singleton.py diff --git a/KT-SFT/ktransformers/server/crud/__init__.py b/kt-sft/ktransformers/server/crud/__init__.py similarity index 100% rename from KT-SFT/ktransformers/server/crud/__init__.py rename to kt-sft/ktransformers/server/crud/__init__.py diff --git a/KT-SFT/ktransformers/server/crud/assistants/__init__.py b/kt-sft/ktransformers/server/crud/assistants/__init__.py similarity index 100% rename from KT-SFT/ktransformers/server/crud/assistants/__init__.py rename to kt-sft/ktransformers/server/crud/assistants/__init__.py diff --git a/KT-SFT/ktransformers/server/crud/assistants/assistants.py b/kt-sft/ktransformers/server/crud/assistants/assistants.py similarity index 100% rename from KT-SFT/ktransformers/server/crud/assistants/assistants.py rename to kt-sft/ktransformers/server/crud/assistants/assistants.py diff --git a/KT-SFT/ktransformers/server/crud/assistants/messages.py b/kt-sft/ktransformers/server/crud/assistants/messages.py similarity index 100% rename from KT-SFT/ktransformers/server/crud/assistants/messages.py rename to kt-sft/ktransformers/server/crud/assistants/messages.py diff --git a/KT-SFT/ktransformers/server/crud/assistants/runs.py b/kt-sft/ktransformers/server/crud/assistants/runs.py similarity index 100% rename from KT-SFT/ktransformers/server/crud/assistants/runs.py rename to kt-sft/ktransformers/server/crud/assistants/runs.py diff --git a/KT-SFT/ktransformers/server/crud/assistants/threads.py b/kt-sft/ktransformers/server/crud/assistants/threads.py similarity index 100% rename from KT-SFT/ktransformers/server/crud/assistants/threads.py rename to kt-sft/ktransformers/server/crud/assistants/threads.py diff --git a/KT-SFT/ktransformers/server/exceptions.py b/kt-sft/ktransformers/server/exceptions.py similarity index 100% rename from KT-SFT/ktransformers/server/exceptions.py rename to kt-sft/ktransformers/server/exceptions.py diff --git a/KT-SFT/ktransformers/server/main.py b/kt-sft/ktransformers/server/main.py similarity index 100% rename from KT-SFT/ktransformers/server/main.py rename to kt-sft/ktransformers/server/main.py diff --git a/KT-SFT/ktransformers/server/models/__init__.py b/kt-sft/ktransformers/server/models/__init__.py similarity index 100% rename from KT-SFT/ktransformers/server/models/__init__.py rename to kt-sft/ktransformers/server/models/__init__.py diff --git a/KT-SFT/ktransformers/server/models/assistants/__init__.py b/kt-sft/ktransformers/server/models/assistants/__init__.py similarity index 100% rename from KT-SFT/ktransformers/server/models/assistants/__init__.py rename to kt-sft/ktransformers/server/models/assistants/__init__.py diff --git a/KT-SFT/ktransformers/server/models/assistants/assistants.py b/kt-sft/ktransformers/server/models/assistants/assistants.py similarity index 100% rename from KT-SFT/ktransformers/server/models/assistants/assistants.py rename to kt-sft/ktransformers/server/models/assistants/assistants.py diff --git a/KT-SFT/ktransformers/server/models/assistants/messages.py b/kt-sft/ktransformers/server/models/assistants/messages.py similarity index 100% rename from KT-SFT/ktransformers/server/models/assistants/messages.py rename to kt-sft/ktransformers/server/models/assistants/messages.py diff --git a/KT-SFT/ktransformers/server/models/assistants/run_steps.py b/kt-sft/ktransformers/server/models/assistants/run_steps.py similarity index 100% rename from KT-SFT/ktransformers/server/models/assistants/run_steps.py rename to kt-sft/ktransformers/server/models/assistants/run_steps.py diff --git a/KT-SFT/ktransformers/server/models/assistants/runs.py b/kt-sft/ktransformers/server/models/assistants/runs.py similarity index 100% rename from KT-SFT/ktransformers/server/models/assistants/runs.py rename to kt-sft/ktransformers/server/models/assistants/runs.py diff --git a/KT-SFT/ktransformers/server/models/assistants/threads.py b/kt-sft/ktransformers/server/models/assistants/threads.py similarity index 100% rename from KT-SFT/ktransformers/server/models/assistants/threads.py rename to kt-sft/ktransformers/server/models/assistants/threads.py diff --git a/KT-SFT/ktransformers/server/schemas/__init__.py b/kt-sft/ktransformers/server/schemas/__init__.py similarity index 100% rename from KT-SFT/ktransformers/server/schemas/__init__.py rename to kt-sft/ktransformers/server/schemas/__init__.py diff --git a/KT-SFT/ktransformers/server/schemas/assistants/__init__.py b/kt-sft/ktransformers/server/schemas/assistants/__init__.py similarity index 100% rename from KT-SFT/ktransformers/server/schemas/assistants/__init__.py rename to kt-sft/ktransformers/server/schemas/assistants/__init__.py diff --git a/KT-SFT/ktransformers/server/schemas/assistants/assistants.py b/kt-sft/ktransformers/server/schemas/assistants/assistants.py similarity index 100% rename from KT-SFT/ktransformers/server/schemas/assistants/assistants.py rename to kt-sft/ktransformers/server/schemas/assistants/assistants.py diff --git a/KT-SFT/ktransformers/server/schemas/assistants/messages.py b/kt-sft/ktransformers/server/schemas/assistants/messages.py similarity index 100% rename from KT-SFT/ktransformers/server/schemas/assistants/messages.py rename to kt-sft/ktransformers/server/schemas/assistants/messages.py diff --git a/KT-SFT/ktransformers/server/schemas/assistants/runs.py b/kt-sft/ktransformers/server/schemas/assistants/runs.py similarity index 100% rename from KT-SFT/ktransformers/server/schemas/assistants/runs.py rename to kt-sft/ktransformers/server/schemas/assistants/runs.py diff --git a/KT-SFT/ktransformers/server/schemas/assistants/streaming.py b/kt-sft/ktransformers/server/schemas/assistants/streaming.py similarity index 100% rename from KT-SFT/ktransformers/server/schemas/assistants/streaming.py rename to kt-sft/ktransformers/server/schemas/assistants/streaming.py diff --git a/KT-SFT/ktransformers/server/schemas/assistants/threads.py b/kt-sft/ktransformers/server/schemas/assistants/threads.py similarity index 100% rename from KT-SFT/ktransformers/server/schemas/assistants/threads.py rename to kt-sft/ktransformers/server/schemas/assistants/threads.py diff --git a/KT-SFT/ktransformers/server/schemas/assistants/tool.py b/kt-sft/ktransformers/server/schemas/assistants/tool.py similarity index 100% rename from KT-SFT/ktransformers/server/schemas/assistants/tool.py rename to kt-sft/ktransformers/server/schemas/assistants/tool.py diff --git a/KT-SFT/ktransformers/server/schemas/base.py b/kt-sft/ktransformers/server/schemas/base.py similarity index 100% rename from KT-SFT/ktransformers/server/schemas/base.py rename to kt-sft/ktransformers/server/schemas/base.py diff --git a/KT-SFT/ktransformers/server/schemas/conversation.py b/kt-sft/ktransformers/server/schemas/conversation.py similarity index 100% rename from KT-SFT/ktransformers/server/schemas/conversation.py rename to kt-sft/ktransformers/server/schemas/conversation.py diff --git a/KT-SFT/ktransformers/server/schemas/endpoints/chat.py b/kt-sft/ktransformers/server/schemas/endpoints/chat.py similarity index 100% rename from KT-SFT/ktransformers/server/schemas/endpoints/chat.py rename to kt-sft/ktransformers/server/schemas/endpoints/chat.py diff --git a/KT-SFT/ktransformers/server/schemas/legacy/__init__.py b/kt-sft/ktransformers/server/schemas/legacy/__init__.py similarity index 100% rename from KT-SFT/ktransformers/server/schemas/legacy/__init__.py rename to kt-sft/ktransformers/server/schemas/legacy/__init__.py diff --git a/KT-SFT/ktransformers/server/schemas/legacy/completions.py b/kt-sft/ktransformers/server/schemas/legacy/completions.py similarity index 100% rename from KT-SFT/ktransformers/server/schemas/legacy/completions.py rename to kt-sft/ktransformers/server/schemas/legacy/completions.py diff --git a/KT-SFT/ktransformers/server/utils/__init__.py b/kt-sft/ktransformers/server/utils/__init__.py similarity index 100% rename from KT-SFT/ktransformers/server/utils/__init__.py rename to kt-sft/ktransformers/server/utils/__init__.py diff --git a/KT-SFT/ktransformers/server/utils/create_interface.py b/kt-sft/ktransformers/server/utils/create_interface.py similarity index 100% rename from KT-SFT/ktransformers/server/utils/create_interface.py rename to kt-sft/ktransformers/server/utils/create_interface.py diff --git a/KT-SFT/ktransformers/server/utils/multi_timer.py b/kt-sft/ktransformers/server/utils/multi_timer.py similarity index 100% rename from KT-SFT/ktransformers/server/utils/multi_timer.py rename to kt-sft/ktransformers/server/utils/multi_timer.py diff --git a/KT-SFT/ktransformers/server/utils/sql_utils.py b/kt-sft/ktransformers/server/utils/sql_utils.py similarity index 100% rename from KT-SFT/ktransformers/server/utils/sql_utils.py rename to kt-sft/ktransformers/server/utils/sql_utils.py diff --git a/KT-SFT/ktransformers/sft/__init__.py b/kt-sft/ktransformers/sft/__init__.py similarity index 100% rename from KT-SFT/ktransformers/sft/__init__.py rename to kt-sft/ktransformers/sft/__init__.py diff --git a/KT-SFT/ktransformers/sft/flops_utils/__init__.py b/kt-sft/ktransformers/sft/flops_utils/__init__.py similarity index 100% rename from KT-SFT/ktransformers/sft/flops_utils/__init__.py rename to kt-sft/ktransformers/sft/flops_utils/__init__.py diff --git a/KT-SFT/ktransformers/sft/flops_utils/custom_profile.py b/kt-sft/ktransformers/sft/flops_utils/custom_profile.py similarity index 100% rename from KT-SFT/ktransformers/sft/flops_utils/custom_profile.py rename to kt-sft/ktransformers/sft/flops_utils/custom_profile.py diff --git a/KT-SFT/ktransformers/sft/flops_utils/lora_test_utils.py b/kt-sft/ktransformers/sft/flops_utils/lora_test_utils.py similarity index 99% rename from KT-SFT/ktransformers/sft/flops_utils/lora_test_utils.py rename to kt-sft/ktransformers/sft/flops_utils/lora_test_utils.py index fbab7ac9..627b86fd 100644 --- a/KT-SFT/ktransformers/sft/flops_utils/lora_test_utils.py +++ b/kt-sft/ktransformers/sft/flops_utils/lora_test_utils.py @@ -411,7 +411,7 @@ def report_meta_tensors(model): # gradients = collect_gradients(model, input_ids) ''' - # with open(f"/home/lpl/KT-SFT/tmp/KSFTExpertsCPU_grads.txt", "w") as f: + # with open(f"/home/lpl/kt-sft/tmp/KSFTExpertsCPU_grads.txt", "w") as f: # f.write("\n".join(gradients)) # print(xx) diff --git a/KT-SFT/ktransformers/sft/lora.py b/kt-sft/ktransformers/sft/lora.py similarity index 100% rename from KT-SFT/ktransformers/sft/lora.py rename to kt-sft/ktransformers/sft/lora.py diff --git a/KT-SFT/ktransformers/sft/metrics.py b/kt-sft/ktransformers/sft/metrics.py similarity index 100% rename from KT-SFT/ktransformers/sft/metrics.py rename to kt-sft/ktransformers/sft/metrics.py diff --git a/KT-SFT/ktransformers/sft/metrics_utils/__init__.py b/kt-sft/ktransformers/sft/metrics_utils/__init__.py similarity index 100% rename from KT-SFT/ktransformers/sft/metrics_utils/__init__.py rename to kt-sft/ktransformers/sft/metrics_utils/__init__.py diff --git a/KT-SFT/ktransformers/sft/metrics_utils/constants.py b/kt-sft/ktransformers/sft/metrics_utils/constants.py similarity index 100% rename from KT-SFT/ktransformers/sft/metrics_utils/constants.py rename to kt-sft/ktransformers/sft/metrics_utils/constants.py diff --git a/KT-SFT/ktransformers/sft/metrics_utils/env.py b/kt-sft/ktransformers/sft/metrics_utils/env.py similarity index 100% rename from KT-SFT/ktransformers/sft/metrics_utils/env.py rename to kt-sft/ktransformers/sft/metrics_utils/env.py diff --git a/KT-SFT/ktransformers/sft/metrics_utils/logging.py b/kt-sft/ktransformers/sft/metrics_utils/logging.py similarity index 100% rename from KT-SFT/ktransformers/sft/metrics_utils/logging.py rename to kt-sft/ktransformers/sft/metrics_utils/logging.py diff --git a/KT-SFT/ktransformers/sft/metrics_utils/misc.py b/kt-sft/ktransformers/sft/metrics_utils/misc.py similarity index 100% rename from KT-SFT/ktransformers/sft/metrics_utils/misc.py rename to kt-sft/ktransformers/sft/metrics_utils/misc.py diff --git a/KT-SFT/ktransformers/sft/metrics_utils/packages.py b/kt-sft/ktransformers/sft/metrics_utils/packages.py similarity index 100% rename from KT-SFT/ktransformers/sft/metrics_utils/packages.py rename to kt-sft/ktransformers/sft/metrics_utils/packages.py diff --git a/KT-SFT/ktransformers/sft/metrics_utils/ploting.py b/kt-sft/ktransformers/sft/metrics_utils/ploting.py similarity index 100% rename from KT-SFT/ktransformers/sft/metrics_utils/ploting.py rename to kt-sft/ktransformers/sft/metrics_utils/ploting.py diff --git a/KT-SFT/ktransformers/sft/monkey_patch_torch_module.py b/kt-sft/ktransformers/sft/monkey_patch_torch_module.py similarity index 100% rename from KT-SFT/ktransformers/sft/monkey_patch_torch_module.py rename to kt-sft/ktransformers/sft/monkey_patch_torch_module.py diff --git a/KT-SFT/ktransformers/sft/peft_utils/__init__.py b/kt-sft/ktransformers/sft/peft_utils/__init__.py similarity index 100% rename from KT-SFT/ktransformers/sft/peft_utils/__init__.py rename to kt-sft/ktransformers/sft/peft_utils/__init__.py diff --git a/KT-SFT/ktransformers/sft/peft_utils/lora_layer.py b/kt-sft/ktransformers/sft/peft_utils/lora_layer.py similarity index 100% rename from KT-SFT/ktransformers/sft/peft_utils/lora_layer.py rename to kt-sft/ktransformers/sft/peft_utils/lora_layer.py diff --git a/KT-SFT/ktransformers/sft/peft_utils/lora_model.py b/kt-sft/ktransformers/sft/peft_utils/lora_model.py similarity index 100% rename from KT-SFT/ktransformers/sft/peft_utils/lora_model.py rename to kt-sft/ktransformers/sft/peft_utils/lora_model.py diff --git a/KT-SFT/ktransformers/sft/peft_utils/mapping.py b/kt-sft/ktransformers/sft/peft_utils/mapping.py similarity index 100% rename from KT-SFT/ktransformers/sft/peft_utils/mapping.py rename to kt-sft/ktransformers/sft/peft_utils/mapping.py diff --git a/KT-SFT/ktransformers/sft/peft_utils/peft_model.py b/kt-sft/ktransformers/sft/peft_utils/peft_model.py similarity index 100% rename from KT-SFT/ktransformers/sft/peft_utils/peft_model.py rename to kt-sft/ktransformers/sft/peft_utils/peft_model.py diff --git a/KT-SFT/ktransformers/sft/torchviz_test.py b/kt-sft/ktransformers/sft/torchviz_test.py similarity index 100% rename from KT-SFT/ktransformers/sft/torchviz_test.py rename to kt-sft/ktransformers/sft/torchviz_test.py diff --git a/KT-SFT/ktransformers/tests/.gitignore b/kt-sft/ktransformers/tests/.gitignore similarity index 100% rename from KT-SFT/ktransformers/tests/.gitignore rename to kt-sft/ktransformers/tests/.gitignore diff --git a/KT-SFT/ktransformers/tests/AIME_2024/eval_api.py b/kt-sft/ktransformers/tests/AIME_2024/eval_api.py similarity index 100% rename from KT-SFT/ktransformers/tests/AIME_2024/eval_api.py rename to kt-sft/ktransformers/tests/AIME_2024/eval_api.py diff --git a/KT-SFT/ktransformers/tests/AIME_2024/evaluation.py b/kt-sft/ktransformers/tests/AIME_2024/evaluation.py similarity index 100% rename from KT-SFT/ktransformers/tests/AIME_2024/evaluation.py rename to kt-sft/ktransformers/tests/AIME_2024/evaluation.py diff --git a/KT-SFT/ktransformers/tests/AIME_2024/prompts.py b/kt-sft/ktransformers/tests/AIME_2024/prompts.py similarity index 100% rename from KT-SFT/ktransformers/tests/AIME_2024/prompts.py rename to kt-sft/ktransformers/tests/AIME_2024/prompts.py diff --git a/KT-SFT/ktransformers/tests/dequant_gpu.py b/kt-sft/ktransformers/tests/dequant_gpu.py similarity index 100% rename from KT-SFT/ktransformers/tests/dequant_gpu.py rename to kt-sft/ktransformers/tests/dequant_gpu.py diff --git a/KT-SFT/ktransformers/tests/dequant_gpu_t.py b/kt-sft/ktransformers/tests/dequant_gpu_t.py similarity index 100% rename from KT-SFT/ktransformers/tests/dequant_gpu_t.py rename to kt-sft/ktransformers/tests/dequant_gpu_t.py diff --git a/KT-SFT/ktransformers/tests/function_call_test.py b/kt-sft/ktransformers/tests/function_call_test.py similarity index 100% rename from KT-SFT/ktransformers/tests/function_call_test.py rename to kt-sft/ktransformers/tests/function_call_test.py diff --git a/KT-SFT/ktransformers/tests/humaneval/eval_api.py b/kt-sft/ktransformers/tests/humaneval/eval_api.py similarity index 100% rename from KT-SFT/ktransformers/tests/humaneval/eval_api.py rename to kt-sft/ktransformers/tests/humaneval/eval_api.py diff --git a/KT-SFT/ktransformers/tests/humaneval/evaluation.py b/kt-sft/ktransformers/tests/humaneval/evaluation.py similarity index 100% rename from KT-SFT/ktransformers/tests/humaneval/evaluation.py rename to kt-sft/ktransformers/tests/humaneval/evaluation.py diff --git a/KT-SFT/ktransformers/tests/humaneval/prompts.py b/kt-sft/ktransformers/tests/humaneval/prompts.py similarity index 100% rename from KT-SFT/ktransformers/tests/humaneval/prompts.py rename to kt-sft/ktransformers/tests/humaneval/prompts.py diff --git a/KT-SFT/ktransformers/tests/mmlu_pro_test.py b/kt-sft/ktransformers/tests/mmlu_pro_test.py similarity index 100% rename from KT-SFT/ktransformers/tests/mmlu_pro_test.py rename to kt-sft/ktransformers/tests/mmlu_pro_test.py diff --git a/KT-SFT/ktransformers/tests/mmlu_test.py b/kt-sft/ktransformers/tests/mmlu_test.py similarity index 100% rename from KT-SFT/ktransformers/tests/mmlu_test.py rename to kt-sft/ktransformers/tests/mmlu_test.py diff --git a/KT-SFT/ktransformers/tests/mmlu_test_multi.py b/kt-sft/ktransformers/tests/mmlu_test_multi.py similarity index 100% rename from KT-SFT/ktransformers/tests/mmlu_test_multi.py rename to kt-sft/ktransformers/tests/mmlu_test_multi.py diff --git a/KT-SFT/ktransformers/tests/score.py b/kt-sft/ktransformers/tests/score.py similarity index 100% rename from KT-SFT/ktransformers/tests/score.py rename to kt-sft/ktransformers/tests/score.py diff --git a/KT-SFT/ktransformers/tests/test_client.py b/kt-sft/ktransformers/tests/test_client.py similarity index 100% rename from KT-SFT/ktransformers/tests/test_client.py rename to kt-sft/ktransformers/tests/test_client.py diff --git a/KT-SFT/ktransformers/tests/test_pytorch_q8.py b/kt-sft/ktransformers/tests/test_pytorch_q8.py similarity index 100% rename from KT-SFT/ktransformers/tests/test_pytorch_q8.py rename to kt-sft/ktransformers/tests/test_pytorch_q8.py diff --git a/KT-SFT/ktransformers/tests/test_speed.py b/kt-sft/ktransformers/tests/test_speed.py similarity index 100% rename from KT-SFT/ktransformers/tests/test_speed.py rename to kt-sft/ktransformers/tests/test_speed.py diff --git a/KT-SFT/ktransformers/tests/triton_fp8gemm_test.py b/kt-sft/ktransformers/tests/triton_fp8gemm_test.py similarity index 100% rename from KT-SFT/ktransformers/tests/triton_fp8gemm_test.py rename to kt-sft/ktransformers/tests/triton_fp8gemm_test.py diff --git a/KT-SFT/ktransformers/util/cuda_graph_runner.py b/kt-sft/ktransformers/util/cuda_graph_runner.py similarity index 100% rename from KT-SFT/ktransformers/util/cuda_graph_runner.py rename to kt-sft/ktransformers/util/cuda_graph_runner.py diff --git a/KT-SFT/ktransformers/util/custom_gguf.py b/kt-sft/ktransformers/util/custom_gguf.py similarity index 100% rename from KT-SFT/ktransformers/util/custom_gguf.py rename to kt-sft/ktransformers/util/custom_gguf.py diff --git a/KT-SFT/ktransformers/util/custom_loader.py b/kt-sft/ktransformers/util/custom_loader.py similarity index 100% rename from KT-SFT/ktransformers/util/custom_loader.py rename to kt-sft/ktransformers/util/custom_loader.py diff --git a/KT-SFT/ktransformers/util/globals.py b/kt-sft/ktransformers/util/globals.py similarity index 100% rename from KT-SFT/ktransformers/util/globals.py rename to kt-sft/ktransformers/util/globals.py diff --git a/KT-SFT/ktransformers/util/grad_wrapper.py b/kt-sft/ktransformers/util/grad_wrapper.py similarity index 100% rename from KT-SFT/ktransformers/util/grad_wrapper.py rename to kt-sft/ktransformers/util/grad_wrapper.py diff --git a/KT-SFT/ktransformers/util/inference_state.py b/kt-sft/ktransformers/util/inference_state.py similarity index 100% rename from KT-SFT/ktransformers/util/inference_state.py rename to kt-sft/ktransformers/util/inference_state.py diff --git a/KT-SFT/ktransformers/util/modeling_rope_utils.py b/kt-sft/ktransformers/util/modeling_rope_utils.py similarity index 100% rename from KT-SFT/ktransformers/util/modeling_rope_utils.py rename to kt-sft/ktransformers/util/modeling_rope_utils.py diff --git a/KT-SFT/ktransformers/util/textstream.py b/kt-sft/ktransformers/util/textstream.py similarity index 100% rename from KT-SFT/ktransformers/util/textstream.py rename to kt-sft/ktransformers/util/textstream.py diff --git a/KT-SFT/ktransformers/util/utils.py b/kt-sft/ktransformers/util/utils.py similarity index 100% rename from KT-SFT/ktransformers/util/utils.py rename to kt-sft/ktransformers/util/utils.py diff --git a/KT-SFT/ktransformers/util/vendors.py b/kt-sft/ktransformers/util/vendors.py similarity index 100% rename from KT-SFT/ktransformers/util/vendors.py rename to kt-sft/ktransformers/util/vendors.py diff --git a/KT-SFT/ktransformers/util/weight_loader.py b/kt-sft/ktransformers/util/weight_loader.py similarity index 100% rename from KT-SFT/ktransformers/util/weight_loader.py rename to kt-sft/ktransformers/util/weight_loader.py diff --git a/KT-SFT/ktransformers/website/.browserslistrc b/kt-sft/ktransformers/website/.browserslistrc similarity index 100% rename from KT-SFT/ktransformers/website/.browserslistrc rename to kt-sft/ktransformers/website/.browserslistrc diff --git a/KT-SFT/ktransformers/website/.eslintrc.js b/kt-sft/ktransformers/website/.eslintrc.js similarity index 100% rename from KT-SFT/ktransformers/website/.eslintrc.js rename to kt-sft/ktransformers/website/.eslintrc.js diff --git a/KT-SFT/ktransformers/website/.gitignore b/kt-sft/ktransformers/website/.gitignore similarity index 100% rename from KT-SFT/ktransformers/website/.gitignore rename to kt-sft/ktransformers/website/.gitignore diff --git a/KT-SFT/ktransformers/website/README.md b/kt-sft/ktransformers/website/README.md similarity index 100% rename from KT-SFT/ktransformers/website/README.md rename to kt-sft/ktransformers/website/README.md diff --git a/KT-SFT/ktransformers/website/config.d.ts b/kt-sft/ktransformers/website/config.d.ts similarity index 100% rename from KT-SFT/ktransformers/website/config.d.ts rename to kt-sft/ktransformers/website/config.d.ts diff --git a/KT-SFT/ktransformers/website/jest.config.js b/kt-sft/ktransformers/website/jest.config.js similarity index 100% rename from KT-SFT/ktransformers/website/jest.config.js rename to kt-sft/ktransformers/website/jest.config.js diff --git a/KT-SFT/ktransformers/website/package-lock.json b/kt-sft/ktransformers/website/package-lock.json similarity index 100% rename from KT-SFT/ktransformers/website/package-lock.json rename to kt-sft/ktransformers/website/package-lock.json diff --git a/KT-SFT/ktransformers/website/package.json b/kt-sft/ktransformers/website/package.json similarity index 100% rename from KT-SFT/ktransformers/website/package.json rename to kt-sft/ktransformers/website/package.json diff --git a/KT-SFT/ktransformers/website/public/balck.ico b/kt-sft/ktransformers/website/public/balck.ico similarity index 100% rename from KT-SFT/ktransformers/website/public/balck.ico rename to kt-sft/ktransformers/website/public/balck.ico diff --git a/KT-SFT/ktransformers/website/public/config.js b/kt-sft/ktransformers/website/public/config.js similarity index 100% rename from KT-SFT/ktransformers/website/public/config.js rename to kt-sft/ktransformers/website/public/config.js diff --git a/KT-SFT/ktransformers/website/public/css/reset.css b/kt-sft/ktransformers/website/public/css/reset.css similarity index 100% rename from KT-SFT/ktransformers/website/public/css/reset.css rename to kt-sft/ktransformers/website/public/css/reset.css diff --git a/KT-SFT/ktransformers/website/public/images/assistant-avatar.png b/kt-sft/ktransformers/website/public/images/assistant-avatar.png similarity index 100% rename from KT-SFT/ktransformers/website/public/images/assistant-avatar.png rename to kt-sft/ktransformers/website/public/images/assistant-avatar.png diff --git a/KT-SFT/ktransformers/website/public/images/avatar.png b/kt-sft/ktransformers/website/public/images/avatar.png similarity index 100% rename from KT-SFT/ktransformers/website/public/images/avatar.png rename to kt-sft/ktransformers/website/public/images/avatar.png diff --git a/KT-SFT/ktransformers/website/public/images/bgbg.png b/kt-sft/ktransformers/website/public/images/bgbg.png similarity index 100% rename from KT-SFT/ktransformers/website/public/images/bgbg.png rename to kt-sft/ktransformers/website/public/images/bgbg.png diff --git a/KT-SFT/ktransformers/website/public/images/logo.ico b/kt-sft/ktransformers/website/public/images/logo.ico similarity index 100% rename from KT-SFT/ktransformers/website/public/images/logo.ico rename to kt-sft/ktransformers/website/public/images/logo.ico diff --git a/KT-SFT/ktransformers/website/public/images/logo.png b/kt-sft/ktransformers/website/public/images/logo.png similarity index 100% rename from KT-SFT/ktransformers/website/public/images/logo.png rename to kt-sft/ktransformers/website/public/images/logo.png diff --git a/KT-SFT/ktransformers/website/public/images/three.png b/kt-sft/ktransformers/website/public/images/three.png similarity index 100% rename from KT-SFT/ktransformers/website/public/images/three.png rename to kt-sft/ktransformers/website/public/images/three.png diff --git a/KT-SFT/ktransformers/website/public/images/user-filling.png b/kt-sft/ktransformers/website/public/images/user-filling.png similarity index 100% rename from KT-SFT/ktransformers/website/public/images/user-filling.png rename to kt-sft/ktransformers/website/public/images/user-filling.png diff --git a/KT-SFT/ktransformers/website/public/index.html b/kt-sft/ktransformers/website/public/index.html similarity index 100% rename from KT-SFT/ktransformers/website/public/index.html rename to kt-sft/ktransformers/website/public/index.html diff --git a/KT-SFT/ktransformers/website/src/App.vue b/kt-sft/ktransformers/website/src/App.vue similarity index 100% rename from KT-SFT/ktransformers/website/src/App.vue rename to kt-sft/ktransformers/website/src/App.vue diff --git a/KT-SFT/ktransformers/website/src/api/api-client.ts b/kt-sft/ktransformers/website/src/api/api-client.ts similarity index 100% rename from KT-SFT/ktransformers/website/src/api/api-client.ts rename to kt-sft/ktransformers/website/src/api/api-client.ts diff --git a/KT-SFT/ktransformers/website/src/api/assistant.ts b/kt-sft/ktransformers/website/src/api/assistant.ts similarity index 100% rename from KT-SFT/ktransformers/website/src/api/assistant.ts rename to kt-sft/ktransformers/website/src/api/assistant.ts diff --git a/KT-SFT/ktransformers/website/src/api/message.ts b/kt-sft/ktransformers/website/src/api/message.ts similarity index 100% rename from KT-SFT/ktransformers/website/src/api/message.ts rename to kt-sft/ktransformers/website/src/api/message.ts diff --git a/KT-SFT/ktransformers/website/src/api/run.ts b/kt-sft/ktransformers/website/src/api/run.ts similarity index 100% rename from KT-SFT/ktransformers/website/src/api/run.ts rename to kt-sft/ktransformers/website/src/api/run.ts diff --git a/KT-SFT/ktransformers/website/src/api/thread.ts b/kt-sft/ktransformers/website/src/api/thread.ts similarity index 100% rename from KT-SFT/ktransformers/website/src/api/thread.ts rename to kt-sft/ktransformers/website/src/api/thread.ts diff --git a/KT-SFT/ktransformers/website/src/assets/css/mixins.styl b/kt-sft/ktransformers/website/src/assets/css/mixins.styl similarity index 100% rename from KT-SFT/ktransformers/website/src/assets/css/mixins.styl rename to kt-sft/ktransformers/website/src/assets/css/mixins.styl diff --git a/KT-SFT/ktransformers/website/src/assets/iconfont/demo.css b/kt-sft/ktransformers/website/src/assets/iconfont/demo.css similarity index 100% rename from KT-SFT/ktransformers/website/src/assets/iconfont/demo.css rename to kt-sft/ktransformers/website/src/assets/iconfont/demo.css diff --git a/KT-SFT/ktransformers/website/src/assets/iconfont/demo_index.html b/kt-sft/ktransformers/website/src/assets/iconfont/demo_index.html similarity index 100% rename from KT-SFT/ktransformers/website/src/assets/iconfont/demo_index.html rename to kt-sft/ktransformers/website/src/assets/iconfont/demo_index.html diff --git a/KT-SFT/ktransformers/website/src/assets/iconfont/iconfont.css b/kt-sft/ktransformers/website/src/assets/iconfont/iconfont.css similarity index 100% rename from KT-SFT/ktransformers/website/src/assets/iconfont/iconfont.css rename to kt-sft/ktransformers/website/src/assets/iconfont/iconfont.css diff --git a/KT-SFT/ktransformers/website/src/assets/iconfont/iconfont.js b/kt-sft/ktransformers/website/src/assets/iconfont/iconfont.js similarity index 100% rename from KT-SFT/ktransformers/website/src/assets/iconfont/iconfont.js rename to kt-sft/ktransformers/website/src/assets/iconfont/iconfont.js diff --git a/KT-SFT/ktransformers/website/src/assets/iconfont/iconfont.json b/kt-sft/ktransformers/website/src/assets/iconfont/iconfont.json similarity index 100% rename from KT-SFT/ktransformers/website/src/assets/iconfont/iconfont.json rename to kt-sft/ktransformers/website/src/assets/iconfont/iconfont.json diff --git a/KT-SFT/ktransformers/website/src/assets/iconfont/iconfont.ttf b/kt-sft/ktransformers/website/src/assets/iconfont/iconfont.ttf similarity index 100% rename from KT-SFT/ktransformers/website/src/assets/iconfont/iconfont.ttf rename to kt-sft/ktransformers/website/src/assets/iconfont/iconfont.ttf diff --git a/KT-SFT/ktransformers/website/src/assets/iconfont/iconfont.woff b/kt-sft/ktransformers/website/src/assets/iconfont/iconfont.woff similarity index 100% rename from KT-SFT/ktransformers/website/src/assets/iconfont/iconfont.woff rename to kt-sft/ktransformers/website/src/assets/iconfont/iconfont.woff diff --git a/KT-SFT/ktransformers/website/src/assets/iconfont/iconfont.woff2 b/kt-sft/ktransformers/website/src/assets/iconfont/iconfont.woff2 similarity index 100% rename from KT-SFT/ktransformers/website/src/assets/iconfont/iconfont.woff2 rename to kt-sft/ktransformers/website/src/assets/iconfont/iconfont.woff2 diff --git a/KT-SFT/ktransformers/website/src/components/chat/index.vue b/kt-sft/ktransformers/website/src/components/chat/index.vue similarity index 100% rename from KT-SFT/ktransformers/website/src/components/chat/index.vue rename to kt-sft/ktransformers/website/src/components/chat/index.vue diff --git a/KT-SFT/ktransformers/website/src/conf/config.ts b/kt-sft/ktransformers/website/src/conf/config.ts similarity index 100% rename from KT-SFT/ktransformers/website/src/conf/config.ts rename to kt-sft/ktransformers/website/src/conf/config.ts diff --git a/KT-SFT/ktransformers/website/src/locals/en.js b/kt-sft/ktransformers/website/src/locals/en.js similarity index 100% rename from KT-SFT/ktransformers/website/src/locals/en.js rename to kt-sft/ktransformers/website/src/locals/en.js diff --git a/KT-SFT/ktransformers/website/src/locals/index.js b/kt-sft/ktransformers/website/src/locals/index.js similarity index 100% rename from KT-SFT/ktransformers/website/src/locals/index.js rename to kt-sft/ktransformers/website/src/locals/index.js diff --git a/KT-SFT/ktransformers/website/src/locals/zh.js b/kt-sft/ktransformers/website/src/locals/zh.js similarity index 100% rename from KT-SFT/ktransformers/website/src/locals/zh.js rename to kt-sft/ktransformers/website/src/locals/zh.js diff --git a/KT-SFT/ktransformers/website/src/main.ts b/kt-sft/ktransformers/website/src/main.ts similarity index 100% rename from KT-SFT/ktransformers/website/src/main.ts rename to kt-sft/ktransformers/website/src/main.ts diff --git a/KT-SFT/ktransformers/website/src/router/index.ts b/kt-sft/ktransformers/website/src/router/index.ts similarity index 100% rename from KT-SFT/ktransformers/website/src/router/index.ts rename to kt-sft/ktransformers/website/src/router/index.ts diff --git a/KT-SFT/ktransformers/website/src/shims-vue.d.ts b/kt-sft/ktransformers/website/src/shims-vue.d.ts similarity index 100% rename from KT-SFT/ktransformers/website/src/shims-vue.d.ts rename to kt-sft/ktransformers/website/src/shims-vue.d.ts diff --git a/KT-SFT/ktransformers/website/src/store/index.ts b/kt-sft/ktransformers/website/src/store/index.ts similarity index 100% rename from KT-SFT/ktransformers/website/src/store/index.ts rename to kt-sft/ktransformers/website/src/store/index.ts diff --git a/KT-SFT/ktransformers/website/src/utils/copy.ts b/kt-sft/ktransformers/website/src/utils/copy.ts similarity index 100% rename from KT-SFT/ktransformers/website/src/utils/copy.ts rename to kt-sft/ktransformers/website/src/utils/copy.ts diff --git a/KT-SFT/ktransformers/website/src/utils/types.ts b/kt-sft/ktransformers/website/src/utils/types.ts similarity index 100% rename from KT-SFT/ktransformers/website/src/utils/types.ts rename to kt-sft/ktransformers/website/src/utils/types.ts diff --git a/KT-SFT/ktransformers/website/src/views/home.vue b/kt-sft/ktransformers/website/src/views/home.vue similarity index 100% rename from KT-SFT/ktransformers/website/src/views/home.vue rename to kt-sft/ktransformers/website/src/views/home.vue diff --git a/KT-SFT/ktransformers/website/tests/unit/example.spec.ts b/kt-sft/ktransformers/website/tests/unit/example.spec.ts similarity index 100% rename from KT-SFT/ktransformers/website/tests/unit/example.spec.ts rename to kt-sft/ktransformers/website/tests/unit/example.spec.ts diff --git a/KT-SFT/ktransformers/website/tsconfig.json b/kt-sft/ktransformers/website/tsconfig.json similarity index 100% rename from KT-SFT/ktransformers/website/tsconfig.json rename to kt-sft/ktransformers/website/tsconfig.json diff --git a/KT-SFT/ktransformers/website/vue.config.js b/kt-sft/ktransformers/website/vue.config.js similarity index 100% rename from KT-SFT/ktransformers/website/vue.config.js rename to kt-sft/ktransformers/website/vue.config.js diff --git a/KT-SFT/merge_tensors/merge_safetensor_gguf.py b/kt-sft/merge_tensors/merge_safetensor_gguf.py similarity index 100% rename from KT-SFT/merge_tensors/merge_safetensor_gguf.py rename to kt-sft/merge_tensors/merge_safetensor_gguf.py diff --git a/KT-SFT/pyproject.toml b/kt-sft/pyproject.toml similarity index 100% rename from KT-SFT/pyproject.toml rename to kt-sft/pyproject.toml diff --git a/KT-SFT/requirements-sft.txt b/kt-sft/requirements-sft.txt similarity index 100% rename from KT-SFT/requirements-sft.txt rename to kt-sft/requirements-sft.txt diff --git a/KT-SFT/setup.py b/kt-sft/setup.py similarity index 100% rename from KT-SFT/setup.py rename to kt-sft/setup.py diff --git a/KT-SFT/test_adapter/data_transfer.py b/kt-sft/test_adapter/data_transfer.py similarity index 100% rename from KT-SFT/test_adapter/data_transfer.py rename to kt-sft/test_adapter/data_transfer.py diff --git a/KT-SFT/test_adapter/infer_with_adapter.py b/kt-sft/test_adapter/infer_with_adapter.py similarity index 100% rename from KT-SFT/test_adapter/infer_with_adapter.py rename to kt-sft/test_adapter/infer_with_adapter.py diff --git a/KT-SFT/test_adapter/inspect_adapter.py b/kt-sft/test_adapter/inspect_adapter.py similarity index 100% rename from KT-SFT/test_adapter/inspect_adapter.py rename to kt-sft/test_adapter/inspect_adapter.py diff --git a/KT-SFT/test_adapter/pred2metrics.py b/kt-sft/test_adapter/pred2metrics.py similarity index 100% rename from KT-SFT/test_adapter/pred2metrics.py rename to kt-sft/test_adapter/pred2metrics.py diff --git a/KT-SFT/test_adapter/test_grad.py b/kt-sft/test_adapter/test_grad.py similarity index 90% rename from KT-SFT/test_adapter/test_grad.py rename to kt-sft/test_adapter/test_grad.py index e1010240..21a2cff3 100644 --- a/KT-SFT/test_adapter/test_grad.py +++ b/kt-sft/test_adapter/test_grad.py @@ -1,6 +1,6 @@ import torch, glob -records = sorted(glob.glob("/home/lpl/KT-SFT/tmp/train_logs/step_*.pt")) +records = sorted(glob.glob("/home/lpl/kt-sft/tmp/train_logs/step_*.pt")) example = torch.load(records[1]) # print("step:", example["step"]) diff --git a/KT-SFT/test_adapter/time_test_lora_train.py b/kt-sft/test_adapter/time_test_lora_train.py similarity index 100% rename from KT-SFT/test_adapter/time_test_lora_train.py rename to kt-sft/test_adapter/time_test_lora_train.py diff --git a/KT-SFT/withoutKT_PEFT.py b/kt-sft/withoutKT_PEFT.py similarity index 100% rename from KT-SFT/withoutKT_PEFT.py rename to kt-sft/withoutKT_PEFT.py