mirror of
https://github.com/kvcache-ai/ktransformers.git
synced 2026-04-28 11:49:51 +00:00
* refactor: move legacy code to archive/ directory
  - Moved ktransformers, csrc, third_party, merge_tensors to archive/
  - Moved build scripts and configurations to archive/
  - Kept kt-kernel, KT-SFT, doc, and README files in root
  - Preserved complete git history for all moved files
* refactor: restructure repository to focus on kt-kernel and KT-SFT modules
* fix README
* fix README
* fix README
* fix README
* docs: add performance benchmarks to kt-kernel section
  Add comprehensive performance data for kt-kernel to match KT-SFT's presentation:
  - AMX kernel optimization: 21.3 TFLOPS (3.9× faster than PyTorch)
  - Prefill phase: up to 20× speedup vs baseline
  - Decode phase: up to 4× speedup
  - NUMA optimization: up to 63% throughput improvement
  - Multi-GPU (8×L20): 227.85 tokens/s total throughput with DeepSeek-R1 FP8
  Source: https://lmsys.org/blog/2025-10-22-KTransformers/
  This provides users with concrete performance metrics for both core modules, making it easier to understand the capabilities of each component.
* refactor: improve kt-kernel performance data with specific hardware and models
  Replace generic performance descriptions with concrete benchmarks:
  - Specify exact hardware: 8×L20 GPU + Xeon Gold 6454S, Single/Dual-socket Xeon + AMX
  - Include specific models: DeepSeek-R1-0528 (FP8), DeepSeek-V3 (671B)
  - Show detailed metrics: total throughput, output throughput, concurrency details
  - Match KT-SFT presentation style for consistency
  This provides users with actionable performance data they can use to evaluate hardware requirements and expected performance for their use cases.
* fix README
* docs: clean up performance table and improve formatting
* add pic for README
* refactor: simplify .gitmodules and backup legacy submodules
  - Remove 7 legacy submodules from root .gitmodules (archive/third_party/*)
  - Keep only 2 active submodules for kt-kernel (llama.cpp, pybind11)
  - Backup complete .gitmodules to archive/.gitmodules
  - Add documentation in archive/README.md for researchers who need legacy submodules
  This reduces initial clone size by ~500MB and avoids downloading unused dependencies.
* refactor: move doc/ back to root directory
  Keep documentation in root for easier access and maintenance.
* refactor: consolidate all images to doc/assets/
  - Move kt-kernel/assets/heterogeneous_computing.png to doc/assets/
  - Remove KT-SFT/assets/ (images already in doc/assets/)
  - Update KT-SFT/README.md image references to ../doc/assets/
  - Eliminates ~7.9MB image duplication
  - Centralizes all documentation assets in one location
* fix pic path for README
61 lines
1.7 KiB
JSON
61 lines
1.7 KiB
JSON
{
  "name": "",
  "version": "",
  "private": true,
  "scripts": {
    "serve": "vue-cli-service serve",
    "build": "vue-cli-service build",
    "test:unit": "vue-cli-service test:unit",
    "lint": "vue-cli-service lint"
  },
  "dependencies": {
    "@types/pdfjs-dist": "^2.10.378",
    "@types/websocket": "^1.0.10",
    "@vue/cli": "^5.0.8",
    "ant-design-vue": "^4.2.1",
    "apexcharts": "^3.49.1",
    "axios": "^1.7.0",
    "axios-extensions": "^3.1.6",
    "better-scroll": "^2.5.1",
    "element-plus": "^2.7.3",
    "marked": "^12.0.2",
    "marked-highlight": "^2.1.1",
    "pdf-lib": "^1.17.1",
    "pdfobject": "^2.3.0",
    "v-clipboard": "^3.0.0-next.1",
    "vue": "^3.4.27",
    "vue-i18n": "^9.13.1",
    "vue-pdf": "^4.3.0",
    "vue-router": "^4.0.3",
    "vue3-apexcharts": "^1.5.3",
    "vuex": "^4.0.0",
    "webpack": "^5.91.0",
    "webpack-cli": "^5.1.4",
    "websocket": "^1.0.35"
  },
  "devDependencies": {
    "@types/jest": "^27.0.1",
    "@types/pdfobject": "^2.2.5",
    "@typescript-eslint/eslint-plugin": "^5.4.0",
    "@typescript-eslint/parser": "^5.4.0",
    "@vue/cli-plugin-eslint": "~5.0.0",
    "@vue/cli-plugin-router": "~5.0.0",
    "@vue/cli-plugin-typescript": "~5.0.0",
    "@vue/cli-plugin-unit-jest": "~5.0.0",
    "@vue/cli-plugin-vuex": "~5.0.0",
    "@vue/cli-service": "~5.0.0",
    "@vue/eslint-config-typescript": "^9.1.0",
    "@vue/test-utils": "^2.0.0-0",
    "@vue/vue3-jest": "^27.0.0-alpha.1",
    "babel-jest": "^27.0.6",
    "eslint": "^7.32.0",
    "eslint-plugin-vue": "^8.0.3",
    "jest": "^27.0.5",
    "stylus": "^0.55.0",
    "stylus-loader": "^6.1.0",
    "ts-jest": "^27.0.4",
    "typescript": "~4.5.5"
  },
  "_id": "@",
  "readme": "ERROR: No README data found!"
}