koboldcpp

mirror of https://github.com/LostRuins/koboldcpp.git synced 2026-05-19 16:31:59 +00:00

History

Concedo a165a73120 Merge commit '`d6f3030047`' into concedo_experimental # Conflicts: # examples/model-conversion/scripts/causal/run-casual-gen-embeddings-org.py # examples/model-conversion/scripts/utils/semantic_check.py # ggml/CMakeLists.txt # ggml/src/CMakeLists.txt # ggml/src/ggml-cann/ggml-cann.cpp # ggml/src/ggml-cpu/amx/amx.cpp # ggml/src/ggml-cuda/CMakeLists.txt # ggml/src/ggml-hexagon/ggml-hexagon.cpp # ggml/src/ggml-hip/CMakeLists.txt # ggml/src/ggml-opencl/ggml-opencl.cpp # ggml/src/ggml-openvino/ggml-openvino.cpp # ggml/src/ggml-rpc/ggml-rpc.cpp # ggml/src/ggml-sycl/ggml-sycl.cpp # ggml/src/ggml-virtgpu/ggml-backend-buffer.cpp # ggml/src/ggml-virtgpu/ggml-backend.cpp # ggml/src/ggml-webgpu/ggml-webgpu.cpp # ggml/src/ggml-zdnn/ggml-zdnn.cpp # ggml/src/ggml-zendnn/ggml-zendnn.cpp # pyproject.toml # requirements/requirements-convert_legacy_llama.txt # requirements/requirements-tool_bench.txt # src/llama-model.cpp # src/llama.cpp # tests/test-llama-archs.cpp # tests/test-tokenizer-0.py # tests/test-tokenizer-random.py # tools/llama-bench/llama-bench.cpp # tools/perplexity/perplexity.cpp		2026-04-11 11:10:55 +08:00
..
ggml-alloc.h	llama: automatically set parameters not set by the user in such a way that maximizes GPU utilization (#16653 )	2025-12-15 09:24:59 +01:00
ggml-backend.h	ggml: backend-agnostic tensor parallelism (experimental) (#19378 )	2026-04-09 16:42:19 +02:00
ggml-blas.h	ggml : build backends as libraries (#10256 )	2024-11-14 18:04:35 +01:00
ggml-cpp.h	ggml : fix ggml_gallocr_ptr type (ggml/1205)	2025-05-01 09:58:44 +03:00
ggml-cpu.h	ggml-cpu: FA split across kv for faster TG (#19209 )	2026-02-03 01:19:55 +08:00
ggml-cuda.h	Merge commit '`d6f3030047`' into concedo_experimental	2026-04-11 11:10:55 +08:00
ggml-hexagon.h	Add experimental ggml-hexagon backend for the Hexagon NPU (#16547 )	2025-10-22 13:47:09 -07:00
ggml-metal.h	not sure if working on metal	2025-09-21 11:35:02 +08:00
ggml-opencl.h	Introducing experimental OpenCL backend with support for Qualcomm Adreno GPUs (#10693 )	2024-12-13 12:23:52 -08:00
ggml-openvino.h	ggml : add OpenVINO backend (#15307 )	2026-03-14 07:56:55 +02:00
ggml-opt.h	chore : correct typos [no ci] (#20041 )	2026-03-05 08:50:21 +01:00
ggml-rpc.h	ggml : bump RPC version (#20330 )	2026-03-10 21:36:57 +02:00
ggml-virtgpu.h	ggml-virtgpu: make the code thread safe (#19204 )	2026-02-04 10:46:18 +08:00
ggml-vulkan.h	vulkan: Make Vulkan optional at runtime (#11493 ). (#11494 )	2025-02-10 07:17:21 +01:00
ggml-zendnn.h	ggml-zendnn : add ZenDNN backend for AMD CPUs (#17690 )	2025-12-07 00:13:33 +08:00
ggml.h	Merge commit '`de1aa6fa73`' into concedo_experimental	2026-04-09 17:16:33 +08:00
gguf.h	llama: fix llama-model-saver (#20503 )	2026-03-25 12:53:16 +02:00