Merge branch 'upstream' into concedo_experimental

# Conflicts:
#	CMakePresets.json
#	README.md
#	common/CMakeLists.txt
#	ggml/src/ggml-cann/ggml-cann.cpp
#	ggml/src/ggml-opencl/CMakeLists.txt
#	ggml/src/ggml-opencl/ggml-opencl.cpp
#	ggml/src/ggml-sycl/ggml-sycl.cpp
#	scripts/sync-ggml.last
#	tests/test-backend-ops.cpp
#	tools/run/CMakeLists.txt
2025-09-13 10:29:43 +00:00 · 2025-07-13 23:39:41 +08:00 · 2025-07-13 23:39:41 +08:00 · 8cebec5128
commit 8cebec5128
parent 66755c8fe9 923e3ea2e3
41 changed files with 28682 additions and 366 deletions
--- a/src/llama-quant.cpp
+++ b/src/llama-quant.cpp
@@ -847,6 +847,7 @@ static void llama_model_quantize_impl(const std::string & fname_inp, const std::
        // do not quantize Mamba's small yet 2D weights
        // NOTE: can't use LLM_TN here because the layer number is not known
        quantize &= name.find("ssm_conv1d.weight") == std::string::npos;
+        quantize &= name.find("shortconv.conv.weight") == std::string::npos;

        // do not quantize RWKV's small yet 2D weights
        quantize &= name.find("time_mix_first.weight") == std::string::npos;