Merge branch 'upstream' into concedo_experimental

# Conflicts:
#	README.md
2025-09-11 09:34:37 +00:00 · 2024-04-25 18:09:12 +08:00 · 2024-04-25 18:09:12 +08:00 · b56805a2ba
commit b56805a2ba
parent cb2dbe9e9a 784e11dea1
3 changed files with 10 additions and 4 deletions
--- a/common/common.h
+++ b/common/common.h
@@ -82,8 +82,8 @@ struct gpt_params {
    ggml_numa_strategy numa = GGML_NUMA_STRATEGY_DISABLED;
-    llama_rope_scaling_type rope_scaling_type = LLAMA_ROPE_SCALING_TYPE_UNSPECIFIED;
+    enum llama_rope_scaling_type rope_scaling_type = LLAMA_ROPE_SCALING_TYPE_UNSPECIFIED;
-    llama_pooling_type      pooling_type      = LLAMA_POOLING_TYPE_UNSPECIFIED; // pooling type for embeddings
+    enum llama_pooling_type      pooling_type      = LLAMA_POOLING_TYPE_UNSPECIFIED; // pooling type for embeddings
    // sampling parameters
    int32_t top_k             = 40;    // <= 0 to use vocab size
--- a/llama.cpp
+++ b/llama.cpp
@@ -15904,6 +15904,10 @@ enum llama_rope_type llama_rope_type(const struct llama_model * model) {
    return LLAMA_ROPE_TYPE_NONE;
 }
 enum llama_pooling_type llama_pooling_type(const struct llama_context * ctx) {
    return ctx->cparams.pooling_type;
 }
 int32_t llama_n_vocab(const struct llama_model * model) {
    return model->hparams.n_vocab;
 }
--- a/llama.h
+++ b/llama.h
@@ -390,7 +390,9 @@ extern "C" {
    LLAMA_API uint32_t llama_n_ubatch   (const struct llama_context * ctx);
    LLAMA_API uint32_t llama_n_seq_max  (const struct llama_context * ctx);
-    LLAMA_API enum llama_vocab_type llama_vocab_type(const struct llama_model * model);
+    LLAMA_API enum llama_pooling_type llama_pooling_type(const struct llama_context * ctx);
    LLAMA_API enum llama_vocab_type   llama_vocab_type  (const struct llama_model   * model);
    LLAMA_API enum llama_rope_type    llama_rope_type   (const struct llama_model   * model);
    LLAMA_API int32_t llama_n_vocab    (const struct llama_model * model);