re-added smart context due to people complaining

2025-09-10 17:14:36 +00:00 · 2024-05-11 17:25:03 +08:00 · 2024-05-11 17:25:03 +08:00 · eff01660e4
commit eff01660e4
parent 702be65ed1
3 changed files with 20 additions and 8 deletions
--- a/gpttype_adapter.cpp
+++ b/gpttype_adapter.cpp
@@ -92,6 +92,7 @@ static int current_llava_identifier = LLAVA_TOKEN_IDENTIFIER_A;
 static gpt_params * kcpp_params = nullptr;
 static int max_context_limit_at_load = 0;
 static int n_past = 0;
+static bool useSmartContext = false;
 static bool useContextShift = false;
 static int debugmode = 0; //-1 = hide all, 0 = normal, 1 = showall
 static std::string modelname;
@@ -786,6 +787,7 @@ ModelLoadResult gpttype_load_model(const load_model_inputs inputs, FileFormat in
    }
    kcpp_params->flash_attn = inputs.flash_attention;
    modelname = kcpp_params->model = inputs.model_filename;
+    useSmartContext = inputs.use_smartcontext;
    useContextShift = inputs.use_contextshift;
    debugmode = inputs.debugmode;

@@ -1939,7 +1941,7 @@ generation_outputs gpttype_generate(const generation_inputs inputs)
    }
    else
    {
-        bool triggersc = useContextShift;
+        bool triggersc = useSmartContext;
        if(useContextShift && (file_format == FileFormat::GGUF_GENERIC))
        {
            PurgeMissingTokens(llama_ctx_v4, current_context_tokens, embd_inp, inputs.max_length, nctx);