Merge branch 'master' into concedo_experimental

# Conflicts: # .github/workflows/nix-ci.yml # CMakeLists.txt # Makefile # ggml-cuda.cu # ggml-opencl.cpp # llama.cpp
2025-09-11 01:24:36 +00:00 · 2024-01-20 23:27:42 +08:00 · 2024-01-20 23:27:42 +08:00 · 71e9a64171
commit 71e9a64171
parent 425849f387 d9aa4ffa6e
43 changed files with 6540 additions and 3500 deletions
--- a/examples/main/main.cpp
+++ b/examples/main/main.cpp
@ -478,6 +478,7 @@ int main(int argc, char ** argv) {

    bool is_antiprompt        = false;
    bool input_echo           = true;
+    bool display              = true;
    bool need_to_save_session = !path_session.empty() && n_matching_session_tokens < embd_inp.size();

    int n_past             = 0;
@ -492,6 +493,7 @@ int main(int argc, char ** argv) {

    // the first thing we will do is to output the prompt, so set color accordingly
    console::set_display(console::prompt);
+    display = params.display_prompt;

    std::vector<llama_token> embd;
    std::vector<llama_token> embd_guidance;
@ -708,7 +710,7 @@ int main(int argc, char ** argv) {
        }

        // display text
-        if (input_echo) {
+        if (input_echo && display) {
            for (auto id : embd) {
                const std::string token_str = llama_token_to_piece(ctx, id);
                printf("%s", token_str.c_str());
@ -725,6 +727,7 @@ int main(int argc, char ** argv) {
        // reset color to default if there is no pending user input
        if (input_echo && (int) embd_inp.size() == n_consumed) {
            console::set_display(console::reset);
+            display = true;
        }

        // if not currently processing queued inputs;
@ -797,6 +800,7 @@ int main(int argc, char ** argv) {

                // color user input only
                console::set_display(console::user_input);
+                display = params.display_prompt;

                std::string line;
                bool another_line = true;
@ -807,6 +811,7 @@ int main(int argc, char ** argv) {

                // done taking input, reset color
                console::set_display(console::reset);
+                display = true;

                // Add tokens to embd only if the input buffer is non-empty
                // Entering a empty line lets the user pass control back