add args -k and --force

2025-09-04 22:09:04 +00:00 · 2025-03-11 22:09:39 +04:00 · 2025-03-11 22:09:39 +04:00 · 63b45a4c26
commit 63b45a4c26
parent bcfdace59b
2 changed files with 3 additions and 1 deletions
--- a/common/common.cpp
+++ b/common/common.cpp
@@ -1012,7 +1012,7 @@ static bool assign_layers_to_device(
    };

    // get valid factors
-    std::vector<int> valid_k = cparams.n_cycles > 0 ? {(int)cparams.n_cycles} : find_factors(n_layer);
+    std::vector<int> valid_k = cparams.n_cycles > 0 ? std::vector<int>{cparams.n_cycles} : find_factors(n_layer);

    // assign devices to sets M1, M2, M3, and M4
    // M1: devices running on macOS without Metal, and with insufficient memory
--- a/src/llama.cpp
+++ b/src/llama.cpp
@@ -2574,6 +2574,7 @@ struct llama_cparams {
    uint32_t  rank;
    uint32_t  n_layer_window[32];
    bool      prefetch;
+    bool      force;
    uint32_t  n_ctx;           // context size used during inference
    uint32_t  n_batch;
    uint32_t  n_ubatch;
@@ -20343,6 +20344,7 @@ struct llama_context * llama_new_context_with_model(
    ctx->next_node_ip    = params.next_node_ip;
    ctx->cparams.n_world = params.n_world;
    ctx->cparams.rank    = params.rank;
+    ctx->cparams.force   = params.force;
    return ctx;
 }