mirror of
https://github.com/Lizonghang/prima.cpp.git
synced 2025-09-04 22:09:04 +00:00
add args -k and --force
This commit is contained in:
parent
bcfdace59b
commit
63b45a4c26
2 changed files with 3 additions and 1 deletion
|
@@ -1012,7 +1012,7 @@ static bool assign_layers_to_device(
|
|||
};
|
||||
|
||||
// get valid factors
|
||||
std::vector<int> valid_k = cparams.n_cycles > 0 ? {(int)cparams.n_cycles} : find_factors(n_layer);
|
||||
std::vector<int> valid_k = cparams.n_cycles > 0 ? std::vector<int>{cparams.n_cycles} : find_factors(n_layer);
|
||||
|
||||
// assign devices to sets M1, M2, M3, and M4
|
||||
// M1: devices running on macOS without Metal, and with insufficient memory
|
||||
|
|
|
@@ -2574,6 +2574,7 @@ struct llama_cparams {
|
|||
uint32_t rank;
|
||||
uint32_t n_layer_window[32];
|
||||
bool prefetch;
|
||||
bool force;
|
||||
uint32_t n_ctx; // context size used during inference
|
||||
uint32_t n_batch;
|
||||
uint32_t n_ubatch;
|
||||
|
@@ -20343,6 +20344,7 @@ struct llama_context * llama_new_context_with_model(
|
|||
ctx->next_node_ip = params.next_node_ip;
|
||||
ctx->cparams.n_world = params.n_world;
|
||||
ctx->cparams.rank = params.rank;
|
||||
ctx->cparams.force = params.force;
|
||||
return ctx;
|
||||
}
|
||||
|
||||
|
|
Loading…
Add table
Reference in a new issue