mirror of
https://github.com/Lizonghang/prima.cpp.git
synced 2025-09-10 04:54:34 +00:00
Use the `prefetch` argument and remove the `unload` argument
This commit is contained in:
parent
708b1d8c89
commit
c84f9d29fe
5 changed files with 15 additions and 19 deletions
|
@ -322,7 +322,7 @@ extern "C" {
|
|||
uint32_t rank; // my rank
|
||||
uint32_t n_layer_window[32];// number of layers to process in each compute
|
||||
uint32_t n_gpu_layers; // number of layers to process on GPU
|
||||
bool unload; // whether to unload layer weights after use
|
||||
bool prefetch; // whether to prefetch layer weights
|
||||
bool keep_out_in_metal; // whether to keep output weights in metal memory
|
||||
char * master_ip; // ip address of the master node
|
||||
char * next_node_ip; // ip address of the next node
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue