mirror of
https://github.com/Lizonghang/prima.cpp.git
synced 2025-09-06 14:39:03 +00:00
fix bugs in available_mem calculation
This commit is contained in:
parent
64c4a47980
commit
e64f237e04
1 changed file with 5 additions and 1 deletion
|
@ -1433,6 +1433,10 @@ static bool assign_layers_to_device(
|
|||
if (dev.gpu_support.cuda || dev.gpu_support.metal) {
|
||||
int64_t required_mem = w[m] * b_prime;
|
||||
int64_t available_mem = dev.gpu_props.memory_free * GIGABYTE - c_gpu[m];
|
||||
if (dev.gpu_support.metal && m == 0 && cparams.keep_out_in_metal) {
|
||||
available_mem -= bo;
|
||||
}
|
||||
|
||||
if (required_mem <= available_mem) {
|
||||
n_gpu_layers[m] = w[m];
|
||||
} else {
|
||||
|
|
Loading…
Add table
Reference in a new issue