fix compute_buffer estimate: add context GPU usage

This commit is contained in:
Li, Zonghang 2025-06-24 16:09:59 +04:00
parent c926088d6a
commit 16ba3564ce
2 changed files with 16 additions and 12 deletions

View file

@@ -986,7 +986,7 @@ static bool assign_layers_to_device(
if ((is_macos && !dev.gpu_support.metal) || is_linux) {
mem_budget[m] = dev.memory.available_physical;
} else if (is_macos && dev.gpu_support.metal) {
-mem_budget[m] = dev.gpu_props.memory_free;
+mem_budget[m] = dev.gpu_props.memory_free + 1e-4; // to avoid division by zero
} else if (is_android) {
mem_budget[m] = dev.memory.available_physical + dev.memory.used_can_swap;
} else {