diff --git a/common/profiler.cpp b/common/profiler.cpp
index 96a1c701..550092b8 100644
--- a/common/profiler.cpp
+++ b/common/profiler.cpp
@@ -521,9 +521,9 @@ static uint64_t device_host_physical_memory(bool available) {
             // active pages compression has higher priority than releasing the clean mmap-ed pages
             // some of the active pages can be compressed to save memory for our mmap-ed model weights
             if (is_uma_arch()) {
-                // assume 30% of active pages can be compressed on macOS UMA (an empirical value) 
+                // assume 10% of active pages can be compressed on macOS UMA (an empirical value) 
                 // because GPU is more likely to use the inactive memory
-                memory += vm_stats.active_count * 0.3 * page_size;
+                memory += vm_stats.active_count * 0.1 * page_size;
             } else {
                 // assume 50% of active pages can be compressed on macOS NUMA (an empirical value)
                 memory += vm_stats.active_count * 0.5 * page_size;