diff --git a/modules_forge/main_entry.py b/modules_forge/main_entry.py
index e300a5fd..2492fc53 100644
--- a/modules_forge/main_entry.py
+++ b/modules_forge/main_entry.py
@@ -182,9 +182,7 @@ def refresh_memory_management_settings(model_memory, async_loading, pin_shared_m
 
     print(f'Environment vars changed: {log_dict}')
 
-    compute_percentage = (inference_memory / total_vram) * 100.0
-
-    if compute_percentage < 5:
+    if inference_memory < min(512, total_vram * 0.05):
         print('------------------')
         print(f'[Low VRAM Warning] You just set Forge to use 100% GPU memory ({model_memory:.2f} MB) to load model weights.')
         print('[Low VRAM Warning] This means you will have 0% GPU memory (0.00 MB) to do matrix computation. Computations may fallback to CPU or go Out of Memory.')
@@ -194,6 +192,7 @@ def refresh_memory_management_settings(model_memory, async_loading, pin_shared_m
         print('[Low VRAM Warning] Make sure that you know what you are testing.')
         print('------------------')
     else:
+        compute_percentage = (inference_memory / total_vram) * 100.0
         print(f'[GPU Setting] You will use {(100 - compute_percentage):.2f}% GPU memory ({model_memory:.2f} MB) to load weights, and use {compute_percentage:.2f}% GPU memory ({inference_memory:.2f} MB) to do matrix computation.')
 
     processing.need_global_unload = True