diff --git a/comfy/model_management.py b/comfy/model_management.py
index c97bfcff..ff7cbeb0 100644
--- a/comfy/model_management.py
+++ b/comfy/model_management.py
@@ -13,16 +13,22 @@ total_vram_available_mb = -1
 import sys
 
 set_vram_to = NORMAL_VRAM
+
+try:
+    import torch
+    total_vram = torch.cuda.mem_get_info(torch.cuda.current_device())[1] / (1024 * 1024)
+    if total_vram <= 4096 and not "--normalvram" in sys.argv:
+        print("Trying to enable lowvram mode because your GPU seems to have 4GB or less. If you don't want this use: --normalvram")
+        set_vram_to = LOW_VRAM
+except:
+    pass
+
 if "--lowvram" in sys.argv:
     set_vram_to = LOW_VRAM
 if "--novram" in sys.argv:
     set_vram_to = NO_VRAM
 
-try:
-    import torch
-    total_vram = torch.cuda.mem_get_info(torch.cuda.current_device())[1] / (1024 * 1024)
-except:
-    pass
+
 
 if set_vram_to != NORMAL_VRAM:
     try:
diff --git a/main.py b/main.py
index 0f466a3f..666193b6 100644
--- a/main.py
+++ b/main.py
@@ -14,6 +14,7 @@ if __name__ == "__main__":
         print("\t--dont-upcast-attention\t\tDisable upcasting of attention \n\t\t\t\t\tcan boost speed but increase the chances of black images.\n")
         print("\t--use-split-cross-attention\tUse the split cross attention optimization instead of the sub-quadratic one.\n\t\t\t\t\tIgnored when xformers is used.")
         print()
+        print("\t--normalvram\t\t\tUsed to force normal vram use if lowvram gets automatically enabled.")
         print("\t--lowvram\t\t\tSplit the unet in parts to use less vram.")
         print("\t--novram\t\t\tWhen lowvram isn't enough.")
         print()