Disable cuda malloc by default.

comfyanonymous · Aug 14, 2024 · 50bf66e · 50bf66e · Thireus · Aug 14, 2024
1 parent e60e19b
commit 50bf66e
Show file tree

Hide file tree

Showing 2 changed files with 8 additions and 4 deletions.
diff --git a/comfy/cli_args.py b/comfy/cli_args.py
@@ -51,8 +51,8 @@ def __call__(self, parser, namespace, values, option_string=None):
 parser.add_argument("--disable-auto-launch", action="store_true", help="Disable auto launching the browser.")
 parser.add_argument("--cuda-device", type=int, default=None, metavar="DEVICE_ID", help="Set the id of the cuda device this instance will use.")
 cm_group = parser.add_mutually_exclusive_group()
-cm_group.add_argument("--cuda-malloc", action="store_true", help="Enable cudaMallocAsync (enabled by default for torch 2.0 and up).")
-cm_group.add_argument("--disable-cuda-malloc", action="store_true", help="Disable cudaMallocAsync.")
+cm_group.add_argument("--cuda-malloc", action="store_true", help="Enable cudaMallocAsync.")
+cm_group.add_argument("--disable-cuda-malloc", action="store_true", help="Disable cudaMallocAsync (The current default).")
 
 
 fp_group = parser.add_mutually_exclusive_group()

diff --git a/cuda_malloc.py b/cuda_malloc.py
@@ -2,6 +2,7 @@
 import importlib.util
 from comfy.cli_args import args
 import subprocess
+import logging
 
 #Can't use pytorch to get the GPU names because the cuda malloc has to be set before the first import.
 def get_gpu_names():
@@ -63,7 +64,7 @@ def cuda_malloc_supported():
     return True
 
 
-if not args.cuda_malloc:
+if args.cuda_malloc:
     try:
         version = ""
         torch_spec = importlib.util.find_spec("torch")
@@ -74,8 +75,11 @@ def cuda_malloc_supported():
                 module = importlib.util.module_from_spec(spec)
                 spec.loader.exec_module(module)
                 version = module.__version__
+        supported = False
         if int(version[0]) >= 2: #enable by default for torch version 2.0 and up
-            args.cuda_malloc = cuda_malloc_supported()
+            supported = cuda_malloc_supported()
+        if not supported:
+            logging.warning("WARNING: cuda malloc enabled but not supported.")
     except:
         pass