modal-labs · kning · Nov 15, 2024 · Nov 14, 2024 · Nov 14, 2024
diff --git a/06_gpu_and_ml/comfyui/comfyapp.py b/06_gpu_and_ml/comfyui/comfyapp.py
@@ -5,19 +5,15 @@
 #
 # # Run Flux on ComfyUI interactively and as an API
 #
-# [ComfyUI](https://github.com/comfyanonymous/ComfyUI) is an open-source Stable Diffusion GUI with a graph/nodes based interface that allows you to design and execute advanced image generation pipelines.
+# [ComfyUI](https://github.com/comfyanonymous/ComfyUI) is an open-source diffusion model platform with a graph/nodes interface that allows you to design and execute advanced image generation pipelines.
 
-# Flux is a family of cutting-edge text-to-image models created by [black forest labs](https://huggingface.co/black-forest-labs), rapidly gaining popularity due to their exceptional image quality.
 #
 # In this example, we show you how to
 #
-# 1. run Flux on ComfyUI interactively to develop workflows
+# 1. run the [Flux](https://huggingface.co/docs/diffusers/main/en/api/pipelines/flux) diffusion model on ComfyUI interactively to develop workflows
 #
 # 2. serve a Flux ComfyUI workflow as an API
 #
-# Combining the UI and the API in a single app makes it easy to iterate on your workflow even after deployment.
-# Simply head to the interactive UI, make your changes, export the JSON, and redeploy the app.
-#
 # ## Quickstart
 #
 # This example runs `workflow_api.json` in this directory, which is an adaptation of [this simple FLUX.1-schnell workflow](https://openart.ai/workflows/reverentelusarca/flux-simple-workflow-schnell/40OkdaB23J2TMTXHmxxu) with an Image Resize custom node added at the end.
@@ -28,13 +24,17 @@
 # ![example comfyui image](./flux_gen_image.jpeg)
 #
 # To serve the workflow in this example as an API:
-# 1. Stand up the ComfyUI server in development mode:
+# 1. Download the Flux models to a Modal [Volume](/docs/guide/volumes):
+# ```bash
+# modal run 06_gpu_and_ml/comfyui/comfyapp.py::download_models
+# ```
+#
+# 2. Stand up the ComfyUI server in development mode:
 # ```bash
 # modal serve 06_gpu_and_ml/comfyui/comfyapp.py
 # ```
-# Note: if you're running this for the first time, it will take several minutes to build the image, since we have to download the Flux models (>20GB) to the container. Successive calls will reuse this prebuilt image.
 #
-# 2. In another terminal, run inference:
+# 3. In another terminal, run inference:
 # ```bash
 # python 06_gpu_and_ml/comfyui/comfyclient.py --dev --modal-workspace $(modal profile current) --prompt "neon green sign that says Modal"
 # ```
@@ -54,9 +54,6 @@
 
 # ### Building up the environment
 #
-# ComfyUI setups can be complex, with a lot of custom nodes and models to manage.
-# We'll use [`comfy-cli`](https://github.com/Comfy-Org/comfy-cli) to manage the installation of ComfyUI, its dependencies, models, and custom nodes.
-#
 # We start from a base image and specify all of our dependencies.
 # We'll call out the interesting ones as they come up below.
 #
@@ -76,70 +73,81 @@
         "comfy --skip-prompt install --nvidia"
     )
 )
-
-# #### Downloading models
-#
-# We'll download the Flux models using `comfy-cli`.
-# ComfyUI will look for these models in the `models` subdirectory under specific subdirectories
-# (e.g. `vae`, `unet`, `clip`, etc.), so we need to download them into the correct location.
-#
-# You can run multiple commands using comma separated commands in `.run_commands()`.
-# But here we opt to split them up to allow for more granular layer caching in the Modal Image.
-# By appending a model install using `.run_commands(...)` at the end of this build step we ensure
-# that the previous steps remain un-changed and will be cached, avoiding unnecessary re-runs.
-
+# ### Downloading custom nodes
+# We'll use `comfy-cli` to download custom nodes, in this case the popular WAS Node Suite pack.
 image = (
-    image.run_commands(
-        "comfy --skip-prompt model download --url https://huggingface.co/comfyanonymous/flux_text_encoders/resolve/main/t5xxl_fp8_e4m3fn.safetensors --relative-path models/clip"
-    )
-    .run_commands(
-        "comfy --skip-prompt model download --url https://huggingface.co/comfyanonymous/flux_text_encoders/resolve/main/clip_l.safetensors --relative-path models/clip"
-    )
-    .run_commands(
-        "comfy --skip-prompt model download --url https://huggingface.co/black-forest-labs/FLUX.1-schnell/resolve/main/ae.safetensors --relative-path models/vae"
-    )
-    .run_commands(
-        "comfy --skip-prompt model download --url https://huggingface.co/black-forest-labs/FLUX.1-schnell/resolve/main/flux1-schnell.safetensors --relative-path models/unet"
+    image.run_commands(  # download a custom node
+        "comfy node install was-node-suite-comfyui"
     )
-    # Add .run_commands(...) calls for any other models you want to download
+    # Add .run_commands(...) calls for any other custom nodes you want to download
 )
 
-# To download gated models that require a Hugging Face token (e.g. Flux Dev), add `--set-hf-api-token=<your_token>` to your `comfy model download` command.
+# See [this post](/blog/comfyui-custom-nodes) for more on how to install custom nodes on Modal.
+# ### Downloading models
 
-# #### Downloading custom nodes
-#
-# We'll download custom nodes using `comfy-cli` too.
-# Alternatively, you can install them by cloning the git repositories to your `/root/comfy/ComfyUI/custom_nodes`
-# directory and installing the required dependencies manually.
-#
-# Similarly to models, we opt to split the custom node installation into separate `.run_commands(...)` calls
-# to allow for more granular layer caching.
+# You can also use `comfy-cli` to download models, but for this example we'll download the Flux models directly from Hugging Face into a Modal Volume.
+# Then on container start, we'll mount our models into the ComfyUI models directory.
+# This allows us to avoid re-downloading the models every time we rebuild the image.
 
 image = (
-    image.run_commands(  # download a custom node
-        "comfy node install image-resize-comfyui"
+    # install huggingface_hub with hf_transfer support to speed up downloads
+    image.pip_install("huggingface_hub[hf_transfer]==0.26.2")
+    .env({"HF_HUB_ENABLE_HF_TRANSFER": "1"})
+    .run_commands(  # needs to be empty for Volume mount to work
+        "rm -rf /root/comfy/ComfyUI/models"
     )
-    # Add .run_commands(...) calls for any other custom nodes you want to download
 )
 
-# #### Adding more dependencies
+# We create the app and specify the image we built above.
+
+app = modal.App(name="example-comfyui", image=image)
+
 #
-# To add more dependencies, models or custom nodes without having to rebuild the entire image
-# it's recommended to append them at the end of your image build rather than modifying previous steps.
-# This allows you to cache all previous steps and only build the new steps when you make changes to the image.
+# First we need to run a function to download the Flux models to a Modal Volume.
 
-image = (
-    image  # Add any additional steps here
-    # .run_commands(...)
-    # .pip_install(...)
-    # .apt_install(...)
+vol = modal.Volume.from_name("comfyui-models", create_if_missing=True)
+
+
+@app.function(
+    volumes={"/root/models": vol},
 )
+def hf_download(repo_id: str, filename: str, model_type: str):
+    from huggingface_hub import hf_hub_download
 
-# #### Create the app
-#
-# We create the app and specify the image we built above.
+    hf_hub_download(
+        repo_id=repo_id,
+        filename=filename,
+        local_dir=f"/root/models/{model_type}",
+    )
 
-app = modal.App(name="example-comfyui", image=image)
+
+# We can kick off the model downloads in parallel using [`starmap`](/docs/reference/modal.Function#starmap).
+@app.local_entrypoint()
+def download_models():
+    models_to_download = [
+        # format is (huggingface repo_id, the model filename, comfyui models subdirectory we want to save the model in)
+        (
+            "black-forest-labs/FLUX.1-schnell",
+            "ae.safetensors",
+            "vae",
+        ),
+        (
+            "black-forest-labs/FLUX.1-schnell",
+            "flux1-schnell.safetensors",
+            "unet",
+        ),
+        (
+            "comfyanonymous/flux_text_encoders",
+            "t5xxl_fp8_e4m3fn.safetensors",
+            "clip",
+        ),
+        ("comfyanonymous/flux_text_encoders", "clip_l.safetensors", "clip"),
+    ]
+    list(hf_download.starmap(models_to_download))
+
+
+# To run the download step, run `modal run 06_gpu_and_ml/comfyui/comfyapp.py::download_models`.
+# By leveraging [hf_transfer](https://huggingface.co/docs/huggingface_hub/en/guides/download#faster-downloads), Modal's `starmap` for parallelism, and Volumes, image build time drops from ~10 minutes to ~25 seconds.
 
 # ## Running ComfyUI interactively and as an API on Modal
 #
@@ -152,6 +160,7 @@
     container_idle_timeout=30,
     timeout=1800,
     gpu="A10G",
+    volumes={"/root/comfy/ComfyUI/models": vol},
 )
 @modal.web_server(8000, startup_timeout=60)
 def ui():
@@ -179,6 +188,7 @@ def ui():
             "/root/workflow_api.json",
         ),
     ],
+    volumes={"/root/comfy/ComfyUI/models": vol},
 )
 class ComfyUI:
     @modal.enter()
@@ -247,6 +257,6 @@ def api(self, item: Dict):
 # Then, redeploy the app with this new workflow by running `modal deploy 06_gpu_and_ml/comfyui/comfyapp.py` again.
 #
 # ## Further optimizations
-# - To decrease inference latency, you can process multiple inputs in parallel by setting `allow_concurrent_inputs=1`, which will run each input on its own container. This will reduce overall response time, but will cost you more money. See our [Scaling ComfyUI](https://modal.com/blog/scaling-comfyui) blog post for more details.
+# - To decrease inference latency, you can process multiple inputs in parallel by setting `allow_concurrent_inputs=1`, which will run each input on its own container. See our [Scaling ComfyUI](https://modal.com/blog/scaling-comfyui) blog post for more details.
 # - If you're noticing long startup times for the ComfyUI server (e.g. >30s), this is likely due to too many custom nodes being loaded in. Consider breaking out your deployments into one App per unique combination of models and custom nodes.
 # - For those who prefer to run a ComfyUI workflow directly as a Python script, see [this blog post](https://modal.com/blog/comfyui-prototype-to-production).
diff --git a/06_gpu_and_ml/comfyui/workflow_api.json b/06_gpu_and_ml/comfyui/workflow_api.json
@@ -33,7 +33,7 @@
   "9": {
     "inputs": {
       "filename_prefix": "ComfyUI",
-      "images": ["26", 0]
+      "images": ["28", 0]
     },
     "class_type": "SaveImage",
     "_meta": {
@@ -116,37 +116,35 @@
   },
   "25": {
     "inputs": {
-      "noise_seed": 857914953840122
+      "noise_seed": 229383932224230
     },
     "class_type": "RandomNoise",
     "_meta": {
       "title": "RandomNoise"
     }
   },
-  "26": {
+  "27": {
     "inputs": {
-      "action": "crop to ratio",
-      "smaller_side": 0,
-      "larger_side": 0,
-      "scale_factor": 2,
-      "resize_mode": "any",
-      "side_ratio": "1:1",
-      "crop_pad_position": 0.5,
-      "pad_feathering": 20,
-      "pixels": ["8", 0]
+      "images": ["8", 0]
     },
-    "class_type": "ImageResize",
+    "class_type": "PreviewImage",
     "_meta": {
-      "title": "Image Resize"
+      "title": "Preview Image"
     }
   },
-  "27": {
+  "28": {
     "inputs": {
-      "images": ["8", 0]
+      "mode": "rescale",
+      "supersample": "true",
+      "resampling": "lanczos",
+      "rescale_factor": 2,
+      "resize_width": 2048,
+      "resize_height": 2048,
+      "image": ["8", 0]
     },
-    "class_type": "PreviewImage",
+    "class_type": "Image Resize",
     "_meta": {
-      "title": "Preview Image"
+      "title": "Image Resize"
     }
   }
 }