modal-labs
diff --git a/‎06_gpu_and_ml/comfyui/comfyapp.py
Lines changed: 5 additions & 23 deletions b/‎06_gpu_and_ml/comfyui/comfyapp.py
Lines changed: 5 additions & 23 deletions
diff --git a/‎06_gpu_and_ml/comfyui/comfyui_menu.jpeg
-62.8 KB b/‎06_gpu_and_ml/comfyui/comfyui_menu.jpeg
-62.8 KB
diff --git a/‎06_gpu_and_ml/comfyui/flux_gen_image.jpeg
-250 KB b/‎06_gpu_and_ml/comfyui/flux_gen_image.jpeg
-250 KB
diff --git a/‎06_gpu_and_ml/comfyui/memory_snapshot/memory_snapshot_example.py
Lines changed: 91 additions & 0 deletions b/‎06_gpu_and_ml/comfyui/memory_snapshot/memory_snapshot_example.py
Lines changed: 91 additions & 0 deletions
diff --git a/‎06_gpu_and_ml/comfyui/memory_snapshot_helper/__init__.py renamed to ‎06_gpu_and_ml/comfyui/memory_snapshot/memory_snapshot_helper/__init__.py b/‎06_gpu_and_ml/comfyui/memory_snapshot_helper/__init__.py renamed to ‎06_gpu_and_ml/comfyui/memory_snapshot/memory_snapshot_helper/__init__.py
diff --git a/‎06_gpu_and_ml/comfyui/memory_snapshot_helper/prestartup_script.py renamed to ‎06_gpu_and_ml/comfyui/memory_snapshot/memory_snapshot_helper/prestartup_script.py b/‎06_gpu_and_ml/comfyui/memory_snapshot_helper/prestartup_script.py renamed to ‎06_gpu_and_ml/comfyui/memory_snapshot/memory_snapshot_helper/prestartup_script.py
@@ -23,7 +23,7 @@
 # python 06_gpu_and_ml/comfyui/comfyclient.py --modal-workspace $(modal profile current) --prompt "Surreal dreamscape with floating islands, upside-down waterfalls, and impossible geometric structures, all bathed in a soft, ethereal light"
 # ```
 
-# ![example comfyui image](./flux_gen_image.jpeg)
+# ![example comfyui image](https://modal-cdn.com/cdnbot/flux_gen_imagesenr_0w3_209b7170.webp)
 
 # The first inference will take ~1m since the container needs to launch the ComfyUI server and load Flux into memory. Successive calls on a warm container should take a few seconds.
 
@@ -64,12 +64,6 @@
     # Add .run_commands(...) calls for any other custom nodes you want to download
 )
 
-# We'll also add our own custom node that patches core ComfyUI so that we can use Modal's [memory snapshot](https://modal.com/docs/guide/memory-snapshot) feature to speed up cold starts (more on that on [running as an API](https://modal.com/docs/examples/comfyapp#running-comfyui-as-an-api)).
-image = image.add_local_dir(
-    local_path=Path(__file__).parent / "memory_snapshot_helper",
-    remote_path="/root/comfy/ComfyUI/custom_nodes/memory_snapshot_helper",
-    copy=True,
-)
 # See [this post](https://modal.com/blog/comfyui-custom-nodes) for more examples
 # on how to install popular custom nodes like ComfyUI Impact Pack and ComfyUI IPAdapter Plus.
 
@@ -164,29 +158,17 @@ def ui():
     scaledown_window=300,  # 5 minute container keep alive after it processes an input
     gpu="L40S",
     volumes={"/cache": vol},
-    enable_memory_snapshot=True,  # snapshot container state for faster cold starts
 )
 @modal.concurrent(max_inputs=5)  # run 5 inputs per container
 class ComfyUI:
     port: int = 8000
 
-    @modal.enter(snap=True)
+    @modal.enter()
     def launch_comfy_background(self):
+        # launch the ComfyUI server exactly once when the container starts
         cmd = f"comfy launch --background -- --port {self.port}"
         subprocess.run(cmd, shell=True, check=True)
 
-    @modal.enter(snap=False)
-    def restore_snapshot(self):
-        # initialize GPU for ComfyUI after snapshot restore
-        # note: requires patching core ComfyUI, see the memory_snapshot_helper directory for more details
-        import requests
-
-        response = requests.post(f"http://127.0.0.1:{self.port}/cuda/set_device")
-        if response.status_code != 200:
-            print("Failed to set CUDA device")
-        else:
-            print("Successfully set CUDA device")
-
     @modal.method()
     def infer(self, workflow_path: str = "/root/workflow_api.json"):
         # sometimes the ComfyUI server stops responding (we think because of memory leaks), so this makes sure it's still up
@@ -256,10 +238,10 @@ def poll_server_health(self) -> Dict:
 
 # This serves the `workflow_api.json` in this repo. When deploying your own workflows, make sure you select the "Export (API)" option in the ComfyUI menu:
 
-# ![comfyui menu](./comfyui_menu.jpeg)
+# ![comfyui menu](https://modal-cdn.com/cdnbot/comfyui_menugo5j8ahx_27d72c45.webp)
 
 # ## More resources
-# - [Alternative approach](https://modal.com/blog/comfyui-mem-snapshots) for deploying ComfyUI with memory snapshots
+# - Use [memory snapshots](https://modal.com/docs/guide/memory-snapshot) to speed up cold starts (check out the `memory_snapshot` directory on [GitHub](https://github.com/modal-labs/modal-examples/tree/main/06_gpu_and_ml/comfyui))
 # - Run a ComfyUI workflow as a [Python script](https://modal.com/blog/comfyui-prototype-to-production)
 
 # - When to use [A1111 vs ComfyUI](https://modal.com/blog/a1111-vs-comfyui)
 
@@ -0,0 +1,91 @@
+# Simple ComfyUI example using memory snapshot to speed up cold starts.
+
+# CAUTION: Some custom nodes may not work with memory snapshots, especially if they make calls to torch (i.e. require a GPU) on initialization.
+# Run `modal deploy memory_snapshot_example.py` to deploy with memory snapshot enabled.
+
+# Image building and model downloading are taken directly from the core example: https://modal.com/docs/examples/comfyapp
+# The notable changes are copying the custom node into the image and the snapshot-enabled class definition (`ComfyUIMemorySnapshot`)
+import subprocess
+from pathlib import Path
+
+import modal
+
+# Base image: Debian slim with Python 3.11 and git, plus pinned FastAPI and comfy-cli.
+# comfy-cli is then used to install ComfyUI 0.3.10 (with the `--nvidia` flag).
+image = (
+    modal.Image.debian_slim(python_version="3.11")
+    .apt_install("git")
+    .pip_install("fastapi[standard]==0.115.4")
+    .pip_install("comfy-cli==1.3.8")
+    .run_commands("comfy --skip-prompt install --fast-deps --nvidia --version 0.3.10")
+)
+
+# Add custom node that patches core ComfyUI so that we can use Modal's [memory snapshot](https://modal.com/docs/guide/memory-snapshot)
+# The `memory_snapshot_helper` directory is resolved relative to this file and placed in ComfyUI's `custom_nodes` directory.
+image = image.add_local_dir(
+    local_path=Path(__file__).parent / "memory_snapshot_helper",
+    remote_path="/root/comfy/ComfyUI/custom_nodes/memory_snapshot_helper",
+    copy=True,
+)
+
+
+# Download the Flux schnell fp8 checkpoint from the Hugging Face Hub into `/cache`
+# and symlink it into ComfyUI's checkpoints directory.
+# Raises `subprocess.CalledProcessError` if the `ln -s` command fails (`check=True`).
+def hf_download():
+    # imported inside the function, so the module itself does not need huggingface_hub at import time
+    from huggingface_hub import hf_hub_download
+
+    # `hf_hub_download` returns the path of the downloaded file, which is used as the symlink target below
+    flux_model = hf_hub_download(
+        repo_id="Comfy-Org/flux1-schnell",
+        filename="flux1-schnell-fp8.safetensors",
+        cache_dir="/cache",
+    )
+
+    # link the cached file to the location under ComfyUI's models/checkpoints directory
+    subprocess.run(
+        f"ln -s {flux_model} /root/comfy/ComfyUI/models/checkpoints/flux1-schnell-fp8.safetensors",
+        shell=True,
+        check=True,
+    )
+
+
+# Named Modal Volume ("hf-hub-cache") that backs the `/cache` download directory; created if it does not exist yet.
+vol = modal.Volume.from_name("hf-hub-cache", create_if_missing=True)
+
+# Extend the image: install huggingface_hub with the hf_transfer extra, set
+# HF_HUB_ENABLE_HF_TRANSFER=1, then run `hf_download` as an image build step
+# with the volume attached at `/cache`.
+image = (
+    image.pip_install("huggingface_hub[hf_transfer]==0.30.0")
+    .env({"HF_HUB_ENABLE_HF_TRANSFER": "1"})
+    .run_function(
+        hf_download,
+        volumes={"/cache": vol},
+    )
+)
+
+
+# The app is created with the image built above.
+app = modal.App(name="example-comfyui-memory-snapshot", image=image)
+
+
+# ComfyUI server class with memory snapshots enabled.
+# Lifecycle: `launch_comfy_background` runs in the snapshotted phase (`snap=True`),
+# `restore_snapshot` runs in the `snap=False` enter phase, and `ui` exposes the web server.
+@app.cls(
+    max_containers=1,
+    gpu="L40S",
+    volumes={"/cache": vol},
+    enable_memory_snapshot=True,  # snapshot container state for faster cold starts
+)
+@modal.concurrent(max_inputs=10)
+class ComfyUIMemorySnapshot:
+    # port used for the ComfyUI server, the restore request, and the web_server decorator below
+    port: int = 8000
+
+    # Snapshot ComfyUI server launch state, which includes import torch and custom node initialization (GPU not available during this step)
+    @modal.enter(snap=True)
+    def launch_comfy_background(self):
+        # `check=True` raises subprocess.CalledProcessError if the launch command exits non-zero
+        cmd = f"comfy launch --background -- --port {self.port}"
+        subprocess.run(cmd, shell=True, check=True)
+
+    # Restore ComfyUI server state. Re-enables the CUDA device for inference.
+    @modal.enter(snap=False)
+    def restore_snapshot(self):
+        import requests
+
+        # POST to the local server's `/cuda/set_device` route
+        # (presumably registered by the memory_snapshot_helper custom node — confirm)
+        response = requests.post(f"http://127.0.0.1:{self.port}/cuda/set_device")
+        # a non-200 response is only reported via print; no exception is raised here
+        if response.status_code != 200:
+            print("Failed to set CUDA device")
+        else:
+            print("Successfully set CUDA device")
+
+    # `port` here is the class attribute defined above (8000), evaluated in the class body
+    @modal.web_server(port, startup_timeout=60)
+    def ui(self):
+        # NOTE(review): `launch_comfy_background` already starts a ComfyUI server on this same port;
+        # confirm that this second launch (listening on 0.0.0.0) does not conflict with it.
+        subprocess.Popen(
+            f"comfy launch -- --listen 0.0.0.0 --port {self.port}", shell=True
+        )