comfyui nodes

mitchross · mitchross · commit fc6196dd8a56 · 2026-02-28T15:27:10.000-05:00
diff --git a/my-apps/ai/comfyui/configmap.yaml b/my-apps/ai/comfyui/configmap.yaml
@@ -72,6 +72,11 @@ data:
     # ── System Setup ───────────────────────────────────────────
     mkdir -p /usr/share/fonts/truetype
 
+    # ── Bridge Nodes (from ConfigMap) ─────────────────────────
+    echo "[INFO] Installing bridge nodes..."
+    cp /opt/custom-nodes/image_to_llamacpp_base64.py \
+       /root/ComfyUI/custom_nodes/image_to_llamacpp_base64.py
+
     # ── Example Workflows ──────────────────────────────────────
     DEST="/root/ComfyUI/user/default/workflows"
     mkdir -p "$DEST"
@@ -82,3 +87,74 @@ data:
     fi
 
     echo "[INFO] Pre-start setup complete."
+---
+apiVersion: v1
+kind: ConfigMap
+metadata:
+  name: comfyui-custom-nodes
+  namespace: comfyui
+data:
+  # Inline copy of custom-nodes/image_to_llamacpp_base64.py -- keep the two in sync.
+  # Mounted at /opt/custom-nodes and copied into ComfyUI by the pre-start script.
+  image_to_llamacpp_base64.py: |
+    """Bridge node: converts ComfyUI IMAGE tensor to base64 JSON for LlamaCppClient."""
+
+    import base64
+    import io
+    import json
+
+    import numpy as np
+    from PIL import Image
+
+
+    class ImageToLlamaCppBase64:
+        @classmethod
+        def INPUT_TYPES(cls):
+            return {
+                "required": {
+                    "image": ("IMAGE",),
+                },
+                "optional": {
+                    "prompt": (
+                        "STRING",
+                        {
+                            "default": "Describe this image in rich detail for use as an image generation prompt. "
+                            "Focus on subject, composition, lighting, colors, style, and mood. "
+                            "Output only the prompt text, no preamble.",
+                            "multiline": True,
+                        },
+                    ),
+                },
+            }
+
+        RETURN_TYPES = ("STRING", "STRING")
+        RETURN_NAMES = ("image_data", "user_message")
+        FUNCTION = "convert"
+        CATEGORY = "AI/LlamaCpp"
+
+        def convert(
+            self,
+            image,
+            prompt="Describe this image in rich detail for use as an image generation prompt. "
+            "Focus on subject, composition, lighting, colors, style, and mood. "
+            "Output only the prompt text, no preamble.",
+        ):
+            # IMAGE tensor shape: [batch, height, width, channels] float32 0-1
+            img_array = (image[0].cpu().numpy() * 255).astype(np.uint8)
+            pil_image = Image.fromarray(img_array)
+
+            buffer = io.BytesIO()
+            pil_image.save(buffer, format="PNG")
+            b64_str = base64.b64encode(buffer.getvalue()).decode("utf-8")
+
+            image_data = json.dumps([{"data": f"data:image/png;base64,{b64_str}", "id": 1}])
+            user_message = f"[img-1] {prompt}"
+
+            return (image_data, user_message)
+
+
+    # Node identifier -> implementing class. The key is the "class_type"
+    # value that workflow JSON files use to reference this node.
+    NODE_CLASS_MAPPINGS = {
+        "ImageToLlamaCppBase64": ImageToLlamaCppBase64,
+    }
+
+    # Node identifier -> human-readable display name.
+    NODE_DISPLAY_NAME_MAPPINGS = {
+        "ImageToLlamaCppBase64": "Image to LlamaCpp Base64",
+    }
diff --git a/my-apps/ai/comfyui/custom-nodes/image_to_llamacpp_base64.py b/my-apps/ai/comfyui/custom-nodes/image_to_llamacpp_base64.py
@@ -0,0 +1,63 @@
+"""Bridge node: converts ComfyUI IMAGE tensor to base64 JSON for LlamaCppClient."""
+
+import base64
+import io
+import json
+
+import numpy as np
+from PIL import Image
+
+
+class ImageToLlamaCppBase64:
+    @classmethod
+    def INPUT_TYPES(cls):
+        return {
+            "required": {
+                "image": ("IMAGE",),
+            },
+            "optional": {
+                "prompt": (
+                    "STRING",
+                    {
+                        "default": "Describe this image in rich detail for use as an image generation prompt. "
+                        "Focus on subject, composition, lighting, colors, style, and mood. "
+                        "Output only the prompt text, no preamble.",
+                        "multiline": True,
+                    },
+                ),
+            },
+        }
+
+    RETURN_TYPES = ("STRING", "STRING")
+    RETURN_NAMES = ("image_data", "user_message")
+    FUNCTION = "convert"
+    CATEGORY = "AI/LlamaCpp"
+
+    def convert(
+        self,
+        image,
+        prompt="Describe this image in rich detail for use as an image generation prompt. "
+        "Focus on subject, composition, lighting, colors, style, and mood. "
+        "Output only the prompt text, no preamble.",
+    ):
+        # IMAGE tensor shape: [batch, height, width, channels] float32 0-1
+        img_array = (image[0].cpu().numpy() * 255).astype(np.uint8)
+        pil_image = Image.fromarray(img_array)
+
+        buffer = io.BytesIO()
+        pil_image.save(buffer, format="PNG")
+        b64_str = base64.b64encode(buffer.getvalue()).decode("utf-8")
+
+        image_data = json.dumps([{"data": f"data:image/png;base64,{b64_str}", "id": 1}])
+        user_message = f"[img-1] {prompt}"
+
+        return (image_data, user_message)
+
+
+# Node identifier -> implementing class. The key is the "class_type"
+# value that workflow JSON files use to reference this node.
+NODE_CLASS_MAPPINGS = {
+    "ImageToLlamaCppBase64": ImageToLlamaCppBase64,
+}
+
+# Node identifier -> human-readable display name.
+NODE_DISPLAY_NAME_MAPPINGS = {
+    "ImageToLlamaCppBase64": "Image to LlamaCpp Base64",
+}
diff --git a/my-apps/ai/comfyui/deployment.yaml b/my-apps/ai/comfyui/deployment.yaml
@@ -77,6 +77,9 @@ spec:
         - name: manager-config
           mountPath: /root/ComfyUI/user/__manager/config.ini
           subPath: config.ini
+        - name: custom-nodes
+          mountPath: /opt/custom-nodes
+          readOnly: true
         readinessProbe:
           httpGet:
             path: /
@@ -104,3 +107,6 @@ spec:
         configMap:
           name: comfyui-pre-start
           defaultMode: 0755
+      - name: custom-nodes
+        configMap:
+          name: comfyui-custom-nodes
diff --git a/my-apps/ai/comfyui/workflows/llamacpp-vision-to-image.json b/my-apps/ai/comfyui/workflows/llamacpp-vision-to-image.json
@@ -0,0 +1,101 @@
+{
+  "1": {
+    "class_type": "LoadImage",
+    "inputs": {
+      "image": "example.png"
+    }
+  },
+  "2": {
+    "class_type": "ImageToLlamaCppBase64",
+    "inputs": {
+      "image": ["1", 0],
+      "prompt": "Describe this image in rich detail for use as an image generation prompt. Focus on subject, composition, lighting, colors, style, and mood. Output only the prompt text, no preamble."
+    }
+  },
+  "3": {
+    "class_type": "LlamaCppClient",
+    "inputs": {
+      "server_url": "http://llama-cpp-service.llama-cpp.svc.cluster.local:8080",
+      "endpoint": "chat_completions",
+      "prompt": "",
+      "system_message": "You are an expert image description assistant. When given an image, produce a detailed, vivid text-to-image prompt that would recreate a similar image. Include subject, setting, lighting, colors, composition, artistic style, and mood. Output ONLY the prompt text with no preamble, labels, or explanation.",
+      "user_message": ["2", 1],
+      "image_data": ["2", 0],
+      "temperature": 0.6,
+      "n_predict": 256,
+      "max_tokens": 256
+    }
+  },
+  "4": {
+    "class_type": "CLIPTextEncode",
+    "inputs": {
+      "text": ["3", 0],
+      "clip": ["6", 0]
+    }
+  },
+  "5": {
+    "class_type": "CLIPTextEncode",
+    "inputs": {
+      "text": "blurry, low quality, distorted, watermark, text, deformed",
+      "clip": ["6", 0]
+    }
+  },
+  "6": {
+    "class_type": "DualCLIPLoader",
+    "inputs": {
+      "clip_name1": "clip_l.safetensors",
+      "clip_name2": "t5xxl_fp8_e4m3fn.safetensors",
+      "type": "flux"
+    }
+  },
+  "7": {
+    "class_type": "UNETLoader",
+    "inputs": {
+      "unet_name": "z_image_turbo_bf16.safetensors",
+      "weight_dtype": "fp8_e4m3fn"
+    }
+  },
+  "8": {
+    "class_type": "VAELoader",
+    "inputs": {
+      "vae_name": "ae.safetensors"
+    }
+  },
+  "9": {
+    "class_type": "EmptyLatentImage",
+    "inputs": {
+      "width": 1024,
+      "height": 1024,
+      "batch_size": 1
+    }
+  },
+  "10": {
+    "class_type": "KSampler",
+    "inputs": {
+      "seed": 0,
+      "steps": 9,
+      "cfg": 1.0,
+      "sampler_name": "euler",
+      "scheduler": "normal",
+      "denoise": 1.0,
+      "model": ["7", 0],
+      "positive": ["4", 0],
+      "negative": ["5", 0],
+      "latent_image": ["9", 0]
+    }
+  },
+  "11": {
+    "class_type": "VAEDecode",
+    "inputs": {
+      "samples": ["10", 0],
+      "vae": ["8", 0]
+    }
+  },
+  "12": {
+    "class_type": "SaveImage",
+    "inputs": {
+      "filename_prefix": "vision-to-image",
+      "images": ["11", 0]
+    }
+  }
+}