Merge pull request #933 from osirigunso/fix/comfyui-populated-text

Fix ComfyUI prompt extraction for ImpactWildcardProcessor
2026-03-24 00:22:49 +08:00 · 2026-03-24 00:22:49 +08:00 · 5694044a09
parent 16330934f5 e74293806b
commit 5694044a09
1 changed files with 157 additions and 12 deletions
--- a/scripts/iib/tool.py
+++ b/scripts/iib/tool.py
@ -487,37 +487,148 @@ def is_img_created_by_comfyui(img: Image):
 def is_img_created_by_comfyui_with_webui_gen_info(img: Image):
    return is_img_created_by_comfyui(img) and img.info.get('parameters')

+
+
+def extract_comfyui_prompt_with_wildcard_support(data: Dict, KSampler_entry: Dict):
+    """
+    Enhanced prompt extraction for workflows using ImpactWildcardProcessor.
+
+    This function handles:
+    - populated_text over wildcard_text
+    - Recursive resolution of upstream prompt nodes
+    - Intermediate conditioning nodes such as FluxGuidance
+
+    Returns:
+        tuple of (positive_prompt, negative_prompt)
+    """
+
+    def get_node(node_id):
+        return data.get(str(node_id)) or data.get(node_id)
+
+    def normalize_text(value):
+        if not isinstance(value, str):
+            return None
+        return value.strip()
+
+    def extract_direct_text(node):
+        if not isinstance(node, dict):
+            return None, False
+
+        class_type = node.get("class_type", "")
+        inputs = node.get("inputs", {}) or {}
+
+        if class_type == "ImpactWildcardProcessor":
+            populated = normalize_text(inputs.get("populated_text"))
+            return (populated or ""), True
+
+        if "CLIPTextEncode" in class_type:
+            for key in ("text", "t5xxl"):
+                if key in inputs:
+                    value = inputs.get(key)
+                    if isinstance(value, str):
+                        return value.strip(), True
+                    if isinstance(value, list) and len(value) >= 1:
+                        return None, False
+                    return "", True
+
+        for key in ("text", "t5xxl", "prompt", "string", "value"):
+            if key in inputs and isinstance(inputs.get(key), str):
+                return inputs.get(key).strip(), True
+
+        return None, False
+
+    def resolve_text_from_ref(ref, visited=None):
+        if visited is None:
+            visited = set()
+
+        node_id = ref[0] if isinstance(ref, list) and len(ref) >= 1 else ref
+        node_key = str(node_id)
+        if not node_key or node_key in visited:
+            return ""
+        visited.add(node_key)
+
+        node = get_node(node_id)
+        if not isinstance(node, dict):
+            return ""
+
+        direct_text, is_terminal = extract_direct_text(node)
+        if direct_text is not None:
+            return direct_text
+        if is_terminal:
+            return ""
+
+        inputs = node.get("inputs", {}) or {}
+        class_type = node.get("class_type", "")
+
+        if class_type == "FluxGuidance":
+            conditioning = inputs.get("conditioning")
+            if isinstance(conditioning, list) and len(conditioning) >= 1:
+                return resolve_text_from_ref(conditioning, visited)
+            return ""
+
+        for key in ("text", "t5xxl", "conditioning", "positive", "negative", "prompt", "string", "value"):
+            value = inputs.get(key)
+            if isinstance(value, list) and len(value) >= 1:
+                resolved = resolve_text_from_ref(value, visited)
+                if resolved or resolved == "":
+                    return resolved
+
+        return ""
+
+    try:
+        positive_ref = KSampler_entry.get("positive")
+        negative_ref = KSampler_entry.get("negative")
+
+        positive_prompt = resolve_text_from_ref(positive_ref) if positive_ref else ""
+        negative_prompt = resolve_text_from_ref(negative_ref) if negative_ref else ""
+
+        return positive_prompt or "", negative_prompt or ""
+    except Exception as e:
+        print(e)
+        return "", ""
+
+
 def get_comfyui_exif_data(img: Image):
+    prompt = None
    if img.format == "PNG":
        prompt = img.info.get('prompt')
    elif img.format == "WEBP":
        exif = img.info.get("exif")
-        split = [x.decode("utf-8", errors="ignore") for x in exif.split(b"\x00")]
-        prompt_str = find(split, lambda x: x.lower().startswith("prompt:"))
-        if prompt_str:
-            prompt = prompt_str.split(":", 1)[1] if prompt_str else None
+        if exif:
+            split = [x.decode("utf-8", errors="ignore") for x in exif.split(b"\x00")]
+            prompt_str = find(split, lambda x: x.lower().startswith("prompt:"))
+            if prompt_str:
+                prompt = prompt_str.split(":", 1)[1] if prompt_str else None
    if not prompt:
        return {}
+
+    data: Dict[str, Any] = json.loads(prompt)
    meta_key = '3'
-    data: Dict[str, any] = json.loads(prompt)
    for i in data.keys():
        try:
            if data[i]["class_type"].startswith("KSampler"):
                meta_key = i
                break
-        except:
+        except Exception:
            pass
+
+    if meta_key not in data:
+        return {}
+
    meta = {}
    KSampler_entry = data[meta_key]["inputs"]
-    #print(KSampler_entry) # for testing

    # As a workaround to bypass parsing errors in the parser.
    # https://github.com/jiw0220/stable-diffusion-image-metadata/blob/00b8d42d4d1a536862bba0b07c332bdebb2a0ce5/src/index.ts#L130
    meta["Steps"] = KSampler_entry.get("steps", "Unknown")
-    meta["Sampler"] = KSampler_entry["sampler_name"]
-    meta["Model"] = data[KSampler_entry["model"][0]]["inputs"].get("ckpt_name")
+    meta["Sampler"] = KSampler_entry.get("sampler_name", "Unknown")
+    try:
+        meta["Model"] = data[KSampler_entry["model"][0]]["inputs"].get("ckpt_name")
+    except Exception:
+        meta["Model"] = None
    meta["Source Identifier"] = "ComfyUI"
-    def get_text_from_clip(idx: str) :
+
+    def get_text_from_clip(idx: str):
        try:
            inputs = data[idx]["inputs"]
            if "text" in inputs:
@ -526,13 +637,33 @@ def get_comfyui_exif_data(img: Image):
                text = inputs["t5xxl"]
            else:
                return ""
-            if isinstance(text, list): # type:CLIPTextEncode (NSP) mode:Wildcards
+            if isinstance(text, list):  # type:CLIPTextEncode (NSP) mode:Wildcards
                text = data[text[0]]["inputs"]["text"]
            return text.strip()
        except Exception as e:
            print(e)
            return ""

+    has_impact_wildcard = any(
+        node_data.get("class_type") == "ImpactWildcardProcessor"
+        for node_data in data.values()
+        if isinstance(node_data, dict)
+    )
+
+    # Detection Point 1: Check if workflow contains ImpactWildcardProcessor
+    # If yes, immediately use the enhanced extraction and return
+    if has_impact_wildcard:
+        pos_prompt, neg_prompt = extract_comfyui_prompt_with_wildcard_support(
+            data, KSampler_entry
+        )
+        pos_prompt_arr = unique_by(parse_prompt(pos_prompt)["pos_prompt"])
+        return {
+            "meta": meta,
+            "pos_prompt": pos_prompt_arr,
+            "pos_prompt_raw": pos_prompt,
+            "neg_prompt_raw": neg_prompt
+        }
+
    extract_all_prompts = os.getenv("IIB_COMFYUI_EXTRACT_ALL_PROMPTS", "false").lower() == "true"

    if extract_all_prompts:
@ -567,11 +698,25 @@ def get_comfyui_exif_data(img: Image):
        neg_prompt = get_text_from_clip(KSampler_entry["negative"][0])

    pos_prompt_arr = unique_by(parse_prompt(pos_prompt)["pos_prompt"])
+
+    # Detection Point 2: Fallback if no prompts were extracted
+    # If standard extraction failed, try the enhanced method
+    if has_impact_wildcard and (not pos_prompt_arr or not pos_prompt.strip()):
+        pos_prompt_fallback, neg_prompt_fallback = extract_comfyui_prompt_with_wildcard_support(
+            data, KSampler_entry
+        )
+        if pos_prompt_fallback:
+            pos_prompt = pos_prompt_fallback
+            pos_prompt_arr = unique_by(parse_prompt(pos_prompt_fallback)["pos_prompt"])
+
+        if neg_prompt_fallback:
+            neg_prompt = neg_prompt_fallback
+
    return {
        "meta": meta,
        "pos_prompt": pos_prompt_arr,
        "pos_prompt_raw": pos_prompt,
-        "neg_prompt_raw" : neg_prompt
+        "neg_prompt_raw": neg_prompt
    }

 def comfyui_exif_data_to_str(data):