Merge pull request #933 from osirigunso/fix/comfyui-populated-text
Fix ComfyUI prompt extraction for ImpactWildcardProcessorfix/non-standard-exif-support
commit
5694044a09
|
|
@ -487,37 +487,148 @@ def is_img_created_by_comfyui(img: Image):
|
|||
def is_img_created_by_comfyui_with_webui_gen_info(img: Image):
|
||||
return is_img_created_by_comfyui(img) and img.info.get('parameters')
|
||||
|
||||
|
||||
|
||||
def extract_comfyui_prompt_with_wildcard_support(data: Dict, KSampler_entry: Dict):
|
||||
"""
|
||||
Enhanced prompt extraction for workflows using ImpactWildcardProcessor.
|
||||
|
||||
This function handles:
|
||||
- populated_text over wildcard_text
|
||||
- Recursive resolution of upstream prompt nodes
|
||||
- Intermediate conditioning nodes such as FluxGuidance
|
||||
|
||||
Returns:
|
||||
tuple of (positive_prompt, negative_prompt)
|
||||
"""
|
||||
|
||||
def get_node(node_id):
|
||||
return data.get(str(node_id)) or data.get(node_id)
|
||||
|
||||
def normalize_text(value):
|
||||
if not isinstance(value, str):
|
||||
return None
|
||||
return value.strip()
|
||||
|
||||
def extract_direct_text(node):
|
||||
if not isinstance(node, dict):
|
||||
return None, False
|
||||
|
||||
class_type = node.get("class_type", "")
|
||||
inputs = node.get("inputs", {}) or {}
|
||||
|
||||
if class_type == "ImpactWildcardProcessor":
|
||||
populated = normalize_text(inputs.get("populated_text"))
|
||||
return (populated or ""), True
|
||||
|
||||
if "CLIPTextEncode" in class_type:
|
||||
for key in ("text", "t5xxl"):
|
||||
if key in inputs:
|
||||
value = inputs.get(key)
|
||||
if isinstance(value, str):
|
||||
return value.strip(), True
|
||||
if isinstance(value, list) and len(value) >= 1:
|
||||
return None, False
|
||||
return "", True
|
||||
|
||||
for key in ("text", "t5xxl", "prompt", "string", "value"):
|
||||
if key in inputs and isinstance(inputs.get(key), str):
|
||||
return inputs.get(key).strip(), True
|
||||
|
||||
return None, False
|
||||
|
||||
def resolve_text_from_ref(ref, visited=None):
|
||||
if visited is None:
|
||||
visited = set()
|
||||
|
||||
node_id = ref[0] if isinstance(ref, list) and len(ref) >= 1 else ref
|
||||
node_key = str(node_id)
|
||||
if not node_key or node_key in visited:
|
||||
return ""
|
||||
visited.add(node_key)
|
||||
|
||||
node = get_node(node_id)
|
||||
if not isinstance(node, dict):
|
||||
return ""
|
||||
|
||||
direct_text, is_terminal = extract_direct_text(node)
|
||||
if direct_text is not None:
|
||||
return direct_text
|
||||
if is_terminal:
|
||||
return ""
|
||||
|
||||
inputs = node.get("inputs", {}) or {}
|
||||
class_type = node.get("class_type", "")
|
||||
|
||||
if class_type == "FluxGuidance":
|
||||
conditioning = inputs.get("conditioning")
|
||||
if isinstance(conditioning, list) and len(conditioning) >= 1:
|
||||
return resolve_text_from_ref(conditioning, visited)
|
||||
return ""
|
||||
|
||||
for key in ("text", "t5xxl", "conditioning", "positive", "negative", "prompt", "string", "value"):
|
||||
value = inputs.get(key)
|
||||
if isinstance(value, list) and len(value) >= 1:
|
||||
resolved = resolve_text_from_ref(value, visited)
|
||||
if resolved or resolved == "":
|
||||
return resolved
|
||||
|
||||
return ""
|
||||
|
||||
try:
|
||||
positive_ref = KSampler_entry.get("positive")
|
||||
negative_ref = KSampler_entry.get("negative")
|
||||
|
||||
positive_prompt = resolve_text_from_ref(positive_ref) if positive_ref else ""
|
||||
negative_prompt = resolve_text_from_ref(negative_ref) if negative_ref else ""
|
||||
|
||||
return positive_prompt or "", negative_prompt or ""
|
||||
except Exception as e:
|
||||
print(e)
|
||||
return "", ""
|
||||
|
||||
|
||||
def get_comfyui_exif_data(img: Image):
|
||||
prompt = None
|
||||
if img.format == "PNG":
|
||||
prompt = img.info.get('prompt')
|
||||
elif img.format == "WEBP":
|
||||
exif = img.info.get("exif")
|
||||
split = [x.decode("utf-8", errors="ignore") for x in exif.split(b"\x00")]
|
||||
prompt_str = find(split, lambda x: x.lower().startswith("prompt:"))
|
||||
if prompt_str:
|
||||
prompt = prompt_str.split(":", 1)[1] if prompt_str else None
|
||||
if exif:
|
||||
split = [x.decode("utf-8", errors="ignore") for x in exif.split(b"\x00")]
|
||||
prompt_str = find(split, lambda x: x.lower().startswith("prompt:"))
|
||||
if prompt_str:
|
||||
prompt = prompt_str.split(":", 1)[1] if prompt_str else None
|
||||
if not prompt:
|
||||
return {}
|
||||
|
||||
data: Dict[str, Any] = json.loads(prompt)
|
||||
meta_key = '3'
|
||||
data: Dict[str, any] = json.loads(prompt)
|
||||
for i in data.keys():
|
||||
try:
|
||||
if data[i]["class_type"].startswith("KSampler"):
|
||||
meta_key = i
|
||||
break
|
||||
except:
|
||||
except Exception:
|
||||
pass
|
||||
|
||||
if meta_key not in data:
|
||||
return {}
|
||||
|
||||
meta = {}
|
||||
KSampler_entry = data[meta_key]["inputs"]
|
||||
#print(KSampler_entry) # for testing
|
||||
|
||||
# As a workaround to bypass parsing errors in the parser.
|
||||
# https://github.com/jiw0220/stable-diffusion-image-metadata/blob/00b8d42d4d1a536862bba0b07c332bdebb2a0ce5/src/index.ts#L130
|
||||
meta["Steps"] = KSampler_entry.get("steps", "Unknown")
|
||||
meta["Sampler"] = KSampler_entry["sampler_name"]
|
||||
meta["Model"] = data[KSampler_entry["model"][0]]["inputs"].get("ckpt_name")
|
||||
meta["Sampler"] = KSampler_entry.get("sampler_name", "Unknown")
|
||||
try:
|
||||
meta["Model"] = data[KSampler_entry["model"][0]]["inputs"].get("ckpt_name")
|
||||
except Exception:
|
||||
meta["Model"] = None
|
||||
meta["Source Identifier"] = "ComfyUI"
|
||||
def get_text_from_clip(idx: str) :
|
||||
|
||||
def get_text_from_clip(idx: str):
|
||||
try:
|
||||
inputs = data[idx]["inputs"]
|
||||
if "text" in inputs:
|
||||
|
|
@ -526,13 +637,33 @@ def get_comfyui_exif_data(img: Image):
|
|||
text = inputs["t5xxl"]
|
||||
else:
|
||||
return ""
|
||||
if isinstance(text, list): # type:CLIPTextEncode (NSP) mode:Wildcards
|
||||
if isinstance(text, list): # type:CLIPTextEncode (NSP) mode:Wildcards
|
||||
text = data[text[0]]["inputs"]["text"]
|
||||
return text.strip()
|
||||
except Exception as e:
|
||||
print(e)
|
||||
return ""
|
||||
|
||||
has_impact_wildcard = any(
|
||||
node_data.get("class_type") == "ImpactWildcardProcessor"
|
||||
for node_data in data.values()
|
||||
if isinstance(node_data, dict)
|
||||
)
|
||||
|
||||
# Detection Point 1: Check if workflow contains ImpactWildcardProcessor
|
||||
# If yes, immediately use the enhanced extraction and return
|
||||
if has_impact_wildcard:
|
||||
pos_prompt, neg_prompt = extract_comfyui_prompt_with_wildcard_support(
|
||||
data, KSampler_entry
|
||||
)
|
||||
pos_prompt_arr = unique_by(parse_prompt(pos_prompt)["pos_prompt"])
|
||||
return {
|
||||
"meta": meta,
|
||||
"pos_prompt": pos_prompt_arr,
|
||||
"pos_prompt_raw": pos_prompt,
|
||||
"neg_prompt_raw": neg_prompt
|
||||
}
|
||||
|
||||
extract_all_prompts = os.getenv("IIB_COMFYUI_EXTRACT_ALL_PROMPTS", "false").lower() == "true"
|
||||
|
||||
if extract_all_prompts:
|
||||
|
|
@ -567,11 +698,25 @@ def get_comfyui_exif_data(img: Image):
|
|||
neg_prompt = get_text_from_clip(KSampler_entry["negative"][0])
|
||||
|
||||
pos_prompt_arr = unique_by(parse_prompt(pos_prompt)["pos_prompt"])
|
||||
|
||||
# Detection Point 2: Fallback if no prompts were extracted
|
||||
# If standard extraction failed, try the enhanced method
|
||||
if has_impact_wildcard and (not pos_prompt_arr or not pos_prompt.strip()):
|
||||
pos_prompt_fallback, neg_prompt_fallback = extract_comfyui_prompt_with_wildcard_support(
|
||||
data, KSampler_entry
|
||||
)
|
||||
if pos_prompt_fallback:
|
||||
pos_prompt = pos_prompt_fallback
|
||||
pos_prompt_arr = unique_by(parse_prompt(pos_prompt_fallback)["pos_prompt"])
|
||||
|
||||
if neg_prompt_fallback:
|
||||
neg_prompt = neg_prompt_fallback
|
||||
|
||||
return {
|
||||
"meta": meta,
|
||||
"pos_prompt": pos_prompt_arr,
|
||||
"pos_prompt_raw": pos_prompt,
|
||||
"neg_prompt_raw" : neg_prompt
|
||||
"neg_prompt_raw": neg_prompt
|
||||
}
|
||||
|
||||
def comfyui_exif_data_to_str(data):
|
||||
|
|
|
|||
Loading…
Reference in New Issue