import io
import sys
import json
import time
import zlib
import base64
import pickle
import inspect
import traceback
import threading
import numpy as np

from datetime import datetime, timedelta
from enum import Enum
from PIL import Image, PngImagePlugin
from typing import Any, Callable, Union
from fastapi import FastAPI

from modules import progress, shared, script_callbacks
from modules.call_queue import queue_lock, wrap_gradio_call
from modules.txt2img import txt2img
from modules.img2img import img2img
from modules.api.api import Api, encode_pil_to_base64
from modules.api.models import (
    StableDiffusionTxt2ImgProcessingAPI,
    StableDiffusionImg2ImgProcessingAPI,
)

from scripts.db import TaskStatus, AppStateKey, Task, task_manager, state_manager
from scripts.helpers import log, detect_control_net, get_component_by_elem_id

# For each img2img ``mode`` value, the key paths (inside the named arguments)
# that hold image data. A one-element path is a top-level argument; a
# two-element path is ``[argument_name, key_inside_that_argument]``.
img2img_image_args_by_mode: dict[int, list[list[str]]] = {
    0: [["init_img"]],
    1: [["sketch"]],
    2: [["init_img_with_mask", "image"], ["init_img_with_mask", "mask"]],
    3: [["inpaint_color_sketch"], ["inpaint_color_sketch_orig"]],
    4: [["init_img_inpaint"], ["init_mask_inpaint"]],
}


class TaskRunner:
    """Queue txt2img/img2img tasks and execute them one at a time.

    Tasks are serialized to JSON, stored through ``task_manager`` and executed
    by a background thread started from ``execute_pending_tasks_threading``.
    Only one instance may exist at a time; it is published as
    ``TaskRunner.instance``.
    """

    # The single live runner, or None when none has been created yet.
    instance = None

    def __init__(self, UiControlNetUnit=None):
        """Create the runner and publish it as ``TaskRunner.instance``.

        Args:
            UiControlNetUnit: class used to recognise ControlNet units among
                the script arguments, or None to skip ControlNet handling.

        Raises:
            Exception: if a ``TaskRunner`` instance already exists.
        """
        # Check the singleton first so that a rejected construction does not
        # leave a dangling image-saved callback registered.
        if TaskRunner.instance is not None:
            raise Exception("TaskRunner instance already exists")

        self.UiControlNetUnit = UiControlNetUnit

        self.__total_pending_tasks: int = 0
        self.__current_thread: threading.Thread = None
        self.__api = Api(FastAPI(), queue_lock)

        # File names reported by the image-saved callback for the running task.
        self.__saved_images_path: list[str] = []
        script_callbacks.on_image_saved(self.__on_image_saved)

        self.script_callbacks = {
            "task_registered": [],
            "task_started": [],
            "task_finished": [],
            "task_cleared": [],
        }

        # Mark this to True when reload UI
        self.dispose = False

        TaskRunner.instance = self

    @property
    def current_task_id(self) -> Union[str, None]:
        """Value of ``progress.current_task``."""
        return progress.current_task

    @property
    def is_executing_task(self) -> bool:
        """True while the worker thread exists and is alive."""
        thread = self.__current_thread
        return thread is not None and thread.is_alive()

    @property
    def paused(self) -> bool:
        """True when the stored queue state equals ``"paused"``."""
        return state_manager.get_value(AppStateKey.QueueState) == "paused"

    def __serialize_image(self, image):
        """Turn an ndarray or PIL image into a JSON-friendly dict.

        The raw bytes are zlib-compressed and base64-encoded. Any other value
        (including None) is returned unchanged.
        """
        if isinstance(image, np.ndarray):
            encoded = base64.b64encode(zlib.compress(image.tobytes())).decode()
            return {
                "shape": image.shape,
                # Stored so non-uint8 arrays can be restored faithfully.
                "dtype": str(image.dtype),
                "data": encoded,
                "cls": "ndarray",
            }

        if isinstance(image, Image.Image):
            encoded = base64.b64encode(zlib.compress(image.tobytes())).decode()
            return {
                "size": image.size,
                "mode": image.mode,
                "data": encoded,
                "cls": "Image",
            }

        return image

    def __deserialize_image(self, image_str):
        """Inverse of ``__serialize_image``.

        Values that are not a dict carrying a truthy ``"cls"`` entry are
        returned unchanged.
        """
        if not (isinstance(image_str, dict) and image_str.get("cls", None)):
            return image_str

        raw = zlib.decompress(base64.b64decode(image_str["data"]))
        if image_str["cls"] == "ndarray":
            # Records written before the dtype was stored are read as uint8.
            dtype = np.dtype(image_str.get("dtype", "uint8"))
            return np.frombuffer(raw, dtype=dtype).reshape(tuple(image_str["shape"]))

        return Image.frombytes(image_str["mode"], tuple(image_str["size"]), raw)

    def __serialize_img2img_images(self, args: dict, image_args: list):
        """Serialize, in place, every image in ``args`` named by ``image_args``."""
        for keys in image_args:
            if len(keys) == 1:
                args[keys[0]] = self.__serialize_image(args.get(keys[0], None))
                continue

            container = args.get(keys[0], {})
            if container is None:
                # Nothing was supplied for this input; leave the None as is
                # instead of failing on ``None.get``.
                continue
            container[keys[1]] = self.__serialize_image(container.get(keys[1], None))
            args[keys[0]] = container

    def __deserialize_img2img_images(self, args: dict, image_args: list):
        """Deserialize, in place, every image in ``args`` named by ``image_args``."""
        for keys in image_args:
            if len(keys) == 1:
                args[keys[0]] = self.__deserialize_image(args.get(keys[0], None))
                continue

            container = args.get(keys[0], {})
            if container is None:
                # Mirrors the serializer: a missing input stays None.
                continue
            container[keys[1]] = self.__deserialize_image(
                container.get(keys[1], None)
            )
            args[keys[0]] = container

    def __serialize_controlnet_unit(self, unit) -> dict:
        """Return a JSON-friendly copy of a ControlNet unit's attributes.

        A new dict is built so the live unit object is never modified. The
        result carries ``"is_cnet": True`` so it can be recognised when the
        task is parsed again.
        """
        serialized = {}
        for key, value in vars(unit).items():
            if key == "image" and value is not None:
                serialized[key] = {
                    "image": self.__serialize_image(value["image"]),
                    "mask": self.__serialize_image(value["mask"]),
                }
            elif isinstance(value, Enum):
                serialized[key] = value.value
            else:
                serialized[key] = value
        serialized["is_cnet"] = True
        return serialized

    def __serialize_ui_task_args(self, is_img2img: bool, *args, checkpoint: str = None):
        """Serialize the positional arguments of a UI call to a JSON string.

        The leading arguments are matched by position to the parameter names
        of ``img2img`` / ``txt2img``; the remainder are treated as script
        arguments.
        """
        target = img2img if is_img2img else txt2img
        args_name = inspect.getfullargspec(target).args

        args = list(args)
        named_args = dict(zip(args_name, args[0 : len(args_name)]))
        script_args = args[len(args_name) :]

        if checkpoint:
            # Copy before appending so the caller's list is not modified.
            override_settings_texts = list(
                named_args.get("override_settings_texts") or []
            )
            override_settings_texts.append("Model hash: " + checkpoint)
            named_args["override_settings_texts"] = override_settings_texts

        # loop through named_args and serialize images
        if is_img2img:
            for mode, image_args in img2img_image_args_by_mode.items():
                if mode == named_args["mode"]:
                    self.__serialize_img2img_images(named_args, image_args)
                else:
                    # set None to unused image args to save space
                    for keys in image_args:
                        named_args[keys[0]] = None

        # loop through script_args and serialize controlnets
        if self.UiControlNetUnit is not None:
            for i, a in enumerate(script_args):
                if isinstance(a, self.UiControlNetUnit):
                    script_args[i] = self.__serialize_controlnet_unit(a)

        return json.dumps(
            {
                "args": named_args,
                "script_args": script_args,
                "checkpoint": checkpoint,
                "is_ui": True,
                "is_img2img": is_img2img,
            }
        )

    def __serialize_api_task_args(
        self, is_img2img: bool, script_args: list = None, **named_args
    ):
        """Serialize the keyword arguments of an API call to a JSON string.

        The checkpoint is read from
        ``named_args["override_settings"]["sd_model_checkpoint"]`` when present.
        """
        if script_args is None:
            script_args = []

        override_settings = named_args.get("override_settings", {})
        checkpoint = override_settings.get("sd_model_checkpoint", None)

        return json.dumps(
            {
                "args": named_args,
                "script_args": script_args,
                "checkpoint": checkpoint,
                "is_ui": False,
                "is_img2img": is_img2img,
            }
        )

    def __deserialize_ui_task_args(
        self, is_img2img: bool, named_args: dict, script_args: list
    ):
        """Restore, in place, the images serialized for a UI task."""
        # loop through image_args and deserialize images
        if is_img2img:
            for mode, image_args in img2img_image_args_by_mode.items():
                if mode == named_args["mode"]:
                    self.__deserialize_img2img_images(named_args, image_args)

        # loop through script_args and deserialize controlnets
        if self.UiControlNetUnit is not None:
            for arg in script_args:
                if not (isinstance(arg, dict) and arg.get("is_cnet", False)):
                    continue
                arg.pop("is_cnet")
                image = arg.get("image")
                if image is not None:
                    arg["image"] = {
                        "image": self.__deserialize_image(image["image"]),
                        "mask": self.__deserialize_image(image["mask"]),
                    }

    def parse_task_args(
        self, params: str, script_params: bytes, deserialization: bool = True
    ):
        """Parse a stored task back into call arguments.

        Args:
            params: JSON string produced by one of the serializers above.
            script_params: pickled script arguments, used only when ``params``
                has no ``"script_args"`` entry.
            deserialization: when True and the task came from the UI, image
                payloads are turned back into image objects.

        Returns:
            dict with keys ``args``, ``named_args``, ``script_args``,
            ``checkpoint`` and ``is_ui``.
        """
        parsed: dict[str, Any] = json.loads(params)

        is_ui = parsed.get("is_ui", True)
        is_img2img = parsed.get("is_img2img", None)
        checkpoint = parsed.get("checkpoint", None)
        named_args: dict[str, Any] = parsed["args"]

        if "script_args" in parsed:
            script_args: list[Any] = parsed["script_args"]
        else:
            # NOTE(review): pickle.loads executes arbitrary code if the stored
            # bytes are attacker-controlled. Presumably script_params only
            # ever comes from this application's own task store - confirm.
            script_args = pickle.loads(script_params)

        if is_ui and deserialization:
            self.__deserialize_ui_task_args(is_img2img, named_args, script_args)

        args = list(named_args.values()) + script_args

        return {
            "args": args,
            "named_args": named_args,
            "script_args": script_args,
            "checkpoint": checkpoint,
            "is_ui": is_ui,
        }

    def register_ui_task(
        self, task_id: str, is_img2img: bool, *args, checkpoint: str = None
    ):
        """Store a task submitted from the UI and notify listeners."""
        progress.add_task_to_queue(task_id)

        params = self.__serialize_ui_task_args(is_img2img, *args, checkpoint=checkpoint)

        task_type = "img2img" if is_img2img else "txt2img"
        task_manager.add_task(Task(id=task_id, type=task_type, params=params))

        self.__run_callbacks(
            "task_registered", task_id, is_img2img=is_img2img, is_ui=True, args=params
        )
        self.__total_pending_tasks += 1

    def register_api_task(self, task_id: str, is_img2img: bool, args: dict):
        """Store a task submitted through the API and notify listeners."""
        progress.add_task_to_queue(task_id)

        params = self.__serialize_api_task_args(is_img2img, **args)

        task_type = "img2img" if is_img2img else "txt2img"
        task_manager.add_task(Task(id=task_id, type=task_type, params=params))

        self.__run_callbacks(
            "task_registered", task_id, is_img2img=is_img2img, is_ui=False, args=params
        )
        self.__total_pending_tasks += 1

    def execute_task(self, task: Task, get_next_task: Callable):
        """Run ``task`` and then every task returned by ``get_next_task``.

        The loop waits (polling every 2 seconds) while ``progress.current_task``
        is set. It ends by calling ``sys.exit(0)`` when ``dispose`` is set or
        when ``get_next_task`` returns a falsy value.
        """
        while True:
            if self.dispose:
                sys.exit(0)

            if progress.current_task is not None:
                time.sleep(2)
                continue

            task_id = task.id
            is_img2img = task.type == "img2img"
            log.info(f"[AgentScheduler] Executing task {task_id}")

            task_args = self.parse_task_args(
                task.params,
                task.script_params,
            )
            task_meta = {"is_img2img": is_img2img, "is_ui": task_args["is_ui"]}

            self.__saved_images_path = []
            self.__run_callbacks("task_started", task_id, **task_meta)
            res = self.__execute_task(task_id, is_img2img, task_args)

            if not res or isinstance(res, Exception):
                task_manager.update_task(id=task_id, status=TaskStatus.FAILED)
                self.__run_callbacks(
                    "task_finished", task_id, status=TaskStatus.FAILED, **task_meta
                )
            else:
                res = json.loads(res)
                log.info(f"\n[AgentScheduler] Task {task.id} done")

                infotexts = []
                for line in res["infotexts"]:
                    infotexts.extend(line.split("\n"))
                # A result without infotexts must not crash the worker thread.
                if infotexts:
                    infotexts[0] = f"Prompt: {infotexts[0]}"
                log.info("\n".join(["** " + text for text in infotexts]))

                result = {
                    "images": self.__saved_images_path.copy(),
                    "infotexts": infotexts,
                }
                task_manager.update_task(
                    id=task_id,
                    status=TaskStatus.DONE,
                    result=json.dumps(result),
                )
                self.__run_callbacks(
                    "task_finished",
                    task_id,
                    status=TaskStatus.DONE,
                    result=result,
                    **task_meta,
                )

            self.__saved_images_path = []

            task = get_next_task()
            if not task:
                sys.exit(0)

    def execute_pending_tasks_threading(self):
        """Start a daemon thread that drains the pending queue.

        Does nothing when the queue is paused, when a worker thread is already
        alive, or when there is no pending task.
        """
        if self.paused:
            log.info("[AgentScheduler] Runner is paused")
            return

        if self.is_executing_task:
            log.info("[AgentScheduler] Runner already started")
            return

        pending_task = self.__get_pending_task()
        if pending_task:
            # Start the infinite loop in a separate thread
            self.__current_thread = threading.Thread(
                target=self.execute_task,
                args=(
                    pending_task,
                    self.__get_pending_task,
                ),
            )
            self.__current_thread.daemon = True
            self.__current_thread.start()

    def get_task_info(self, task: Task) -> list[Any]:
        """Return ``[id, type, named-args JSON, created-at string]`` for ``task``."""
        # Keep images in their serialized form: restored PIL/ndarray objects
        # cannot be passed to json.dumps below.
        task_args = self.parse_task_args(
            task.params,
            task.script_params,
            deserialization=False,
        )

        return [
            task.id,
            task.type,
            json.dumps(task_args["named_args"]),
            task.created_at.strftime("%Y-%m-%d %H:%M:%S"),
        ]

    def __execute_task(self, task_id: str, is_img2img: bool, task_args: dict):
        """Dispatch to the UI or API executor according to ``task_args["is_ui"]``."""
        if task_args["is_ui"]:
            return self.__execute_ui_task(task_id, is_img2img, *task_args["args"])

        return self.__execute_api_task(
            task_id,
            is_img2img,
            script_args=task_args["script_args"],
            **task_args["named_args"],
        )

    def __execute_ui_task(self, task_id: str, is_img2img: bool, *args):
        """Run a UI task while holding ``queue_lock``.

        Returns the second element of the wrapped call's result, or the
        exception that was raised.
        """
        func = wrap_gradio_call(img2img if is_img2img else txt2img, add_stats=True)

        with queue_lock:
            shared.state.begin()
            progress.start_task(task_id)

            res = None
            try:
                result = func(*args)
                res = result[1]
            except Exception as e:
                log.error(f"[AgentScheduler] Task {task_id} failed: {e}")
                log.error(traceback.format_exc())
                res = e
            finally:
                progress.finish_task(task_id)

            shared.state.end()

        return res

    def __execute_api_task(self, task_id: str, is_img2img: bool, **kwargs):
        """Run an API task.

        Returns the ``info`` attribute of the API response, or the exception
        that was raised.
        """
        progress.start_task(task_id)

        res = None
        try:
            result = (
                self.__api.img2imgapi(StableDiffusionImg2ImgProcessingAPI(**kwargs))
                if is_img2img
                else self.__api.text2imgapi(
                    StableDiffusionTxt2ImgProcessingAPI(**kwargs)
                )
            )
            res = result.info
        except Exception as e:
            log.error(f"[AgentScheduler] Task {task_id} failed: {e}")
            log.error(traceback.format_exc())
            res = e
        finally:
            progress.finish_task(task_id)

        return res

    def __get_pending_task(self):
        """Return the next pending task, or None when there is none.

        Also deletes tasks older than 7 days, refreshes the pending count and
        fires the ``task_cleared`` callbacks when that count is zero.
        """
        if self.dispose:
            return None

        # delete task that are 7 days old
        task_manager.delete_tasks_before(datetime.now() - timedelta(days=7))

        self.__total_pending_tasks = task_manager.count_tasks(status="pending")

        # get more task if needed
        if self.__total_pending_tasks > 0:
            log.info(
                f"[AgentScheduler] Total pending tasks: {self.__total_pending_tasks}"
            )
            pending_tasks = task_manager.get_tasks(status="pending", limit=1)
            if len(pending_tasks) > 0:
                return pending_tasks[0]
        else:
            log.info("[AgentScheduler] Task queue is empty")
            self.__run_callbacks("task_cleared")

        return None

    def __on_image_saved(self, data: script_callbacks.ImageSaveParams):
        """Record the file name of every image saved."""
        self.__saved_images_path.append(data.filename)

    def on_task_registered(self, callback: Callable):
        """Callback when a task is registered

        Callback signature: callback(task_id: str, is_img2img: bool, is_ui: bool, args: dict)
        """

        self.script_callbacks["task_registered"].append(callback)

    def on_task_started(self, callback: Callable):
        """Callback when a task is started

        Callback signature: callback(task_id: str, is_img2img: bool, is_ui: bool)
        """

        self.script_callbacks["task_started"].append(callback)

    def on_task_finished(self, callback: Callable):
        """Callback when a task is finished

        Callback signature: callback(task_id: str, is_img2img: bool, is_ui: bool, status: TaskStatus, result: dict)
        """

        self.script_callbacks["task_finished"].append(callback)

    def on_task_cleared(self, callback: Callable):
        """Callback when the pending queue is found empty

        Callback signature: callback()
        """
        self.script_callbacks["task_cleared"].append(callback)

    def __run_callbacks(self, name: str, *args, **kwargs):
        """Call every callback registered under ``name`` with the given arguments."""
        for callback in self.script_callbacks[name]:
            callback(*args, **kwargs)


def get_instance(block) -> TaskRunner:
    """Return the shared ``TaskRunner``, creating it on first use.

    On creation, a before-reload callback is registered that marks the runner
    as disposed and clears ``TaskRunner.instance`` so a new one is built later.
    """
    if TaskRunner.instance is None:
        txt2img_submit_button = get_component_by_elem_id(block, "txt2img_generate")
        UiControlNetUnit = detect_control_net(block, txt2img_submit_button)
        TaskRunner(UiControlNetUnit)

        def on_before_reload():
            # Tell old instance to stop
            if TaskRunner.instance is not None:
                TaskRunner.instance.dispose = True
            # force recreate the instance
            TaskRunner.instance = None

        script_callbacks.on_before_reload(on_before_reload)

    return TaskRunner.instance