# sd-webui-agent-scheduler/scripts/task_runner.py
# (file-viewer header: 499 lines, 17 KiB, Python)

import io
import sys
import json
import time
import zlib
import base64
import pickle
import inspect
import traceback
import threading
import numpy as np
from datetime import datetime, timedelta
from enum import Enum
from PIL import Image, PngImagePlugin
from typing import Any, Callable, Union
from fastapi import FastAPI
from modules import progress, shared, script_callbacks
from modules.call_queue import queue_lock, wrap_gradio_call
from modules.txt2img import txt2img
from modules.img2img import img2img
from modules.api.api import Api, encode_pil_to_base64
from modules.api.models import (
StableDiffusionTxt2ImgProcessingAPI,
StableDiffusionImg2ImgProcessingAPI,
)
from scripts.db import TaskStatus, AppStateKey, Task, task_manager, state_manager
from scripts.helpers import log, detect_control_net, get_component_by_elem_id
# Image-carrying img2img arguments, grouped by the value of the img2img
# ``mode`` argument (the keys below are compared against ``named_args["mode"]``).
#
# Each entry is a list of "key paths" into the named-argument dict:
#   * a one-element path ``[name]`` means the image is stored directly under
#     ``named_args[name]``;
#   * a two-element path ``[outer, inner]`` means ``named_args[outer]`` is a
#     dict and the image is stored under its ``inner`` key.
#
# When a UI task is serialized, only the paths of the active mode are encoded;
# for every other mode the first key of each path is reset to ``None`` so that
# unused images are not persisted.
# NOTE(review): the mode numbers presumably follow the img2img tab order of
# the web UI (img2img, sketch, inpaint, ...) - confirm against modules.img2img.
img2img_image_args_by_mode: dict[int, list[list[str]]] = {
0: [["init_img"]],
1: [["sketch"]],
2: [["init_img_with_mask", "image"], ["init_img_with_mask", "mask"]],
3: [["inpaint_color_sketch"], ["inpaint_color_sketch_orig"]],
4: [["init_img_inpaint"], ["init_mask_inpaint"]],
}
class TaskRunner:
instance = None
def __init__(self, UiControlNetUnit=None):
self.UiControlNetUnit = UiControlNetUnit
self.__total_pending_tasks: int = 0
self.__current_thread: threading.Thread = None
self.__api = Api(FastAPI(), queue_lock)
self.__saved_images_path: list[str] = []
script_callbacks.on_image_saved(self.__on_image_saved)
self.script_callbacks = {
"task_registered": [],
"task_started": [],
"task_finished": [],
"task_cleared": [],
}
# Mark this to True when reload UI
self.dispose = False
if TaskRunner.instance is not None:
raise Exception("TaskRunner instance already exists")
TaskRunner.instance = self
@property
def current_task_id(self) -> Union[str, None]:
return progress.current_task
@property
def is_executing_task(self) -> bool:
return self.__current_thread and self.__current_thread.is_alive()
@property
def paused(self) -> bool:
return state_manager.get_value(AppStateKey.QueueState) == "paused"
def __serialize_image(self, image):
if isinstance(image, np.ndarray):
shape = image.shape
data = base64.b64encode(zlib.compress(image.tobytes())).decode()
return {"shape": shape, "data": data, "cls": "ndarray"}
elif isinstance(image, Image.Image):
size = image.size
mode = image.mode
data = base64.b64encode(zlib.compress(image.tobytes())).decode()
return {
"size": size,
"mode": mode,
"data": data,
"cls": "Image",
}
else:
return image
def __deserialize_image(self, image_str):
if isinstance(image_str, dict) and image_str.get("cls", None):
cls = image_str["cls"]
data = zlib.decompress(base64.b64decode(image_str["data"]))
if cls == "ndarray":
shape = tuple(image_str["shape"])
image = np.frombuffer(data, dtype=np.uint8)
return image.reshape(shape)
else:
size = tuple(image_str["size"])
mode = image_str["mode"]
return Image.frombytes(mode, size, data)
else:
return image_str
def __serialize_img2img_images(self, args: dict, image_args: list):
for keys in image_args:
if len(keys) == 1:
image = args.get(keys[0], None)
args[keys[0]] = self.__serialize_image(image)
else:
value = args.get(keys[0], {})
image = value.get(keys[1], None)
value[keys[1]] = self.__serialize_image(image)
args[keys[0]] = value
def __deserialize_img2img_images(self, args: dict, image_args: list):
for keys in image_args:
if len(keys) == 1:
image = args.get(keys[0], None)
args[keys[0]] = self.__deserialize_image(image)
else:
value = args.get(keys[0], {})
image = value.get(keys[1], None)
value[keys[1]] = self.__deserialize_image(image)
args[keys[0]] = value
def __serialize_ui_task_args(self, is_img2img: bool, *args, checkpoint: str = None):
args_name = []
if is_img2img:
args_name = inspect.getfullargspec(img2img).args
else:
args_name = inspect.getfullargspec(txt2img).args
args = list(args)
named_args = dict(zip(args_name, args[0 : len(args_name)]))
script_args = args[len(args_name) :]
if checkpoint:
override_settings_texts = named_args.get("override_settings_texts", [])
override_settings_texts.append("Model hash: " + checkpoint)
named_args["override_settings_texts"] = override_settings_texts
# loop through named_args and serialize images
if is_img2img:
for mode, image_args in img2img_image_args_by_mode.items():
if mode == named_args["mode"]:
self.__serialize_img2img_images(named_args, image_args)
else:
# set None to unused image args to save space
for keys in image_args:
named_args[keys[0]] = None
# loop through script_args and serialize controlnets
if self.UiControlNetUnit is not None:
for i, a in enumerate(script_args):
if isinstance(a, self.UiControlNetUnit):
script_args[i] = a.__dict__
script_args[i]["is_cnet"] = True
for k, v in script_args[i].items():
if k == "image" and v is not None:
script_args[i][k] = {
"image": self.__serialize_image(v["image"]),
"mask": self.__serialize_image(v["mask"]),
}
if isinstance(v, Enum):
script_args[i][k] = v.value
return json.dumps(
{
"args": named_args,
"script_args": script_args,
"checkpoint": checkpoint,
"is_ui": True,
"is_img2img": is_img2img,
}
)
def __serialize_api_task_args(
self, is_img2img: bool, script_args: list = [], **named_args
):
override_settings = named_args.get("override_settings", {})
checkpoint = override_settings.get("sd_model_checkpoint", None)
return json.dumps(
{
"args": named_args,
"script_args": script_args,
"checkpoint": checkpoint,
"is_ui": False,
"is_img2img": is_img2img,
}
)
def __deserialize_ui_task_args(
self, is_img2img: bool, named_args: dict, script_args: list
):
# loop through image_args and deserialize images
if is_img2img:
for mode, image_args in img2img_image_args_by_mode.items():
if mode == named_args["mode"]:
self.__deserialize_img2img_images(named_args, image_args)
# loop through script_args and deserialize controlnets
if self.UiControlNetUnit is not None:
for i, arg in enumerate(script_args):
if isinstance(arg, dict) and arg.get("is_cnet", False):
arg.pop("is_cnet")
for k, v in arg.items():
if k == "image" and v is not None:
arg[k] = {
"image": self.__deserialize_image(v["image"]),
"mask": self.__deserialize_image(v["mask"]),
}
def parse_task_args(
self, params: str, script_params: bytes, deserialization: bool = True
):
parsed: dict[str, Any] = json.loads(params)
is_ui = parsed.get("is_ui", True)
is_img2img = parsed.get("is_img2img", None)
checkpoint = parsed.get("checkpoint", None)
named_args: dict[str, Any] = parsed["args"]
script_args: list[Any] = (
parsed["script_args"]
if "script_args" in parsed
else pickle.loads(script_params)
)
if is_ui and deserialization:
self.__deserialize_ui_task_args(is_img2img, named_args, script_args)
args = list(named_args.values()) + script_args
return {
"args": args,
"named_args": named_args,
"script_args": script_args,
"checkpoint": checkpoint,
"is_ui": is_ui,
}
def register_ui_task(
self, task_id: str, is_img2img: bool, *args, checkpoint: str = None
):
progress.add_task_to_queue(task_id)
params = self.__serialize_ui_task_args(is_img2img, *args, checkpoint=checkpoint)
task_type = "img2img" if is_img2img else "txt2img"
task_manager.add_task(Task(id=task_id, type=task_type, params=params))
self.__run_callbacks(
"task_registered", task_id, is_img2img=is_img2img, is_ui=True, args=params
)
self.__total_pending_tasks += 1
def register_api_task(self, task_id: str, is_img2img: bool, args: dict):
progress.add_task_to_queue(task_id)
params = self.__serialize_api_task_args(is_img2img, **args)
task_type = "img2img" if is_img2img else "txt2img"
task_manager.add_task(Task(id=task_id, type=task_type, params=params))
self.__run_callbacks(
"task_registered", task_id, is_img2img=is_img2img, is_ui=False, args=params
)
self.__total_pending_tasks += 1
def execute_task(self, task: Task, get_next_task: Callable):
while True:
if self.dispose:
sys.exit(0)
if progress.current_task is None:
task_id = task.id
is_img2img = task.type == "img2img"
log.info(f"[AgentScheduler] Executing task {task_id}")
task_args = self.parse_task_args(
task.params,
task.script_params,
)
task_meta = {"is_img2img": is_img2img, "is_ui": task_args["is_ui"]}
self.__saved_images_path = []
self.__run_callbacks("task_started", task_id, **task_meta)
res = self.__execute_task(task_id, is_img2img, task_args)
if not res or isinstance(res, Exception):
task_manager.update_task(id=task_id, status=TaskStatus.FAILED)
self.__run_callbacks(
"task_finished", task_id, status=TaskStatus.FAILED, **task_meta
)
else:
res = json.loads(res)
log.info(f"\n[AgentScheduler] Task {task.id} done")
infotexts = []
for line in res["infotexts"]:
infotexts.extend(line.split("\n"))
infotexts[0] = f"Prompt: {infotexts[0]}"
log.info("\n".join(["** " + text for text in infotexts]))
result = {
"images": self.__saved_images_path.copy(),
"infotexts": infotexts,
}
task_manager.update_task(
id=task_id,
status=TaskStatus.DONE,
result=json.dumps(result),
)
self.__run_callbacks(
"task_finished",
task_id,
status=TaskStatus.DONE,
result=result,
**task_meta,
)
self.__saved_images_path = []
else:
time.sleep(2)
continue
task = get_next_task()
if not task:
sys.exit(0)
def execute_pending_tasks_threading(self):
if self.paused:
log.info("[AgentScheduler] Runner is paused")
return
if self.is_executing_task:
log.info("[AgentScheduler] Runner already started")
return
pending_task = self.__get_pending_task()
if pending_task:
# Start the infinite loop in a separate thread
self.__current_thread = threading.Thread(
target=self.execute_task,
args=(
pending_task,
self.__get_pending_task,
),
)
self.__current_thread.daemon = True
self.__current_thread.start()
def get_task_info(self, task: Task) -> list[Any]:
task_args = self.parse_task_args(
task.params,
task.script_params,
)
return [
task.id,
task.type,
json.dumps(task_args["named_args"]),
task.created_at.strftime("%Y-%m-%d %H:%M:%S"),
]
def __execute_task(self, task_id: str, is_img2img: bool, task_args: dict):
if task_args["is_ui"]:
return self.__execute_ui_task(task_id, is_img2img, *task_args["args"])
else:
return self.__execute_api_task(
task_id,
is_img2img,
script_args=task_args["script_args"],
**task_args["named_args"],
)
def __execute_ui_task(self, task_id: str, is_img2img: bool, *args):
func = wrap_gradio_call(img2img if is_img2img else txt2img, add_stats=True)
with queue_lock:
shared.state.begin()
progress.start_task(task_id)
res = None
try:
result = func(*args)
res = result[1]
except Exception as e:
log.error(f"[AgentScheduler] Task {task_id} failed: {e}")
log.error(traceback.format_exc())
res = e
finally:
progress.finish_task(task_id)
shared.state.end()
return res
def __execute_api_task(self, task_id: str, is_img2img: bool, **kwargs):
progress.start_task(task_id)
res = None
try:
result = (
self.__api.img2imgapi(StableDiffusionImg2ImgProcessingAPI(**kwargs))
if is_img2img
else self.__api.text2imgapi(
StableDiffusionTxt2ImgProcessingAPI(**kwargs)
)
)
res = result.info
except Exception as e:
log.error(f"[AgentScheduler] Task {task_id} failed: {e}")
log.error(traceback.format_exc())
res = e
finally:
progress.finish_task(task_id)
return res
def __get_pending_task(self):
if self.dispose:
return None
# delete task that are 7 days old
task_manager.delete_tasks_before(datetime.now() - timedelta(days=7))
self.__total_pending_tasks = task_manager.count_tasks(status="pending")
# get more task if needed
if self.__total_pending_tasks > 0:
log.info(
f"[AgentScheduler] Total pending tasks: {self.__total_pending_tasks}"
)
pending_tasks = task_manager.get_tasks(status="pending", limit=1)
if len(pending_tasks) > 0:
return pending_tasks[0]
else:
log.info("[AgentScheduler] Task queue is empty")
self.__run_callbacks("task_cleared")
def __on_image_saved(self, data: script_callbacks.ImageSaveParams):
self.__saved_images_path.append(data.filename)
def on_task_registered(self, callback: Callable):
"""Callback when a task is registered
Callback signature: callback(task_id: str, is_img2img: bool, is_ui: bool, args: dict)
"""
self.script_callbacks["task_registered"].append(callback)
def on_task_started(self, callback: Callable):
"""Callback when a task is started
Callback signature: callback(task_id: str, is_img2img: bool, is_ui: bool)
"""
self.script_callbacks["task_started"].append(callback)
def on_task_finished(self, callback: Callable):
"""Callback when a task is finished
Callback signature: callback(task_id: str, is_img2img: bool, is_ui: bool, status: TaskStatus, result: dict)
"""
self.script_callbacks["task_finished"].append(callback)
def on_task_cleared(self, callback: Callable):
self.script_callbacks["task_cleared"].append(callback)
def __run_callbacks(self, name: str, *args, **kwargs):
for callback in self.script_callbacks[name]:
callback(*args, **kwargs)
def get_instance(block) -> TaskRunner:
    """Return the shared TaskRunner, creating it on first use.

    On creation the txt2img generate button is looked up in ``block`` and
    handed to ``detect_control_net`` to find the ControlNet unit class, and a
    before-reload hook is registered that disposes the runner and clears the
    singleton so that the next call builds a fresh one.
    """
    # Fast path: the singleton already exists.
    if TaskRunner.instance is not None:
        return TaskRunner.instance

    submit_button = get_component_by_elem_id(block, "txt2img_generate")
    # The constructor stores the new object in TaskRunner.instance itself.
    TaskRunner(detect_control_net(block, submit_button))

    def on_before_reload():
        # Tell old instance to stop
        TaskRunner.instance.dispose = True
        # force recreate the instance
        TaskRunner.instance = None

    script_callbacks.on_before_reload(on_before_reload)

    return TaskRunner.instance