Port SDForge's preprocessor structure (#2754)

* wip
* wip2
* wip3
* fix issues
* Add scribble xdog
* port legacy processors
* nit
* Add tests
* Fix modules test
* Add back normal_dsine
* Remove legacy code
* Remove code
* Add tests
* rename param
* Linter ignore
* fix is_image
* fix is_image
* nit
* nit
* Better assertion message
* Add back ip-adapter-auto
* Add test
* Fix various tag matching
* fix
* Add back preprocessor cache
* Add back sparse ctrl
* fix test failure
* Add log
2024-04-17 22:28:56 -04:00 · 2024-04-17 22:28:56 -04:00 · 442398bb9f
parent bbcae309d1
commit 442398bb9f
23 changed files with 2315 additions and 1129 deletions
--- a/annotator/normaldsine/__init__.py
+++ b/annotator/normaldsine/__init__.py
@ -9,7 +9,7 @@ from annotator.annotator_path import models_path
 import torchvision.transforms as transforms
 import dsine.utils.utils as utils
 from dsine.models.dsine import DSINE
-from scripts.processor import resize_image_with_pad
+from scripts.utils import resize_image_with_pad


 class NormalDsineDetector:
--- a/internal_controlnet/external_code.py
+++ b/internal_controlnet/external_code.py
@ -10,9 +10,9 @@ import numpy as np
 from modules import scripts, processing, shared
 from modules.safe import unsafe_torch_load
 from scripts import global_state
-from scripts.processor import preprocessor_sliders_config, model_free_preprocessors
 from scripts.logging import logger
 from scripts.enums import HiResFixOption
+from scripts.supported_preprocessor import Preprocessor, PreprocessorParameter

 from modules.api import api

@ -56,10 +56,10 @@ class ResizeMode(Enum):


 resize_mode_aliases = {
-    'Inner Fit (Scale to Fit)': 'Crop and Resize',
-    'Outer Fit (Shrink to Fit)': 'Resize and Fill',
-    'Scale to Fit (Inner Fit)': 'Crop and Resize',
-    'Envelope (Outer Fit)': 'Resize and Fill',
+    "Inner Fit (Scale to Fit)": "Crop and Resize",
+    "Outer Fit (Shrink to Fit)": "Resize and Fill",
+    "Scale to Fit (Inner Fit)": "Crop and Resize",
+    "Envelope (Outer Fit)": "Resize and Fill",
 }


@ -72,7 +72,9 @@ def resize_mode_from_value(value: Union[str, int, ResizeMode]) -> ResizeMode:
            return ResizeMode.RESIZE

        if value >= len(ResizeMode):
-            logger.warning(f'Unrecognized ResizeMode int value {value}. Fall back to RESIZE.')
+            logger.warning(
+                f"Unrecognized ResizeMode int value {value}. Fall back to RESIZE."
+            )
            return ResizeMode.RESIZE

        return [e for e in ResizeMode][value]
@ -100,10 +102,10 @@ def visualize_inpaint_mask(img):


 def pixel_perfect_resolution(
-        image: np.ndarray,
-        target_H: int,
-        target_W: int,
-        resize_mode: ResizeMode,
+    image: np.ndarray,
+    target_H: int,
+    target_W: int,
+    resize_mode: ResizeMode,
 ) -> int:
    """
    Calculate the estimated resolution for resizing an image while preserving aspect ratio.
@ -159,6 +161,7 @@ class ControlNetUnit:
    """
    Represents an entire ControlNet processing unit.
    """
+
    enabled: bool = True
    module: str = "none"
    model: str = "None"
@ -242,10 +245,13 @@ class ControlNetUnit:
    @property
    def uses_clip(self) -> bool:
        """Whether this unit uses clip preprocessor."""
-        return any((
-            ("ip-adapter" in self.module and "face_id" not in self.module),
-            self.module in ("clip_vision", "revision_clipvision", "revision_ignore_prompt"),
-        ))
+        return any(
+            (
+                ("ip-adapter" in self.module and "face_id" not in self.module),
+                self.module
+                in ("clip_vision", "revision_clipvision", "revision_ignore_prompt"),
+            )
+        )

    @property
    def is_inpaint(self) -> bool:
@ -257,18 +263,18 @@ class ControlNetUnit:
        Parameters 'processor_res', 'threshold_a', 'threshold_b' are reset to
        their default values if negative.
        """
-        cfg = preprocessor_sliders_config.get(global_state.get_module_basename(self.module), [])
-        defaults = {
-            param: cfg_default['value']
-            for param, cfg_default in zip(
-                ("processor_res", 'threshold_a', 'threshold_b'), cfg)
-            if cfg_default is not None
-        }
-        for param, default_value in defaults.items():
-            value = getattr(self, param)
+        preprocessor = Preprocessor.get_preprocessor(self.module)
+        for unit_param, param in zip(
+            ("processor_res", "threshold_a", "threshold_b"),
+            ("slider_resolution", "slider_1", "slider_2"),
+        ):
+            value = getattr(self, unit_param)
+            cfg: PreprocessorParameter = getattr(preprocessor, param)
            if value < 0:
-                setattr(self, param, default_value)
-                logger.info(f'[{self.module}.{param}] Invalid value({value}), using default value {default_value}.')
+                setattr(self, unit_param, cfg.value)
+                logger.info(
+                    f"[{self.module}.{unit_param}] Invalid value({value}), using default value {cfg.value}."
+                )


 def to_base64_nparray(encoding: str):
@ -276,10 +282,12 @@ def to_base64_nparray(encoding: str):
    Convert a base64 image into the image type the extension uses
    """

-    return np.array(api.decode_base64_to_image(encoding)).astype('uint8')
+    return np.array(api.decode_base64_to_image(encoding)).astype("uint8")


-def get_all_units_in_processing(p: processing.StableDiffusionProcessing) -> List[ControlNetUnit]:
+def get_all_units_in_processing(
+    p: processing.StableDiffusionProcessing,
+) -> List[ControlNetUnit]:
    """
    Fetch ControlNet processing units from a StableDiffusionProcessing.
    """
@ -287,7 +295,9 @@ def get_all_units_in_processing(p: processing.StableDiffusionProcessing) -> List
    return get_all_units(p.scripts, p.script_args)


-def get_all_units(script_runner: scripts.ScriptRunner, script_args: List[Any]) -> List[ControlNetUnit]:
+def get_all_units(
+    script_runner: scripts.ScriptRunner, script_args: List[Any]
+) -> List[ControlNetUnit]:
    """
    Fetch ControlNet processing units from an existing script runner.
    Use this function to fetch units from the list of all scripts arguments.
@ -295,7 +305,7 @@ def get_all_units(script_runner: scripts.ScriptRunner, script_args: List[Any]) -

    cn_script = find_cn_script(script_runner)
    if cn_script:
-        return get_all_units_from(script_args[cn_script.args_from:cn_script.args_to])
+        return get_all_units_from(script_args[cn_script.args_from : cn_script.args_to])

    return []

@ -307,23 +317,20 @@ def get_all_units_from(script_args: List[Any]) -> List[ControlNetUnit]:
    """

    def is_stale_unit(script_arg: Any) -> bool:
-        """ Returns whether the script_arg is potentially an stale version of
+        """Returns whether the script_arg is potentially an stale version of
        ControlNetUnit created before module reload."""
-        return (
-                'ControlNetUnit' in type(script_arg).__name__ and
-                not isinstance(script_arg, ControlNetUnit)
+        return "ControlNetUnit" in type(script_arg).__name__ and not isinstance(
+            script_arg, ControlNetUnit
        )

    def is_controlnet_unit(script_arg: Any) -> bool:
-        """ Returns whether the script_arg is ControlNetUnit or anything that
-        can be treated like ControlNetUnit. """
-        return (
-                isinstance(script_arg, (ControlNetUnit, dict)) or
-                (
-                        hasattr(script_arg, '__dict__') and
-                        set(vars(ControlNetUnit()).keys()).issubset(
-                            set(vars(script_arg).keys()))
-                )
+        """Returns whether the script_arg is ControlNetUnit or anything that
+        can be treated like ControlNetUnit."""
+        return isinstance(script_arg, (ControlNetUnit, dict)) or (
+            hasattr(script_arg, "__dict__")
+            and set(vars(ControlNetUnit()).keys()).issubset(
+                set(vars(script_arg).keys())
+            )
        )

    all_units = [
@ -334,7 +341,8 @@ def get_all_units_from(script_args: List[Any]) -> List[ControlNetUnit]:
    if not all_units:
        logger.warning(
            "No ControlNetUnit detected in args. It is very likely that you are having an extension conflict."
-            f"Here are args received by ControlNet: {script_args}.")
+            f"Here are args received by ControlNet: {script_args}."
+        )
    if any(is_stale_unit(script_arg) for script_arg in script_args):
        logger.debug(
            "Stale version of ControlNetUnit detected. The ControlNetUnit received"
@ -346,7 +354,9 @@ def get_all_units_from(script_args: List[Any]) -> List[ControlNetUnit]:
    return all_units


-def get_single_unit_from(script_args: List[Any], index: int = 0) -> Optional[ControlNetUnit]:
+def get_single_unit_from(
+    script_args: List[Any], index: int = 0
+) -> Optional[ControlNetUnit]:
    """
    Fetch a single ControlNet processing unit from ControlNet script arguments.
    The list must not contain script positional arguments. It must only contain processing units.
@ -379,10 +389,10 @@ def to_processing_unit(unit: Union[Dict[str, Any], ControlNetUnit]) -> ControlNe
    """

    ext_compat_keys = {
-        'guessmode': 'guess_mode',
-        'guidance': 'guidance_end',
-        'lowvram': 'low_vram',
-        'input_image': 'image'
+        "guessmode": "guess_mode",
+        "guidance": "guidance_end",
+        "lowvram": "low_vram",
+        "input_image": "image",
    }

    if isinstance(unit, dict):
@ -390,20 +400,24 @@ def to_processing_unit(unit: Union[Dict[str, Any], ControlNetUnit]) -> ControlNe

        # Handle mask
        mask = None
-        if 'mask' in unit:
-            mask = unit['mask']
-            del unit['mask']
+        if "mask" in unit:
+            mask = unit["mask"]
+            del unit["mask"]

        if "mask_image" in unit:
            mask = unit["mask_image"]
            del unit["mask_image"]

-        if 'image' in unit and not isinstance(unit['image'], dict):
-            unit['image'] = {'image': unit['image'], 'mask': mask} if mask is not None else unit['image'] if unit[
-                'image'] else None
+        if "image" in unit and not isinstance(unit["image"], dict):
+            unit["image"] = (
+                {"image": unit["image"], "mask": mask}
+                if mask is not None
+                else unit["image"] if unit["image"] else None
+            )

        # Parse ipadapter_input
        if "ipadapter_input" in unit:
+
            def decode_base64(b: str) -> torch.Tensor:
                decoded_bytes = base64.b64decode(b)
                return unsafe_torch_load(io.BytesIO(decoded_bytes))
@ -411,12 +425,18 @@ def to_processing_unit(unit: Union[Dict[str, Any], ControlNetUnit]) -> ControlNe
            if isinstance(unit["ipadapter_input"], str):
                unit["ipadapter_input"] = [unit["ipadapter_input"]]

-            unit["ipadapter_input"] = [decode_base64(b) for b in unit["ipadapter_input"]]
+            unit["ipadapter_input"] = [
+                decode_base64(b) for b in unit["ipadapter_input"]
+            ]

-        if 'guess_mode' in unit:
-            logger.warning('Guess Mode is removed since 1.1.136. Please use Control Mode instead.')
+        if "guess_mode" in unit:
+            logger.warning(
+                "Guess Mode is removed since 1.1.136. Please use Control Mode instead."
+            )

-        unit = ControlNetUnit(**{k: v for k, v in unit.items() if k in vars(ControlNetUnit).keys()})
+        unit = ControlNetUnit(
+            **{k: v for k, v in unit.items() if k in vars(ControlNetUnit).keys()}
+        )

    # temporary, check #602
    # assert isinstance(unit, ControlNetUnit), f'bad argument to controlnet extension: {unit}\nexpected Union[dict[str, Any], ControlNetUnit]'
@ -424,9 +444,9 @@ def to_processing_unit(unit: Union[Dict[str, Any], ControlNetUnit]) -> ControlNe


 def update_cn_script_in_processing(
-        p: processing.StableDiffusionProcessing,
-        cn_units: List[ControlNetUnit],
-        **_kwargs,  # for backwards compatibility
+    p: processing.StableDiffusionProcessing,
+    cn_units: List[ControlNetUnit],
+    **_kwargs,  # for backwards compatibility
 ):
    """
    Update the arguments of the ControlNet script in `p.script_args` in place, reading from `cn_units`.
@ -464,13 +484,17 @@ def update_cn_script(

    # fill in remaining parameters to satisfy max models, just in case script needs it.
    max_models = shared.opts.data.get("control_net_unit_count", 3)
-    cn_units = cn_units + [ControlNetUnit(enabled=False)] * max(max_models - len(cn_units), 0)
+    cn_units = cn_units + [ControlNetUnit(enabled=False)] * max(
+        max_models - len(cn_units), 0
+    )

    cn_script_args_diff = 0
    for script in script_runner.alwayson_scripts:
        if script is cn_script:
-            cn_script_args_diff = len(cn_units) - (cn_script.args_to - cn_script.args_from)
-            updated_script_args[script.args_from:script.args_to] = cn_units
+            cn_script_args_diff = len(cn_units) - (
+                cn_script.args_to - cn_script.args_from
+            )
+            updated_script_args[script.args_from : script.args_to] = cn_units
            script.args_to = script.args_from + len(cn_units)
        else:
            script.args_from += cn_script_args_diff
@ -480,10 +504,10 @@ def update_cn_script(


 def update_cn_script_in_place(
-        script_runner: scripts.ScriptRunner,
-        script_args: List[Any],
-        cn_units: List[ControlNetUnit],
-        **_kwargs,  # for backwards compatibility
+    script_runner: scripts.ScriptRunner,
+    script_args: List[Any],
+    cn_units: List[ControlNetUnit],
+    **_kwargs,  # for backwards compatibility
 ):
    """
    @Deprecated(Raises assertion error if script_args passed in is Tuple)
@ -503,13 +527,17 @@ def update_cn_script_in_place(

    # fill in remaining parameters to satisfy max models, just in case script needs it.
    max_models = shared.opts.data.get("control_net_unit_count", 3)
-    cn_units = cn_units + [ControlNetUnit(enabled=False)] * max(max_models - len(cn_units), 0)
+    cn_units = cn_units + [ControlNetUnit(enabled=False)] * max(
+        max_models - len(cn_units), 0
+    )

    cn_script_args_diff = 0
    for script in script_runner.alwayson_scripts:
        if script is cn_script:
-            cn_script_args_diff = len(cn_units) - (cn_script.args_to - cn_script.args_from)
-            script_args[script.args_from:script.args_to] = cn_units
+            cn_script_args_diff = len(cn_units) - (
+                cn_script.args_to - cn_script.args_from
+            )
+            script_args[script.args_from : script.args_to] = cn_units
            script.args_to = script.args_from + len(cn_units)
        else:
            script.args_from += cn_script_args_diff
@ -539,13 +567,10 @@ def get_modules(alias_names: bool = False) -> List[str]:
    Keyword arguments:
    alias_names -- Whether to get the ui alias names instead of internal keys
    """
-
-    modules = list(global_state.cn_preprocessor_modules.keys())
-
-    if alias_names:
-        modules = [global_state.preprocessor_aliases.get(module, module) for module in modules]
-
-    return modules
+    return [
+        (p.label if alias_names else p.name)
+        for p in Preprocessor.get_sorted_preprocessors()
+    ]


 def get_modules_detail(alias_names: bool = False) -> Dict[str, Any]:
@ -562,17 +587,22 @@ def get_modules_detail(alias_names: bool = False) -> Dict[str, Any]:
    _module_list_alias = get_modules(True)

    _output_list = _module_list if not alias_names else _module_list_alias
-    for index, module in enumerate(_output_list):
-        if _module_list[index] in preprocessor_sliders_config:
-            _module_detail[module] = {
-                "model_free": module in model_free_preprocessors,
-                "sliders": preprocessor_sliders_config[_module_list[index]]
-            }
-        else:
-            _module_detail[module] = {
-                "model_free": False,
-                "sliders": []
-            }
+    for module_name in _output_list:
+        preprocessor = Preprocessor.get_preprocessor(module_name)
+        assert preprocessor is not None
+        _module_detail[module_name] = dict(
+            model_free=preprocessor.do_not_need_model,
+            sliders=[
+                s.api_json
+                for s in (
+                    preprocessor.slider_resolution,
+                    preprocessor.slider_1,
+                    preprocessor.slider_2,
+                    preprocessor.slider_3,
+                )
+                if s.visible
+            ],
+        )

    return _module_detail

@ -595,4 +625,4 @@ def is_cn_script(script: scripts.Script) -> bool:
    Determine whether `script` is a ControlNet script.
    """

-    return script.title().lower() == 'controlnet'
+    return script.title().lower() == "controlnet"
--- a/pyproject.toml
+++ b/pyproject.toml
@ -8,8 +8,9 @@ exclude = [
  "web_tests",
  "example",
  "extract_controlnet_diff.py",
-  "scripts/global_state.py",
  "scripts/movie2movie.py",
+	"scripts/preprocessor/legacy/preprocessor_compiled.py",
+	"scripts/preprocessor/__init__.py",
 ]

 ignore = [
--- a/scripts/api.py
+++ b/scripts/api.py
@ -15,9 +15,9 @@ from modules.api.models import *  # noqa:F403
 from modules.api import api

 from scripts import external_code, global_state
-from scripts.processor import preprocessor_filters
 from scripts.logging import logger
 from scripts.external_code import ControlNetUnit
+from scripts.supported_preprocessor import Preprocessor
 from annotator.openpose import draw_poses, decode_json_as_poses
 from annotator.openpose.animalpose import draw_animalposes

@ -87,7 +87,7 @@ def controlnet_api(_: gr.Blocks, app: FastAPI):
                control_type: format_control_type(
                    *global_state.select_control_type(control_type)
                )
-                for control_type in preprocessor_filters.keys()
+                for control_type in Preprocessor.get_all_preprocessor_tags()
            }
        }

@ -96,10 +96,6 @@ def controlnet_api(_: gr.Blocks, app: FastAPI):
        max_models_num = external_code.get_max_models_num()
        return {"control_net_unit_count": max_models_num}

-    cached_cn_preprocessors = global_state.cache_preprocessors(
-        global_state.cn_preprocessor_modules
-    )
-
    @app.post("/controlnet/detect")
    async def detect(
        controlnet_module: str = Body("none", title="Controlnet Module"),
@ -111,14 +107,17 @@ def controlnet_api(_: gr.Blocks, app: FastAPI):
        controlnet_threshold_b: float = Body(-1, title="Controlnet Threshold b"),
        low_vram: bool = Body(False, title="Low vram"),
    ):
-        controlnet_module = global_state.reverse_preprocessor_aliases.get(
-            controlnet_module, controlnet_module
-        )
+        preprocessor = Preprocessor.get_preprocessor(controlnet_module)

-        if controlnet_module not in cached_cn_preprocessors:
+        if preprocessor is None:
            raise HTTPException(status_code=422, detail="Module not available")

-        if controlnet_module in ("clip_vision", "revision_clipvision", "revision_ignore_prompt"):
+        if controlnet_module in (
+            "clip_vision",
+            "revision_clipvision",
+            "revision_ignore_prompt",
+            "ip-adapter-auto",
+        ):
            raise HTTPException(status_code=422, detail="Module not supported")

        if len(controlnet_input_images) == 0:
@ -129,7 +128,7 @@ def controlnet_api(_: gr.Blocks, app: FastAPI):
        )

        unit = ControlNetUnit(
-            module=controlnet_module,
+            module=preprocessor.label,
            processor_res=controlnet_processor_res,
            threshold_a=controlnet_threshold_a,
            threshold_b=controlnet_threshold_b,
@ -139,8 +138,6 @@ def controlnet_api(_: gr.Blocks, app: FastAPI):
        results = []
        poses = []

-        processor_module = cached_cn_preprocessors[controlnet_module]
-
        for input_image in controlnet_input_images:
            img = external_code.to_base64_nparray(input_image)

@ -152,11 +149,11 @@ def controlnet_api(_: gr.Blocks, app: FastAPI):
                    self.value = json_dict

            json_acceptor = JsonAcceptor()
-            detected_map, is_image = processor_module(
+            detected_map = preprocessor.cached_call(
                img,
-                res=unit.processor_res,
-                thr_a=unit.threshold_a,
-                thr_b=unit.threshold_b,
+                resolution=unit.processor_res,
+                slider_1=unit.threshold_a,
+                slider_2=unit.threshold_b,
                json_pose_callback=json_acceptor.accept,
                low_vram=low_vram,
            )
@ -166,9 +163,8 @@ def controlnet_api(_: gr.Blocks, app: FastAPI):
                assert json_acceptor.value is not None
                poses.append(json_acceptor.value)

-        global_state.cn_preprocessor_unloadable.get(controlnet_module, lambda: None)()
        res = {"info": "Success"}
-        if is_image:
+        if preprocessor.returns_image:
            res["images"] = [encode_to_base64(r) for r in results]
            if poses:
                res["poses"] = poses
@ -176,7 +172,6 @@ def controlnet_api(_: gr.Blocks, app: FastAPI):
            res["tensor"] = [encode_tensor_to_base64(r) for r in results]
        return res

-
    class Person(BaseModel):
        pose_keypoints_2d: List[float]
        hand_right_keypoints_2d: Optional[List[float]]
--- a/scripts/controlnet.py
+++ b/scripts/controlnet.py
@ -12,18 +12,21 @@ import gradio as gr
 import time

 from einops import rearrange
+
+# Register all preprocessors.
+import scripts.preprocessor as preprocessor_init  # noqa
+from annotator.util import HWC3
 from scripts import global_state, hook, external_code, batch_hijack, controlnet_version, utils
 from scripts.controlnet_lora import bind_control_lora, unbind_control_lora
-from scripts.processor import HWC3
 from scripts.controlnet_lllite import clear_all_lllite
 from scripts.ipadapter.plugable_ipadapter import ImageEmbed, clear_all_ip_adapter
-from scripts.ipadapter.presets import IPAdapterPreset
 from scripts.utils import load_state_dict, get_unique_axis0, align_dim_latent
 from scripts.hook import ControlParams, UnetHook, HackedImageRNG
 from scripts.enums import ControlModelType, StableDiffusionVersion, HiResFixOption
 from scripts.controlnet_ui.controlnet_ui_group import ControlNetUiGroup, UiControlNetUnit
 from scripts.controlnet_ui.photopea import Photopea
 from scripts.logging import logger
+from scripts.supported_preprocessor import Preprocessor
 from scripts.animate_diff.batch import add_animate_diff_batch_input
 from modules.processing import StableDiffusionProcessingImg2Img, StableDiffusionProcessingTxt2Img, StableDiffusionProcessing
 from modules.images import save_image
@ -35,7 +38,6 @@ import torch

 from PIL import Image, ImageFilter, ImageOps
 from scripts.lvminthin import lvmin_thin, nake_nms
-from scripts.processor import model_free_preprocessors
 from scripts.controlnet_model_guess import build_model_by_guess, ControlModel
 from scripts.hook import torch_dfs

@ -220,7 +222,7 @@ def get_control(
    unit: external_code.ControlNetUnit,
    idx: int,
    control_model_type: ControlModelType,
-    preprocessor,
+    preprocessor: Preprocessor,
 ):
    """Get input for a ControlNet unit."""
    if unit.is_animate_diff_batch:
@ -264,16 +266,18 @@ def get_control(

    def preprocess_input_image(input_image: np.ndarray):
        """ Preprocess single input image. """
-        detected_map, is_image = preprocessor(
+        detected_map = preprocessor.cached_call(
            input_image,
-            res=unit.processor_res,
-            thr_a=unit.threshold_a,
-            thr_b=unit.threshold_b,
+            resolution=unit.processor_res,
+            slider_1=unit.threshold_a,
+            slider_2=unit.threshold_b,
            low_vram=(
                ("clip" in unit.module or unit.module == "ip-adapter_face_id_plus") and
                shared.opts.data.get("controlnet_clip_detector_on_cpu", False)
            ),
+            model=unit.model,
        )
+        is_image = preprocessor.returns_image
        if high_res_fix:
            if is_image:
                hr_control, hr_detected_map = Script.detectmap_proc(detected_map, unit.module, resize_mode, hr_y, hr_x)
@ -320,8 +324,6 @@ class Script(scripts.Script, metaclass=(
    def __init__(self) -> None:
        super().__init__()
        self.latest_network = None
-        self.preprocessor = global_state.cache_preprocessors(global_state.cn_preprocessor_modules)
-        self.unloadable = global_state.cn_preprocessor_unloadable
        self.input_image = None
        self.latest_model_hash = ""
        self.enabled_units: List[external_code.ControlNetUnit] = []
@ -353,7 +355,6 @@ class Script(scripts.Script, metaclass=(
        group = ControlNetUiGroup(
            is_img2img,
            Script.get_default_ui_unit(),
-            self.preprocessor,
            photopea,
        )
        return group, group.render(tabname, elem_id_tabname)
@ -664,11 +665,6 @@ class Script(scripts.Script, metaclass=(
            if not local_unit.enabled:
                continue

-            # Consolidate meta preprocessors.
-            if local_unit.module == "ip-adapter-auto":
-                local_unit.module = IPAdapterPreset.match_model(local_unit.model).module
-                logger.info(f"ip-adapter-auto => {local_unit.module}")
-
            if hasattr(local_unit, "unfold_merged"):
                enabled_units.extend(local_unit.unfold_merged())
            else:
@ -938,15 +934,6 @@ class Script(scripts.Script, metaclass=(
        if self.latest_model_hash != p.sd_model.sd_model_hash:
            Script.clear_control_model_cache()

-        for idx, unit in enumerate(self.enabled_units):
-            unit.module = global_state.get_module_basename(unit.module)
-
-        # unload unused preproc
-        module_list = [unit.module for unit in self.enabled_units]
-        for key in self.unloadable:
-            if key not in module_list:
-                self.unloadable.get(key, lambda:None)()
-
        self.latest_model_hash = p.sd_model.sd_model_hash
        high_res_fix = isinstance(p, StableDiffusionProcessingTxt2Img) and getattr(p, 'enable_hr', False)

@ -961,7 +948,10 @@ class Script(scripts.Script, metaclass=(
                logger.warning('A1111 inpaint and ControlNet inpaint duplicated. Falls back to inpaint_global_harmonious.')
                unit.module = 'inpaint'

-            if unit.module in model_free_preprocessors:
+            preprocessor = Preprocessor.get_preprocessor(unit.module)
+            assert preprocessor is not None
+
+            if preprocessor.do_not_need_model:
                model_net = None
                if 'reference' in unit.module:
                    control_model_type = ControlModelType.AttentionInjection
@ -990,7 +980,7 @@ class Script(scripts.Script, metaclass=(
                hr_controls = unit.ipadapter_input
            else:
                controls, hr_controls, additional_maps = get_control(
-                    p, unit, idx, control_model_type, self.preprocessor[unit.module])
+                    p, unit, idx, control_model_type, preprocessor)
                detected_maps.extend(additional_maps)

            if len(controls) == len(hr_controls) == 1 and control_model_type not in [ControlModelType.SparseCtrl]:
--- a/scripts/controlnet_ui/controlnet_ui_group.py
+++ b/scripts/controlnet_ui/controlnet_ui_group.py
@ -2,23 +2,17 @@ import json
 import gradio as gr
 import functools
 from copy import copy
-from typing import List, Optional, Union, Callable, Dict, Tuple, Literal
+from typing import List, Optional, Union, Dict, Tuple, Literal
 from dataclasses import dataclass
 import numpy as np

+from scripts.supported_preprocessor import Preprocessor
 from scripts.utils import svg_preprocess, read_image
 from scripts import (
    global_state,
    external_code,
 )
-from scripts.processor import (
-    preprocessor_sliders_config,
-    no_control_mode_preprocessors,
-    flag_preprocessor_resolution,
-    model_free_preprocessors,
-    preprocessor_filters,
-    HWC3,
-)
+from annotator.util import HWC3
 from scripts.logging import logger
 from scripts.controlnet_ui.openpose_editor import OpenposeEditor
 from scripts.controlnet_ui.preset import ControlNetPresetUI
@ -227,7 +221,6 @@ class ControlNetUiGroup(object):
        self,
        is_img2img: bool,
        default_unit: external_code.ControlNetUnit,
-        preprocessors: List[Callable],
        photopea: Optional[Photopea],
    ):
        # Whether callbacks have been registered.
@ -237,7 +230,6 @@ class ControlNetUiGroup(object):

        self.is_img2img = is_img2img
        self.default_unit = default_unit
-        self.preprocessors = preprocessors
        self.photopea = photopea
        self.webcam_enabled = False
        self.webcam_mirrored = False
@ -300,10 +292,6 @@ class ControlNetUiGroup(object):
        self.batch_image_dir_state = None
        self.output_dir_state = None

-        # Internal states for UI state pasting.
-        self.prevent_next_n_module_update = 0
-        self.prevent_next_n_slider_value_update = 0
-
        # API-only fields
        self.advanced_weighting = gr.State(None)
        self.ipadapter_input = gr.State(None)
@ -526,7 +514,7 @@ class ControlNetUiGroup(object):

        with gr.Row(elem_classes=["controlnet_control_type", "controlnet_row"]):
            self.type_filter = gr.Radio(
-                list(preprocessor_filters.keys()),
+                Preprocessor.get_all_preprocessor_tags(),
                label="Control Type",
                value="All",
                elem_id=f"{elem_id_tabname}_{tabname}_controlnet_type_filter_radio",
@ -535,7 +523,7 @@ class ControlNetUiGroup(object):

        with gr.Row(elem_classes=["controlnet_preprocessor_model", "controlnet_row"]):
            self.module = gr.Dropdown(
-                global_state.ui_preprocessor_keys,
+                [p.label for p in Preprocessor.get_sorted_preprocessors()],
                label="Preprocessor",
                value=self.default_unit.module,
                elem_id=f"{elem_id_tabname}_{tabname}_controlnet_preprocessor_dropdown",
@ -798,82 +786,21 @@ class ControlNetUiGroup(object):

    def register_build_sliders(self):
        def build_sliders(module: str, pp: bool):
-            logger.debug(
-                f"Prevent update slider value: {self.prevent_next_n_slider_value_update}"
-            )
-            logger.debug(f"Build slider for module: {module} - {pp}")
+            preprocessor = Preprocessor.get_preprocessor(module)
+            slider_resolution_kwargs = preprocessor.slider_resolution.gradio_update_kwargs.copy()

-            # Clear old slider values so that they do not cause confusion in
-            # infotext.
-            clear_slider_update = gr.update(
-                visible=False,
-                interactive=True,
-                minimum=-1,
-                maximum=-1,
-                value=-1,
-            )
+            if pp:
+                slider_resolution_kwargs['visible'] = False

-            grs = []
-            module = global_state.get_module_basename(module)
-            if module not in preprocessor_sliders_config:
-                default_res_slider_config = dict(
-                    label=flag_preprocessor_resolution,
-                    minimum=64,
-                    maximum=2048,
-                    step=1,
-                )
-                if self.prevent_next_n_slider_value_update == 0:
-                    default_res_slider_config["value"] = 512
-
-                grs += [
-                    gr.update(
-                        **default_res_slider_config,
-                        visible=not pp,
-                        interactive=True,
-                    ),
-                    copy(clear_slider_update),
-                    copy(clear_slider_update),
-                    gr.update(visible=True),
-                ]
-            else:
-                for slider_config in preprocessor_sliders_config[module]:
-                    if isinstance(slider_config, dict):
-                        visible = True
-                        if slider_config["name"] == flag_preprocessor_resolution:
-                            visible = not pp
-                        slider_update = gr.update(
-                            label=slider_config["name"],
-                            minimum=slider_config["min"],
-                            maximum=slider_config["max"],
-                            step=slider_config["step"]
-                            if "step" in slider_config
-                            else 1,
-                            visible=visible,
-                            interactive=True,
-                        )
-                        if self.prevent_next_n_slider_value_update == 0:
-                            slider_update["value"] = slider_config["value"]
-
-                        grs.append(slider_update)
-
-                    else:
-                        grs.append(copy(clear_slider_update))
-                while len(grs) < 3:
-                    grs.append(copy(clear_slider_update))
-                grs.append(gr.update(visible=True))
-            if module in model_free_preprocessors:
-                grs += [
-                    gr.update(visible=False, value="None"),
-                    gr.update(visible=False),
-                ]
-            else:
-                grs += [gr.update(visible=True), gr.update(visible=True)]
-
-            self.prevent_next_n_slider_value_update = max(
-                0, self.prevent_next_n_slider_value_update - 1
-            )
-
-            grs += [gr.update(visible=module not in no_control_mode_preprocessors)]
+            grs = [
+                gr.update(**slider_resolution_kwargs),
+                gr.update(**preprocessor.slider_1.gradio_update_kwargs.copy()),
+                gr.update(**preprocessor.slider_2.gradio_update_kwargs.copy()),
+                gr.update(visible=True),
+                gr.update(visible=not preprocessor.do_not_need_model),
+                gr.update(visible=not preprocessor.do_not_need_model),
+                gr.update(visible=preprocessor.show_control_mode),
+            ]

            return grs

@ -898,7 +825,6 @@ class ControlNetUiGroup(object):
        )

        def filter_selected(k: str):
-            logger.debug(f"Prevent update {self.prevent_next_n_module_update}")
            logger.debug(f"Switch to control type {k}")
            (
                filtered_preprocessor_list,
@ -906,22 +832,14 @@ class ControlNetUiGroup(object):
                default_option,
                default_model,
            ) = global_state.select_control_type(k, global_state.get_sd_version())
-
-            if self.prevent_next_n_module_update > 0:
-                self.prevent_next_n_module_update -= 1
-                return [
-                    gr.Dropdown.update(choices=filtered_preprocessor_list),
-                    gr.Dropdown.update(choices=filtered_model_list),
-                ]
-            else:
-                return [
-                    gr.Dropdown.update(
-                        value=default_option, choices=filtered_preprocessor_list
-                    ),
-                    gr.Dropdown.update(
-                        value=default_model, choices=filtered_model_list
-                    ),
-                ]
+            return [
+                gr.Dropdown.update(
+                    value=default_option, choices=filtered_preprocessor_list
+                ),
+                gr.Dropdown.update(
+                    value=default_model, choices=filtered_model_list
+                ),
+            ]

        self.type_filter.change(
            fn=filter_selected,
@ -959,7 +877,7 @@ class ControlNetUiGroup(object):
            )

    def register_run_annotator(self):
-        def run_annotator(image, module, pres, pthr_a, pthr_b, t2i_w, t2i_h, pp, rm):
+        def run_annotator(image, module, pres, pthr_a, pthr_b, t2i_w, t2i_h, pp, rm, model: str):
            if image is None:
                return (
                    gr.update(value=None, visible=True),
@ -981,8 +899,7 @@ class ControlNetUiGroup(object):
            ):
                img = HWC3(image["mask"][:, :, 0])

-            module = global_state.get_module_basename(module)
-            preprocessor = self.preprocessors[module]
+            preprocessor = Preprocessor.get_preprocessor(module)

            if pp:
                pres = external_code.pixel_perfect_resolution(
@ -1013,23 +930,25 @@ class ControlNetUiGroup(object):
            # effect.
            # TODO: Maybe we should let `preprocessor` return a Dict to alleviate this issue?
            # This requires changing all callsites though.
-            result, is_image = preprocessor(
+            result = preprocessor.cached_call(
                img,
-                res=pres,
-                thr_a=pthr_a,
-                thr_b=pthr_b,
+                resolution=pres,
+                slider_1=pthr_a,
+                slider_2=pthr_b,
                low_vram=(
                    ("clip" in module or module == "ip-adapter_face_id_plus")
                    and shared.opts.data.get("controlnet_clip_detector_on_cpu", False)
                ),
-                json_pose_callback=json_acceptor.accept
-                if is_openpose(module)
-                else None,
+                json_pose_callback=(
+                    json_acceptor.accept
+                    if is_openpose(module)
+                    else None
+                ),
+                model=model,
            )

-            if not is_image:
+            if not preprocessor.returns_image:
                result = img
-                is_image = True

            result = external_code.visualize_inpaint_mask(result)
            return (
@ -1057,6 +976,7 @@ class ControlNetUiGroup(object):
                else ControlNetUiGroup.a1111_context.txt2img_h_slider,
                self.pixel_perfect,
                self.resize_mode,
+                self.model,
            ],
            outputs=[
                self.generated_image,
--- a/scripts/controlnet_ui/preset.py
+++ b/scripts/controlnet_ui/preset.py
@ -7,8 +7,8 @@ from modules import scripts
 from scripts.infotext import parse_unit, serialize_unit
 from scripts.controlnet_ui.tool_button import ToolButton
 from scripts.logging import logger
-from scripts.processor import preprocessor_filters
 from scripts import external_code
+from scripts.supported_preprocessor import Preprocessor

 save_symbol = "\U0001f4be"  # 💾
 delete_symbol = "\U0001f5d1\ufe0f"  # 🗑️
@ -38,7 +38,7 @@ def infer_control_type(module: str, model: str) -> str:
    def matches_control_type(input_string: str, control_type: str) -> bool:
        return any(t.lower() in input_string for t in control_type.split("/"))

-    control_types = preprocessor_filters.keys()
+    control_types = Preprocessor.get_all_preprocessor_tags()
    control_type_candidates = [
        control_type
        for control_type in control_types
--- a/scripts/global_state.py
+++ b/scripts/global_state.py
@ -1,17 +1,14 @@
 import os.path
 import stat
-import functools
 from collections import OrderedDict

 from modules import shared, scripts, sd_models
 from modules.paths import models_path
-from scripts.processor import *  # noqa: E403
-import scripts.processor as processor
-from scripts.utils import ndarray_lru_cache
-from scripts.logging import logger
-from scripts.enums import StableDiffusionVersion

-from typing import Dict, Callable, Optional, Tuple, List
+from scripts.enums import StableDiffusionVersion
+from scripts.supported_preprocessor import Preprocessor
+
+from typing import Dict, Tuple, List

 CN_MODEL_EXTS = [".pt", ".pth", ".ckpt", ".safetensors", ".bin"]
 cn_models_dir = os.path.join(models_path, "ControlNet")
@ -19,187 +16,6 @@ cn_models_dir_old = os.path.join(scripts.basedir(), "models")
 cn_models = OrderedDict()      # "My_Lora(abcd1234)" -> C:/path/to/model.safetensors
 cn_models_names = {}  # "my_lora" -> "My_Lora(abcd1234)"

-def cache_preprocessors(preprocessor_modules: Dict[str, Callable]) -> Dict[str, Callable]:
-    """ We want to share the preprocessor results in a single big cache, instead of a small
-     cache for each preprocessor function. """
-    CACHE_SIZE = getattr(shared.cmd_opts, "controlnet_preprocessor_cache_size", 0)
-
-    # Set CACHE_SIZE = 0 will completely remove the caching layer. This can be
-    # helpful when debugging preprocessor code.
-    if CACHE_SIZE == 0:
-        return preprocessor_modules
-
-    logger.debug(f'Create LRU cache (max_size={CACHE_SIZE}) for preprocessor results.')
-
-    @ndarray_lru_cache(max_size=CACHE_SIZE)
-    def unified_preprocessor(preprocessor_name: str, *args, **kwargs):
-        logger.debug(f'Calling preprocessor {preprocessor_name} outside of cache.')
-        return preprocessor_modules[preprocessor_name](*args, **kwargs)
-
-    # TODO: Introduce a seed parameter for shuffle preprocessor?
-    uncacheable_preprocessors = ['shuffle']
-
-    return {
-        k: (
-            v if k in uncacheable_preprocessors
-            else functools.partial(unified_preprocessor, k)
-        )
-        for k, v
-        in preprocessor_modules.items()
-    }
-
-cn_preprocessor_modules = {
-    "none": lambda x, *args, **kwargs: (x, True),
-    "canny": canny,
-    "depth": midas,
-    "depth_leres": functools.partial(leres, boost=False),
-    "depth_leres++": functools.partial(leres, boost=True),
-    "depth_hand_refiner": g_hand_refiner_model.run_model,
-    "depth_anything": functools.partial(depth_anything, colored=False),
-    "hed": hed,
-    "hed_safe": hed_safe,
-    "mediapipe_face": mediapipe_face,
-    "mlsd": mlsd,
-    "normal_map": midas_normal,
-    "openpose": functools.partial(g_openpose_model.run_model, include_body=True, include_hand=False, include_face=False),
-    "openpose_hand": functools.partial(g_openpose_model.run_model, include_body=True, include_hand=True, include_face=False),
-    "openpose_face": functools.partial(g_openpose_model.run_model, include_body=True, include_hand=False, include_face=True),
-    "openpose_faceonly": functools.partial(g_openpose_model.run_model, include_body=False, include_hand=False, include_face=True),
-    "openpose_full": functools.partial(g_openpose_model.run_model, include_body=True, include_hand=True, include_face=True),
-    "dw_openpose_full": functools.partial(g_openpose_model.run_model, include_body=True, include_hand=True, include_face=True, use_dw_pose=True),
-    "animal_openpose": functools.partial(g_openpose_model.run_model, include_body=True, include_hand=False, include_face=False, use_animal_pose=True),
-    "clip_vision": functools.partial(clip, config='clip_vitl'),
-    "revision_clipvision": functools.partial(clip, config='clip_g'),
-    "revision_ignore_prompt": functools.partial(clip, config='clip_g'),
-    "ip-adapter_clip_sd15": functools.partial(clip, config='clip_h'),
-    "ip-adapter_clip_sdxl_plus_vith": functools.partial(clip, config='clip_h'),
-    "ip-adapter_clip_sdxl": functools.partial(clip, config='clip_g'),
-    "ip-adapter_face_id": g_insight_face_model.run_model,
-    "ip-adapter_face_id_plus": face_id_plus,
-    "instant_id_face_keypoints": functools.partial(g_insight_face_instant_id_model.run_model_instant_id, return_keypoints=True),
-    "instant_id_face_embedding": functools.partial(g_insight_face_instant_id_model.run_model_instant_id, return_keypoints=False),
-    "color": color,
-    "pidinet": pidinet,
-    "pidinet_safe": pidinet_safe,
-    "pidinet_sketch": pidinet_ts,
-    "pidinet_scribble": scribble_pidinet,
-    "scribble_xdog": scribble_xdog,
-    "scribble_hed": scribble_hed,
-    "segmentation": uniformer,
-    "threshold": threshold,
-    "depth_zoe": zoe_depth,
-    "normal_bae": normal_bae,
-    "oneformer_coco": oneformer_coco,
-    "oneformer_ade20k": oneformer_ade20k,
-    "lineart": lineart,
-    "lineart_coarse": lineart_coarse,
-    "lineart_anime": lineart_anime,
-    "lineart_standard": lineart_standard,
-    "shuffle": shuffle,
-    "tile_resample": tile_resample,
-    "invert": invert,
-    "lineart_anime_denoise": lineart_anime_denoise,
-    "reference_only": identity,
-    "reference_adain": identity,
-    "reference_adain+attn": identity,
-    "inpaint": identity,
-    "inpaint_only": identity,
-    "inpaint_only+lama": lama_inpaint,
-    "tile_colorfix": identity,
-    "tile_colorfix+sharp": identity,
-    "recolor_luminance": recolor_luminance,
-    "recolor_intensity": recolor_intensity,
-    "blur_gaussian": blur_gaussian,
-    "anime_face_segment": anime_face_segment,
-    "densepose": functools.partial(densepose, cmap="viridis"),
-    "densepose_parula": functools.partial(densepose, cmap="parula"),
-    "te_hed":te_hed,
-    "normal_dsine": normal_dsine,
-}
-
-cn_preprocessor_unloadable = {
-    "hed": unload_hed,
-    "fake_scribble": unload_hed,
-    "mlsd": unload_mlsd,
-    "clip_vision": functools.partial(unload_clip, config='clip_vitl'),
-    "revision_clipvision": functools.partial(unload_clip, config='clip_g'),
-    "revision_ignore_prompt": functools.partial(unload_clip, config='clip_g'),
-    "ip-adapter_clip_sd15": functools.partial(unload_clip, config='clip_h'),
-    "ip-adapter_clip_sdxl_plus_vith": functools.partial(unload_clip, config='clip_h'),
-    "ip-adapter_face_id_plus": functools.partial(unload_clip, config='clip_h'),
-    "ip-adapter_clip_sdxl": functools.partial(unload_clip, config='clip_g'),
-    "depth": unload_midas,
-    "depth_leres": unload_leres,
-    "depth_anything": unload_depth_anything,
-    "normal_map": unload_midas,
-    "pidinet": unload_pidinet,
-    "openpose": g_openpose_model.unload,
-    "openpose_hand": g_openpose_model.unload,
-    "openpose_face": g_openpose_model.unload,
-    "openpose_full": g_openpose_model.unload,
-    "dw_openpose_full": g_openpose_model.unload,
-    "animal_openpose": g_openpose_model.unload,
-    "segmentation": unload_uniformer,
-    "depth_zoe": unload_zoe_depth,
-    "normal_bae": unload_normal_bae,
-    "oneformer_coco": unload_oneformer_coco,
-    "oneformer_ade20k": unload_oneformer_ade20k,
-    "lineart": unload_lineart,
-    "lineart_coarse": unload_lineart_coarse,
-    "lineart_anime": unload_lineart_anime,
-    "lineart_anime_denoise": unload_lineart_anime_denoise,
-    "inpaint_only+lama": unload_lama_inpaint,
-    "anime_face_segment": unload_anime_face_segment,
-    "densepose": unload_densepose,
-    "densepose_parula": unload_densepose,
-    "depth_hand_refiner": g_hand_refiner_model.unload,
-    "te_hed":unload_te_hed,
-    "normal_dsine": unload_normal_dsine,
-}
-
-preprocessor_aliases = {
-    "invert": "invert (from white bg & black line)",
-    "lineart_standard": "lineart_standard (from white bg & black line)",
-    "lineart": "lineart_realistic",
-    "color": "t2ia_color_grid",
-    "clip_vision": "t2ia_style_clipvision",
-    "pidinet_sketch": "t2ia_sketch_pidi",
-    "depth": "depth_midas",
-    "normal_map": "normal_midas",
-    "hed": "softedge_hed",
-    "hed_safe": "softedge_hedsafe",
-    "pidinet": "softedge_pidinet",
-    "pidinet_safe": "softedge_pidisafe",
-    "segmentation": "seg_ufade20k",
-    "oneformer_coco": "seg_ofcoco",
-    "oneformer_ade20k": "seg_ofade20k",
-    "pidinet_scribble": "scribble_pidinet",
-    "inpaint": "inpaint_global_harmonious",
-    "anime_face_segment": "seg_anime_face",
-    "densepose": "densepose (pruple bg & purple torso)",
-    "densepose_parula": "densepose_parula (black bg & blue torso)",
-    "te_hed": "softedge_teed",
-    "ip-adapter_clip_sd15": "ip-adapter_clip_h",
-    "ip-adapter_clip_sdxl": "ip-adapter_clip_g",
-}
-
-# Preprocessor that automatically maps to other preprocessors.
-meta_preprocessors = ["ip-adapter-auto"]
-
-ui_preprocessor_keys = ['none', preprocessor_aliases['invert']]
-ui_preprocessor_keys += meta_preprocessors
-ui_preprocessor_keys += sorted([preprocessor_aliases.get(k, k)
-                                for k in cn_preprocessor_modules.keys()
-                                if preprocessor_aliases.get(k, k) not in ui_preprocessor_keys])
-
-reverse_preprocessor_aliases = {preprocessor_aliases[k]: k for k in preprocessor_aliases.keys()}
-
-
-def get_module_basename(module: Optional[str]) -> str:
-    if module is None:
-        module = 'none'
-    return reverse_preprocessor_aliases.get(module, module)
-

 default_detectedmap_dir = os.path.join("detected_maps")
 script_dir = scripts.basedir()
@ -300,50 +116,28 @@ def select_control_type(
    sd_version: StableDiffusionVersion = StableDiffusionVersion.UNKNOWN,
    cn_models: Dict = cn_models, # Override or testing
 ) -> Tuple[List[str], List[str], str, str]:
-    default_option = processor.preprocessor_filters[control_type]
    pattern = control_type.lower()
-    preprocessor_list = ui_preprocessor_keys
    all_models = list(cn_models.keys())

    if pattern == "all":
        return [
-            preprocessor_list,
+            [p.label for p in Preprocessor.get_sorted_preprocessors()],
            all_models,
            'none', #default option
            "None"  #default model
        ]
-    filtered_preprocessor_list = [
-        x
-        for x in preprocessor_list
-        if ((
-            pattern in x.lower() or
-            any(a in x.lower() for a in processor.preprocessor_filters_aliases.get(pattern, [])) or
-            x.lower() == "none"
-        ) and (
-            sd_version.is_compatible_with(StableDiffusionVersion.detect_from_model_name(x))
-        ))
-    ]
-    if pattern in ["canny", "lineart", "scribble/sketch", "mlsd"]:
-        filtered_preprocessor_list += [
-            x for x in preprocessor_list if "invert" in x.lower()
-        ]
-    if pattern in ["sparsectrl"]:
-        filtered_preprocessor_list += [
-            x for x in preprocessor_list if "scribble" in x.lower()
-        ]
+
    filtered_model_list = [
        model for model in all_models
        if model.lower() == "none" or
        ((
            pattern in model.lower() or
-            any(a in model.lower() for a in processor.preprocessor_filters_aliases.get(pattern, []))
+            any(a in model.lower() for a in Preprocessor.tag_to_filters(control_type))
        ) and (
            sd_version.is_compatible_with(StableDiffusionVersion.detect_from_model_name(model))
        ))
    ]
    assert len(filtered_model_list) > 0, "'None' model should always be available."
-    if default_option not in filtered_preprocessor_list:
-        default_option = filtered_preprocessor_list[0]
    if len(filtered_model_list) == 1:
        default_model = "None"
    else:
@ -354,8 +148,10 @@ def select_control_type(
                break

    return (
-        filtered_preprocessor_list,
+        [p.label for p in Preprocessor.get_filtered_preprocessors(control_type)],
        filtered_model_list,
-        default_option,
+        Preprocessor.get_default_preprocessor(control_type).label,
        default_model
    )
+
+
--- a/scripts/preprocessor/init.py
+++ b/scripts/preprocessor/init.py
@ -0,0 +1,4 @@
+from .ip_adapter_auto import *
+from .normal_dsine import *
+from .model_free_preprocessors import *
+from .legacy.legacy_preprocessors import *
--- a/scripts/preprocessor/ip_adapter_auto.py
+++ b/scripts/preprocessor/ip_adapter_auto.py
@ -0,0 +1,25 @@
+from ..ipadapter.presets import IPAdapterPreset
+from ..supported_preprocessor import Preprocessor
+from ..logging import logger
+
+
+class PreprocessorIPAdapterAuto(Preprocessor):
+    """Meta preprocessor that forwards to the preprocessor matching the model.
+
+    The concrete preprocessor is picked per call: the `model` keyword argument
+    is matched against `IPAdapterPreset`, and the preset's `module` names the
+    preprocessor that actually handles the call.
+    """
+
+    def __init__(self):
+        super().__init__(name="ip-adapter-auto")
+        self.sorting_priority = 1000
+        self.tags = ["IP-Adapter"]
+        self.show_control_mode = False
+        self.returns_image = False
+
+    def __call__(self, *args, **kwargs):
+        """Resolve the target preprocessor from `kwargs["model"]` and call it.
+
+        All positional and keyword arguments (including `model`) are passed
+        through unchanged; the delegate's return value is returned as-is.
+        """
+        assert "model" in kwargs
+        model_name: str = kwargs["model"]
+        preset = IPAdapterPreset.match_model(model_name)
+        target_module: str = preset.module
+        logger.info(f"ip-adapter-auto => {target_module}")
+
+        delegate = Preprocessor.get_preprocessor(target_module)
+        assert delegate is not None
+        return delegate(*args, **kwargs)
+
+
+# Runs at import time: hands one PreprocessorIPAdapterAuto instance to
+# Preprocessor.add_supported_preprocessor.
+Preprocessor.add_supported_preprocessor(PreprocessorIPAdapterAuto())
--- a/scripts/preprocessor/legacy/legacy_preprocessors.py
+++ b/scripts/preprocessor/legacy/legacy_preprocessors.py
@ -0,0 +1,112 @@
+# This is a python script to convert all old preprocessors to the new format.
+# However, the old preprocessors are not very memory efficient,
+# and eventually we should move all old preprocessors to the new format manually.
+# See also forge_preprocessor_normalbae/scripts/preprocessor_normalbae for
+# how to write a better implementation of a preprocessor.
+# No newer preprocessors should be written in this legacy way.
+
+# Please never add new legacy preprocessors.
+# The new forge_preprocessor_normalbae/scripts/preprocessor_normalbae
+# is much more efficient and maintainable.
+
+
+from annotator.util import HWC3
+from .preprocessor_compiled import legacy_preprocessors
+from ...supported_preprocessor import Preprocessor, PreprocessorParameter
+
+
+###
+
+# This file has lots of unreasonable historical designs and should be viewed as a frozen blackbox library.
+
+# If you want to add a preprocessor,
+# please instead look at `extensions-builtin/forge_preprocessor_normalbae/scripts/preprocessor_normalbae`.
+# If you want to use a preprocessor,
+# please instead use `from modules_forge.shared import supported_preprocessors`
+# and then use any preprocessor like: depth_midas = supported_preprocessors['depth_midas']
+
+# Please do not hack/edit/modify/rely on any code in this file.
+
+# Never use methods in this file to add anything!
+# This file will eventually be removed, but the workload is very high and we need more time to do this.
+
+###
+
+
+class LegacyPreprocessor(Preprocessor):
+    """Adapter that exposes one old-style preprocessor entry as a `Preprocessor`.
+
+    `legacy_dict` is read for the keys "label", "call_function",
+    "unload_function", "managed_model", "model_free", "no_control_mode",
+    "priority", "tags", "resolution", "slider_1", "slider_2" and "slider_3",
+    plus the optional "returns_image" (default True) and
+    "use_soft_projection_in_hr_fix" (default False).
+    """
+
+    def __init__(self, name: str, legacy_dict):
+        super().__init__(name)
+        self._label = legacy_dict["label"]
+        self.call_function = legacy_dict["call_function"]
+        self.unload_function = legacy_dict["unload_function"]
+        self.managed_model = legacy_dict["managed_model"]
+        self.do_not_need_model = legacy_dict["model_free"]
+        self.show_control_mode = not legacy_dict["no_control_mode"]
+        self.sorting_priority = legacy_dict["priority"]
+        self.tags = legacy_dict["tags"]
+        self.returns_image = legacy_dict.get("returns_image", True)
+
+        if legacy_dict.get("use_soft_projection_in_hr_fix", False):
+            self.use_soft_projection_in_hr_fix = True
+
+        # The resolution slider always gets a fixed label and step, whatever
+        # the legacy entry says.
+        # NOTE(review): the UI code reads `preprocessor.slider_resolution`
+        # while this stores `self.resolution` -- confirm the base class
+        # bridges the two names.
+        self.resolution = self._build_parameter(
+            legacy_dict["resolution"], label="Resolution", step=8
+        )
+        self.slider_1 = self._build_parameter(legacy_dict["slider_1"])
+        self.slider_2 = self._build_parameter(legacy_dict["slider_2"])
+        self.slider_3 = self._build_parameter(legacy_dict["slider_3"])
+
+    @staticmethod
+    def _build_parameter(config, **overrides):
+        """Turn a legacy slider config (a dict, or None) into a PreprocessorParameter.
+
+        `None` yields a hidden parameter. Otherwise the config is merged with
+        `overrides` into a fresh dict, so the caller's config dict is never
+        modified, and the parameter is created visible.
+        """
+        if config is None:
+            return PreprocessorParameter(visible=False)
+        return PreprocessorParameter(**{**config, **overrides}, visible=True)
+
+    def __call__(
+        self,
+        input_image,
+        resolution,
+        slider_1=None,
+        slider_2=None,
+        slider_3=None,
+        **kwargs
+    ):
+        """Run the wrapped legacy function and return its result.
+
+        `resolution`, `slider_1` and `slider_2` are forwarded under the legacy
+        names `res`, `thr_a` and `thr_b`; extra keyword arguments are passed
+        through. When the legacy function reports an image result it is
+        normalised with `HWC3` before being returned.
+        """
+        # Legacy preprocessors do not have slider 3.
+        del slider_3
+
+        if self.managed_model is not None:
+            assert self.unload_function is not None
+
+        try:
+            result, is_image = self.call_function(
+                img=input_image, res=resolution, thr_a=slider_1, thr_b=slider_2, **kwargs
+            )
+
+            if is_image:
+                result = HWC3(result)
+        finally:
+            # Unload even when the call fails, so an error does not leave the
+            # legacy model loaded.
+            if self.unload_function is not None:
+                self.unload_function()
+
+        return result
+
+
+# Runs at import time: wrap every entry of `legacy_preprocessors` in a
+# LegacyPreprocessor and pass it to Preprocessor.add_supported_preprocessor.
+for name, data in legacy_preprocessors.items():
+    p = LegacyPreprocessor(name, data)
+    Preprocessor.add_supported_preprocessor(p)
--- a/scripts/preprocessor/legacy/preprocessor_compiled.py
+++ b/scripts/preprocessor/legacy/preprocessor_compiled.py
--- a/scripts/preprocessor/legacy/processor.py
+++ b/scripts/preprocessor/legacy/processor.py
@ -51,24 +51,9 @@ def resize_image_with_pad(input_image, resolution, skip_hwc3=False):
    return safer_memory(img_padded), remove_pad


-model_canny = None
-
-
 def canny(img, res=512, thr_a=100, thr_b=200, **kwargs):
-    l, h = thr_a, thr_b  # noqa: E741
    img, remove_pad = resize_image_with_pad(img, res)
-    global model_canny
-    if model_canny is None:
-        from annotator.canny import apply_canny
-        model_canny = apply_canny
-    result = model_canny(img, l, h)
-    return remove_pad(result), True
-
-
-def scribble_thr(img, res=512, **kwargs):
-    img, remove_pad = resize_image_with_pad(img, res)
-    result = np.zeros_like(img, dtype=np.uint8)
-    result[np.min(img, axis=2) < 127] = 255
+    result = cv2.Canny(img, thr_a, thr_b)
    return remove_pad(result), True


@ -620,20 +605,6 @@ def unload_oneformer_ade20k():
        model_oneformer_ade20k.unload_model()


-model_shuffle = None
-
-
-def shuffle(img, res=512, **kwargs):
-    img, remove_pad = resize_image_with_pad(img, res)
-    img = remove_pad(img)
-    global model_shuffle
-    if model_shuffle is None:
-        from annotator.shuffle import ContentShuffleDetector
-        model_shuffle = ContentShuffleDetector()
-    result = model_shuffle(img)
-    return result, True
-
-
 def recolor_luminance(img, res=512, thr_a=1.0, **kwargs):
    result = cv2.cvtColor(HWC3(img), cv2.COLOR_BGR2LAB)
    result = result[:, :, 0].astype(np.float32) / 255.0
@ -706,25 +677,6 @@ def unload_te_hed():
    if model_te_hed is not None:
        model_te_hed.unload_model()

-
-model_normal_dsine = None
-
-
-def normal_dsine(img, res=512, thr_a=60.0,thr_b=5, **kwargs):
-    global model_normal_dsine
-    if model_normal_dsine is None:
-        from annotator.normaldsine import NormalDsineDetector
-        model_normal_dsine = NormalDsineDetector()
-    result = model_normal_dsine(img, new_fov=float(thr_a), iterations=int(thr_b), resulotion=res)
-    return result, True
-
-
-def unload_normal_dsine():
-    global model_normal_dsine
-    if model_normal_dsine is not None:
-        model_normal_dsine.unload_model()
-
-
 class InsightFaceModel:
    def __init__(self, face_analysis_model_name: str = "buffalo_l"):
        self.model = None
@ -775,7 +727,7 @@ class InsightFaceModel:

    def run_model(self, img: np.ndarray, **kwargs) -> Tuple[torch.Tensor, bool]:
        self.load_model()
-        assert img.shape[2] == 3, f"Expect 3 channels, but get {img.shape} channels"
+        img = img[:, :, :3]  # Drop alpha channel if there is one.
        faces = self.model.get(cv2.cvtColor(img, cv2.COLOR_RGB2BGR))
        face = InsightFaceModel.pick_largest_face(faces)
        return torch.from_numpy(face.normed_embedding).unsqueeze(0), False
@ -886,487 +838,3 @@ class HandRefinerModel:


 g_hand_refiner_model = HandRefinerModel()
-
-
-model_free_preprocessors = [
-    "reference_only",
-    "reference_adain",
-    "reference_adain+attn",
-    "revision_clipvision",
-    "revision_ignore_prompt"
-]
-
-no_control_mode_preprocessors = [
-    "revision_clipvision",
-    "revision_ignore_prompt",
-    "clip_vision",
-    "ip-adapter_clip_sd15",
-    "ip-adapter_clip_sdxl",
-    "ip-adapter_clip_sdxl_plus_vith",
-    "t2ia_style_clipvision",
-    "ip-adapter_face_id",
-    "ip-adapter_face_id_plus",
-]
-
-flag_preprocessor_resolution = "Preprocessor Resolution"
-preprocessor_sliders_config = {
-    "none": [],
-    "inpaint": [],
-    "inpaint_only": [],
-    "revision_clipvision": [
-        None,
-        {
-            "name": "Noise Augmentation",
-            "value": 0.0,
-            "min": 0.0,
-            "max": 1.0
-        },
-    ],
-    "revision_ignore_prompt": [
-        None,
-        {
-            "name": "Noise Augmentation",
-            "value": 0.0,
-            "min": 0.0,
-            "max": 1.0
-        },
-    ],
-    "canny": [
-        {
-            "name": flag_preprocessor_resolution,
-            "value": 512,
-            "min": 64,
-            "max": 2048
-        },
-        {
-            "name": "Canny Low Threshold",
-            "value": 100,
-            "min": 1,
-            "max": 255
-        },
-        {
-            "name": "Canny High Threshold",
-            "value": 200,
-            "min": 1,
-            "max": 255
-        },
-    ],
-    "mlsd": [
-        {
-            "name": flag_preprocessor_resolution,
-            "min": 64,
-            "max": 2048,
-            "value": 512
-        },
-        {
-            "name": "MLSD Value Threshold",
-            "min": 0.01,
-            "max": 2.0,
-            "value": 0.1,
-            "step": 0.01
-        },
-        {
-            "name": "MLSD Distance Threshold",
-            "min": 0.01,
-            "max": 20.0,
-            "value": 0.1,
-            "step": 0.01
-        }
-    ],
-    "hed": [
-        {
-            "name": flag_preprocessor_resolution,
-            "min": 64,
-            "max": 2048,
-            "value": 512
-        }
-    ],
-    "scribble_hed": [
-        {
-            "name": flag_preprocessor_resolution,
-            "min": 64,
-            "max": 2048,
-            "value": 512
-        }
-    ],
-    "hed_safe": [
-        {
-            "name": flag_preprocessor_resolution,
-            "min": 64,
-            "max": 2048,
-            "value": 512
-        }
-    ],
-    "openpose": [
-        {
-            "name": flag_preprocessor_resolution,
-            "min": 64,
-            "max": 2048,
-            "value": 512
-        }
-    ],
-    "openpose_full": [
-        {
-            "name": flag_preprocessor_resolution,
-            "min": 64,
-            "max": 2048,
-            "value": 512
-        }
-    ],
-    "dw_openpose_full": [
-        {
-            "name": flag_preprocessor_resolution,
-            "min": 64,
-            "max": 2048,
-            "value": 512
-        }
-    ],
-    "animal_openpose": [
-        {
-            "name": flag_preprocessor_resolution,
-            "min": 64,
-            "max": 2048,
-            "value": 512
-        }
-    ],
-    "segmentation": [
-        {
-            "name": flag_preprocessor_resolution,
-            "min": 64,
-            "max": 2048,
-            "value": 512
-        }
-    ],
-    "depth": [
-        {
-            "name": flag_preprocessor_resolution,
-            "min": 64,
-            "max": 2048,
-            "value": 512
-        }
-    ],
-    "depth_leres": [
-        {
-            "name": flag_preprocessor_resolution,
-            "min": 64,
-            "max": 2048,
-            "value": 512
-        },
-        {
-            "name": "Remove Near %",
-            "min": 0,
-            "max": 100,
-            "value": 0,
-            "step": 0.1,
-        },
-        {
-            "name": "Remove Background %",
-            "min": 0,
-            "max": 100,
-            "value": 0,
-            "step": 0.1,
-        }
-    ],
-    "depth_leres++": [
-        {
-            "name": flag_preprocessor_resolution,
-            "min": 64,
-            "max": 2048,
-            "value": 512
-        },
-        {
-            "name": "Remove Near %",
-            "min": 0,
-            "max": 100,
-            "value": 0,
-            "step": 0.1,
-        },
-        {
-            "name": "Remove Background %",
-            "min": 0,
-            "max": 100,
-            "value": 0,
-            "step": 0.1,
-        }
-    ],
-    "normal_map": [
-        {
-            "name": flag_preprocessor_resolution,
-            "min": 64,
-            "max": 2048,
-            "value": 512
-        },
-        {
-            "name": "Normal Background Threshold",
-            "min": 0.0,
-            "max": 1.0,
-            "value": 0.4,
-            "step": 0.01
-        }
-    ],
-    "threshold": [
-        {
-            "name": flag_preprocessor_resolution,
-            "value": 512,
-            "min": 64,
-            "max": 2048
-        },
-        {
-            "name": "Binarization Threshold",
-            "min": 0,
-            "max": 255,
-            "value": 127
-        }
-    ],
-
-    "scribble_xdog": [
-        {
-            "name": flag_preprocessor_resolution,
-            "value": 512,
-            "min": 64,
-            "max": 2048
-        },
-        {
-            "name": "XDoG Threshold",
-            "min": 1,
-            "max": 64,
-            "value": 32,
-        }
-    ],
-    "blur_gaussian": [
-        {
-            "name": flag_preprocessor_resolution,
-            "value": 512,
-            "min": 64,
-            "max": 2048
-        },
-        {
-            "name": "Sigma",
-            "min": 0.01,
-            "max": 64.0,
-            "value": 9.0,
-        }
-    ],
-    "tile_resample": [
-        None,
-        {
-            "name": "Down Sampling Rate",
-            "value": 1.0,
-            "min": 1.0,
-            "max": 8.0,
-            "step": 0.01
-        }
-    ],
-    "tile_colorfix": [
-        None,
-        {
-            "name": "Variation",
-            "value": 8.0,
-            "min": 3.0,
-            "max": 32.0,
-            "step": 1.0
-        }
-    ],
-    "tile_colorfix+sharp": [
-        None,
-        {
-            "name": "Variation",
-            "value": 8.0,
-            "min": 3.0,
-            "max": 32.0,
-            "step": 1.0
-        },
-        {
-            "name": "Sharpness",
-            "value": 1.0,
-            "min": 0.0,
-            "max": 2.0,
-            "step": 0.01
-        }
-    ],
-    "reference_only": [
-        None,
-        {
-            "name": r'Style Fidelity (only for "Balanced" mode)',
-            "value": 0.5,
-            "min": 0.0,
-            "max": 1.0,
-            "step": 0.01
-        }
-    ],
-    "reference_adain": [
-        None,
-        {
-            "name": r'Style Fidelity (only for "Balanced" mode)',
-            "value": 0.5,
-            "min": 0.0,
-            "max": 1.0,
-            "step": 0.01
-        }
-    ],
-    "reference_adain+attn": [
-        None,
-        {
-            "name": r'Style Fidelity (only for "Balanced" mode)',
-            "value": 0.5,
-            "min": 0.0,
-            "max": 1.0,
-            "step": 0.01
-        }
-    ],
-    "inpaint_only+lama": [],
-    "color": [
-        {
-            "name": flag_preprocessor_resolution,
-            "value": 512,
-            "min": 64,
-            "max": 2048,
-        }
-    ],
-    "mediapipe_face": [
-        {
-            "name": flag_preprocessor_resolution,
-            "value": 512,
-            "min": 64,
-            "max": 2048,
-        },
-        {
-            "name": "Max Faces",
-            "value": 1,
-            "min": 1,
-            "max": 10,
-            "step": 1
-        },
-        {
-            "name": "Min Face Confidence",
-            "value": 0.5,
-            "min": 0.01,
-            "max": 1.0,
-            "step": 0.01
-        }
-    ],
-    "recolor_luminance": [
-        None,
-        {
-            "name": "Gamma Correction",
-            "value": 1.0,
-            "min": 0.1,
-            "max": 2.0,
-            "step": 0.001
-        }
-    ],
-    "recolor_intensity": [
-        None,
-        {
-            "name": "Gamma Correction",
-            "value": 1.0,
-            "min": 0.1,
-            "max": 2.0,
-            "step": 0.001
-        }
-    ],
-    "anime_face_segment": [
-        {
-            "name": flag_preprocessor_resolution,
-            "value": 512,
-            "min": 64,
-            "max": 2048
-        }
-    ],
-    "densepose": [
-        {
-            "name": flag_preprocessor_resolution,
-            "min": 64,
-            "max": 2048,
-            "value": 512
-        }
-    ],
-    "densepose_parula": [
-        {
-            "name": flag_preprocessor_resolution,
-            "min": 64,
-            "max": 2048,
-            "value": 512
-        }
-    ],
-    "depth_hand_refiner": [
-        {
-            "name": flag_preprocessor_resolution,
-            "value": 512,
-            "min": 64,
-            "max": 2048
-        }
-    ],
-    "te_hed": [
-        {
-            "name": flag_preprocessor_resolution,
-            "value": 512,
-            "min": 64,
-            "max": 2048
-        },
-        {
-            "name": "Safe Steps",
-            "min": 0,
-            "max": 10,
-            "value": 2,
-            "step": 1,
-        },
-    ],
-    "normal_dsine": [
-        {
-            "name": flag_preprocessor_resolution,
-            "min": 64,
-            "max": 2048,
-            "value": 512
-        },
-        {
-            "name": "Fov",
-            "min": 0.0,
-            "max": 360.0,
-            "value": 60.0,
-            "step": 0.1,
-        },
-        {
-            "name": "Iterations",
-            "min": 1,
-            "max": 20,
-            "value": 5,
-            "step": 1,
-        },
-    ],
-}
-
-preprocessor_filters = {
-    "All": "none",
-    "Canny": "canny",
-    "Depth": "depth_midas",
-    "NormalMap": "normal_bae",
-    "OpenPose": "openpose_full",
-    "MLSD": "mlsd",
-    "Lineart": "lineart_standard (from white bg & black line)",
-    "SoftEdge": "softedge_pidinet",
-    "Scribble/Sketch": "scribble_pidinet",
-    "Segmentation": "seg_ofade20k",
-    "Shuffle": "shuffle",
-    "Tile/Blur": "tile_resample",
-    "Inpaint": "inpaint_only",
-    "InstructP2P": "none",
-    "Reference": "reference_only",
-    "Recolor": "recolor_luminance",
-    "Revision": "revision_clipvision",
-    "T2I-Adapter": "none",
-    "IP-Adapter": "ip-adapter-auto",
-    "Instant_ID": "instant_id",
-    "SparseCtrl": "none",
-}
-
-preprocessor_filters_aliases = {
-    'instructp2p': ['ip2p'],
-    'segmentation': ['seg'],
-    'normalmap': ['normal'],
-    't2i-adapter': ['t2i_adapter', 't2iadapter', 't2ia'],
-    'ip-adapter': ['ip_adapter', 'ipadapter'],
-    'scribble/sketch': ['scribble', 'sketch'],
-    'tile/blur': ['tile', 'blur'],
-    'openpose':['openpose', 'densepose'],
-}  # must use all lower texts
--- a/scripts/preprocessor/model_free_preprocessors.py
+++ b/scripts/preprocessor/model_free_preprocessors.py
@ -0,0 +1,184 @@
+"""Preprocessors that do not need to run a torch model."""
+
+import cv2
+import numpy as np
+
+from ..supported_preprocessor import Preprocessor, PreprocessorParameter
+from ..utils import resize_image_with_pad
+from annotator.util import HWC3
+
+
+class PreprocessorNone(Preprocessor):
+    """Pass-through preprocessor registered under the name "none"."""
+
+    def __init__(self):
+        super().__init__(name="none")
+        self.sorting_priority = 10
+
+    def __call__(
+        self,
+        input_image,
+        resolution,
+        slider_1=None,
+        slider_2=None,
+        slider_3=None,
+        input_mask=None,
+        **kwargs
+    ):
+        """Return ``input_image`` unchanged; every other argument is ignored."""
+        return input_image
+
+
+class PreprocessorCanny(Preprocessor):
+    """Edge-map preprocessor built on ``cv2.Canny``.
+
+    ``slider_1`` and ``slider_2`` carry the two thresholds handed to
+    ``cv2.Canny`` (labelled "Low Threshold" and "High Threshold" in the UI).
+    """
+
+    def __init__(self):
+        super().__init__(name="canny")
+        self.tags = ["Canny"]
+        self.sorting_priority = 100
+        self.use_soft_projection_in_hr_fix = True
+        self.slider_1 = PreprocessorParameter(
+            label="Low Threshold", minimum=1, maximum=255, step=1, value=100
+        )
+        self.slider_2 = PreprocessorParameter(
+            label="High Threshold", minimum=1, maximum=255, step=1, value=200
+        )
+
+    def __call__(
+        self,
+        input_image,
+        resolution,
+        slider_1=None,
+        slider_2=None,
+        slider_3=None,
+        **kwargs
+    ):
+        """Resize/pad the input, run Canny, and return the edges as a 3-channel image.
+
+        The padding added by ``resize_image_with_pad`` is stripped from the
+        result before it is returned. ``slider_3`` and extra keyword
+        arguments are ignored.
+        """
+        padded, remove_pad = resize_image_with_pad(input_image, resolution)
+        low_threshold = int(slider_1)
+        high_threshold = int(slider_2)
+        edges = cv2.Canny(padded, low_threshold, high_threshold)
+        # Canny yields a single-channel map; expand it to RGB before un-padding.
+        edges_rgb = cv2.cvtColor(edges, cv2.COLOR_GRAY2RGB)
+        return remove_pad(edges_rgb)
+
+
+class PreprocessorInvert(Preprocessor):
+    """Invert pixel values, shown in the UI as "invert (from white bg & black line)"."""
+
+    def __init__(self):
+        super().__init__(name="invert")
+        self._label = "invert (from white bg & black line)"
+        self.tags = ["Canny", "Lineart", "Scribble", "Sketch", "MLSD"]
+        self.sorting_priority = 20
+        # Resolution is not used by ``__call__``, so the slider is hidden.
+        self.slider_resolution = PreprocessorParameter(visible=False)
+
+    def __call__(
+        self,
+        input_image,
+        resolution,
+        slider_1=None,
+        slider_2=None,
+        slider_3=None,
+        **kwargs
+    ):
+        """Return ``255 - HWC3(input_image)``; all other arguments are ignored."""
+        normalized = HWC3(input_image)
+        return 255 - normalized
+
+
+class PreprocessorBlurGaussian(Preprocessor):
+    """Gaussian-blur preprocessor; ``slider_1`` is the blur sigma."""
+
+    def __init__(self):
+        super().__init__(name="blur_gaussian")
+        # Sigma range of the legacy ``blur_gaussian`` slider config
+        # (0.01 .. 64.0, default 9.0). The resolution slider's range
+        # (64 .. 2048, default 512) must not be reused here: it would make
+        # the default blur extremely strong and the legacy default
+        # unreachable.
+        self.slider_1 = PreprocessorParameter(
+            label="Sigma", minimum=0.01, maximum=64.0, value=9.0
+        )
+        self.tags = ["Tile", "Blur"]
+
+    def __call__(
+        self,
+        input_image,
+        resolution,
+        slider_1=None,
+        slider_2=None,
+        slider_3=None,
+        input_mask=None,
+        **kwargs
+    ):
+        """Resize the input to ``resolution`` and blur it with sigma ``slider_1``.
+
+        The padding added by ``resize_image_with_pad`` is removed *before*
+        blurring, so the blur runs on the resized, un-padded image. The kernel
+        size is passed as ``(0, 0)`` so OpenCV derives it from sigma.
+        ``slider_2``, ``slider_3``, ``input_mask`` and extra keyword arguments
+        are ignored.
+        """
+        img, remove_pad = resize_image_with_pad(input_image, resolution)
+        img = remove_pad(img)
+        result = cv2.GaussianBlur(img, (0, 0), float(slider_1))
+        return result
+
+
+class PreprocessorScribbleXdog(Preprocessor):
+    """Scribble extraction from a thresholded difference of two Gaussian blurs."""
+
+    def __init__(self):
+        super().__init__(name="scribble_xdog")
+        self.tags = ["Scribble", "Sketch", "SparseCtrl"]
+        self.slider_1 = PreprocessorParameter(
+            label="XDoG Threshold", minimum=1, maximum=64, value=32
+        )
+
+    def __call__(
+        self,
+        input_image,
+        resolution,
+        slider_1=None,
+        slider_2=None,
+        slider_3=None,
+        input_mask=None,
+        **kwargs
+    ):
+        """Return a black image with white pixels where the DoG response exceeds ``slider_1``.
+
+        The input is resized/padded first and the padding is removed from the
+        result. ``slider_2``, ``slider_3``, ``input_mask`` and extra keyword
+        arguments are ignored.
+        """
+        padded, remove_pad = resize_image_with_pad(input_image, resolution)
+        as_float = padded.astype(np.float32)
+        blur_fine = cv2.GaussianBlur(as_float, (0, 0), 0.5)
+        blur_coarse = cv2.GaussianBlur(as_float, (0, 0), 5.0)
+        # Per-pixel minimum over the channel axis of (coarse - fine).
+        channel_min = np.min(blur_coarse - blur_fine, axis=2)
+        dog = (255 - channel_min).clip(0, 255).astype(np.uint8)
+        sketch = np.zeros_like(padded, dtype=np.uint8)
+        sketch[2 * (255 - dog) > slider_1] = 255
+        return remove_pad(sketch)
+
+
+class PreprocessorShuffle(Preprocessor):
+    """Content-shuffle preprocessor backed by a lazily created ``ContentShuffleDetector``."""
+
+    def __init__(self):
+        super().__init__(name="shuffle")
+        self.tags = ["Shuffle"]
+        # Detector instance; created on the first call.
+        self.model_shuffle = None
+        # Fix res to 512.
+        self.slider_resolution = PreprocessorParameter(value=512, visible=False)
+
+    def cached_call(self, *args, **kwargs):
+        """No cache for shuffle, as each call depends on different numpy seed."""
+        return self(*args, **kwargs)
+
+    def __call__(
+        self,
+        input_image,
+        resolution,
+        slider_1=None,
+        slider_2=None,
+        slider_3=None,
+        input_mask=None,
+        **kwargs
+    ):
+        """Resize the input to ``resolution`` and run the shuffle detector on it.
+
+        The padding added by ``resize_image_with_pad`` is removed before the
+        detector runs. Sliders, ``input_mask`` and extra keyword arguments
+        are ignored.
+        """
+        padded, remove_pad = resize_image_with_pad(input_image, resolution)
+        resized = remove_pad(padded)
+        detector = self.model_shuffle
+        if detector is None:
+            # Imported lazily so the annotator is only loaded when used.
+            from annotator.shuffle import ContentShuffleDetector
+
+            detector = self.model_shuffle = ContentShuffleDetector()
+        return detector(resized)
+
+
+# Instantiate each preprocessor once at import time and register it, so it
+# can later be looked up by label or name via ``Preprocessor.get_preprocessor``.
+# ``add_supported_preprocessor`` asserts that neither label nor name is
+# already registered.
+Preprocessor.add_supported_preprocessor(PreprocessorNone())
+Preprocessor.add_supported_preprocessor(PreprocessorCanny())
+Preprocessor.add_supported_preprocessor(PreprocessorInvert())
+Preprocessor.add_supported_preprocessor(PreprocessorBlurGaussian())
+Preprocessor.add_supported_preprocessor(PreprocessorScribbleXdog())
+Preprocessor.add_supported_preprocessor(PreprocessorShuffle())
--- a/scripts/preprocessor/normal_dsine.py
+++ b/scripts/preprocessor/normal_dsine.py
@ -0,0 +1,48 @@
+from ..supported_preprocessor import Preprocessor, PreprocessorParameter
+
+
+class PreprocessorNormalDsine(Preprocessor):
+    """Normal-map preprocessor backed by ``NormalDsineDetector``.
+
+    ``slider_1`` is the field of view ("Fov") and ``slider_2`` the number of
+    iterations forwarded to the detector.
+    """
+
+    def __init__(self):
+        super().__init__(name="normal_dsine")
+        self.tags = ["NormalMap"]
+        # Detector instance; created on the first call.
+        self.model = None
+        self.slider_1 = PreprocessorParameter(
+            label="Fov", minimum=0, maximum=360, step=0.1, value=60
+        )
+        self.slider_2 = PreprocessorParameter(
+            label="Iterations", minimum=1, maximum=20, step=1, value=5
+        )
+
+    def __call__(
+        self,
+        input_image,
+        resolution,
+        slider_1=None,
+        slider_2=None,
+        slider_3=None,
+        **kwargs
+    ):
+        """Run the detector on ``input_image`` and return its result.
+
+        The detector is created lazily and ``unload_model()`` is called on it
+        after every invocation. ``slider_3`` and extra keyword arguments are
+        ignored.
+        """
+        if self.model is None:
+            from annotator.normaldsine import NormalDsineDetector
+
+            self.model = NormalDsineDetector()
+
+        detector = self.model
+        fov = float(slider_1)
+        iterations = int(slider_2)
+        # NOTE(review): ``resulotion`` (sic) is the keyword the legacy caller
+        # also used; presumably it mirrors the detector's parameter name, so
+        # do not "fix" the spelling here without changing the detector too.
+        normal_map = detector(
+            input_image,
+            new_fov=fov,
+            iterations=iterations,
+            resulotion=resolution,
+        )
+        detector.unload_model()
+        return normal_map
+
+
+# Register a single shared instance at import time.
+Preprocessor.add_supported_preprocessor(PreprocessorNormalDsine())
--- a/scripts/supported_preprocessor.py
+++ b/scripts/supported_preprocessor.py
@ -0,0 +1,189 @@
+from abc import ABC, abstractmethod
+from typing import List, ClassVar, Dict, Optional, Set
+from dataclasses import dataclass, field
+
+from modules import shared
+from scripts.logging import logger
+from scripts.utils import ndarray_lru_cache
+
+
+# Size passed as ``max_size`` to ``ndarray_lru_cache`` for
+# ``Preprocessor.cached_call``. Falls back to 0 when ``shared.cmd_opts`` has
+# no ``controlnet_preprocessor_cache_size`` attribute.
+CACHE_SIZE = getattr(shared.cmd_opts, "controlnet_preprocessor_cache_size", 0)
+
+
+@dataclass
+class PreprocessorParameter:
+    """
+    Description of one slider exposed by a preprocessor.
+
+    Attributes:
+        label (str): Text shown next to the slider. Default is "EMPTY_LABEL".
+        minimum (float): Smallest allowed value. Default is 0.0.
+        maximum (float): Largest allowed value. Default is 1.0.
+        step (float): Slider increment. Default is 0.01.
+        value (float): Initial value. Default is 0.5.
+        visible (bool): Whether the slider is shown. Default is True.
+    """
+
+    label: str = "EMPTY_LABEL"
+    minimum: float = 0.0
+    maximum: float = 1.0
+    step: float = 0.01
+    value: float = 0.5
+    visible: bool = True
+
+    @property
+    def gradio_update_kwargs(self) -> dict:
+        """Keyword arguments describing this slider for a gradio update."""
+        return {
+            "minimum": self.minimum,
+            "maximum": self.maximum,
+            "step": self.step,
+            "label": self.label,
+            "value": self.value,
+            "visible": self.visible,
+        }
+
+    @property
+    def api_json(self) -> dict:
+        """Slider description using the API key names (name/value/min/max/step)."""
+        return {
+            "name": self.label,
+            "value": self.value,
+            "min": self.minimum,
+            "max": self.maximum,
+            "step": self.step,
+        }
+
+
+@dataclass
+class Preprocessor(ABC):
+    """
+    Abstract base class and registry for preprocessors.
+
+    Only ``name``, ``_label``, ``tags`` and ``returns_image`` are annotated and
+    therefore dataclass fields accepted by the generated ``__init__``. The
+    remaining attributes are plain class-level defaults that subclasses
+    override per instance in their own ``__init__``.
+
+    Attributes:
+        name (str): The name of the preprocessor (also its hash key).
+        _label (Optional[str]): UI display name; falls back to ``name`` when None.
+        tags (List[str]): The tags associated with the preprocessor.
+        slider_resolution (PreprocessorParameter): The resolution slider.
+        slider_1 (PreprocessorParameter): The first extra slider.
+        slider_2 (PreprocessorParameter): The second extra slider.
+        slider_3 (PreprocessorParameter): The third extra slider.
+        returns_image (bool): Whether the preprocessor result is an image.
+        show_control_mode (bool): Whether to show the control mode or not.
+        do_not_need_model (bool): True when the preprocessor does not need a model.
+        sorting_priority (int): Higher values are listed first.
+        corp_image_with_a1111_mask_when_in_img2img_inpaint_tab (bool): Whether to crop the image with a1111 mask when in img2img inpaint tab or not.
+        fill_mask_with_one_when_resize_and_fill (bool): Whether to fill the mask with one when resizing and filling or not.
+        use_soft_projection_in_hr_fix (bool): Whether to use soft projection in hr fix or not.
+        expand_mask_when_resize_and_fill (bool): Whether to expand the mask when resizing and filling or not.
+        all_processors (Dict[str, Preprocessor]): Registry keyed by label.
+        all_processors_by_name (Dict[str, Preprocessor]): Registry keyed by name.
+    """
+
+    name: str
+    _label: Optional[str] = None
+    tags: List[str] = field(default_factory=list)
+    slider_resolution = PreprocessorParameter(
+        label="Resolution",
+        minimum=64,
+        maximum=2048,
+        value=512,
+        step=8,
+        visible=True,
+    )
+    slider_1 = PreprocessorParameter(visible=False)
+    slider_2 = PreprocessorParameter(visible=False)
+    slider_3 = PreprocessorParameter(visible=False)
+    returns_image: bool = True
+    show_control_mode = True
+    do_not_need_model = False
+    sorting_priority = 0  # higher goes to top in the list
+    corp_image_with_a1111_mask_when_in_img2img_inpaint_tab = True
+    fill_mask_with_one_when_resize_and_fill = False
+    use_soft_projection_in_hr_fix = False
+    expand_mask_when_resize_and_fill = False
+
+    all_processors: ClassVar[Dict[str, "Preprocessor"]] = {}
+    all_processors_by_name: ClassVar[Dict[str, "Preprocessor"]] = {}
+
+    @property
+    def label(self) -> str:
+        """Display name on UI."""
+        return self._label if self._label is not None else self.name
+
+    @classmethod
+    def add_supported_preprocessor(cls, p: "Preprocessor"):
+        """Register ``p`` under both its label and its name.
+
+        Asserts that neither key is already present in the registries.
+        """
+        assert p.label not in cls.all_processors, f"{p.label} already registered!"
+        cls.all_processors[p.label] = p
+        assert p.name not in cls.all_processors_by_name, f"{p.name} already registered!"
+        cls.all_processors_by_name[p.name] = p
+        logger.debug(f"{p.name} registered. Total preprocessors ({len(cls.all_processors)}).")
+
+    @classmethod
+    def get_preprocessor(cls, name: str) -> Optional["Preprocessor"]:
+        """Look ``name`` up as a label first, then as a name; None if unknown."""
+        return cls.all_processors.get(name, cls.all_processors_by_name.get(name, None))
+
+    @classmethod
+    def get_sorted_preprocessors(cls) -> List["Preprocessor"]:
+        """Return all preprocessors with "none" first, then by descending priority.
+
+        The sort key is the zero-padded priority followed by the label and the
+        sort is reversed, so ties in priority come out in reverse label order.
+        Raises ``KeyError`` if no preprocessor labelled "none" is registered.
+        """
+        preprocessors = [p for k, p in cls.all_processors.items() if k != "none"]
+        return [cls.all_processors["none"]] + sorted(
+            preprocessors,
+            key=lambda x: str(x.sorting_priority).zfill(8) + x.label,
+            reverse=True,
+        )
+
+    @classmethod
+    def get_all_preprocessor_tags(cls):
+        """Return "All" followed by every registered tag in sorted order."""
+        tags = set()
+        for p in cls.all_processors.values():
+            tags.update(p.tags)
+        return ["All"] + sorted(tags)
+
+    @classmethod
+    def get_filtered_preprocessors(cls, tag: str) -> List["Preprocessor"]:
+        """Return the sorted preprocessors carrying ``tag`` (plus "none").
+
+        For the "All" tag the complete sorted list is returned. This must be a
+        list, not the registry dict: callers index the result and iterate it
+        expecting ``Preprocessor`` objects.
+        """
+        if tag == "All":
+            return cls.get_sorted_preprocessors()
+        return [
+            p
+            for p in cls.get_sorted_preprocessors()
+            if tag in p.tags or p.label == "none"
+        ]
+
+    @classmethod
+    def get_default_preprocessor(cls, tag: str) -> "Preprocessor":
+        """Return the first preprocessor after "none" for ``tag``.
+
+        Falls back to the only entry when the filtered list has one element.
+        """
+        ps = cls.get_filtered_preprocessors(tag)
+        assert len(ps) > 0
+        return ps[0] if len(ps) == 1 else ps[1]
+
+    @classmethod
+    def tag_to_filters(cls, tag: str) -> Set[str]:
+        """Return the lower-cased ``tag`` together with its known aliases."""
+        filters_aliases = {
+            "instructp2p": ["ip2p"],
+            "segmentation": ["seg"],
+            "normalmap": ["normal"],
+            "t2i-adapter": ["t2i_adapter", "t2iadapter", "t2ia"],
+            "ip-adapter": ["ip_adapter", "ipadapter"],
+            "openpose": ["openpose", "densepose"],
+            "instant-id": ["instant_id", "instantid"],
+        }
+
+        tag = tag.lower()
+        return {tag, *filters_aliases.get(tag, [])}
+
+    @ndarray_lru_cache(max_size=CACHE_SIZE)
+    def cached_call(self, *args, **kwargs):
+        """Invoke the preprocessor through the ``ndarray_lru_cache`` wrapper."""
+        logger.debug(f"Calling preprocessor {self.name} outside of cache.")
+        return self(*args, **kwargs)
+
+    def __hash__(self):
+        return hash(self.name)
+
+    def __eq__(self, other):
+        # Equality is purely hash-based: any object whose hash equals
+        # ``hash(self.name)`` compares equal (including the bare name string).
+        return self.__hash__() == other.__hash__()
+
+    @abstractmethod
+    def __call__(
+        self,
+        input_image,
+        resolution,
+        slider_1=None,
+        slider_2=None,
+        slider_3=None,
+        input_mask=None,
+        **kwargs,
+    ):
+        """Run the preprocessor; concrete subclasses must implement this."""
+        pass
--- a/scripts/utils.py
+++ b/scripts/utils.py
@ -178,4 +178,29 @@ def align_dim_latent(x: int) -> int:
    """ Align the pixel dimension (w/h) to latent dimension.
    Stable diffusion 1:8 ratio for latent/pixel, i.e.,
    1 latent unit == 8 pixel unit."""
-    return (x // 8) * 8
+    return (x // 8) * 8
+
+
+def pad64(x):
+    """Return the amount to add to ``x`` to reach the next multiple of 64 (0 if already one)."""
+    next_multiple = np.ceil(float(x) / 64.0) * 64
+    return int(next_multiple - x)
+
+
+def safer_memory(x):
+    """Return an independent, C-contiguous copy of the array ``x``."""
+    # Fix many MAC/AMD problems
+    duplicate = x.copy()
+    contiguous = np.ascontiguousarray(duplicate)
+    return contiguous.copy()
+
+
+def resize_image_with_pad(img, resolution):
+    """Scale ``img`` so its shorter side equals ``resolution`` and pad it to multiples of 64.
+
+    The image is unpacked as ``(H, W, C)``. Upscaling uses cubic
+    interpolation and downscaling uses area interpolation. Padding is added
+    at the bottom and right by repeating edge pixels.
+
+    Returns:
+        A tuple ``(padded_image, remove_pad)`` where ``remove_pad(x)`` crops
+        ``x`` back to the resized (un-padded) height and width.
+    """
+    raw_h, raw_w, _ = img.shape
+    scale = float(resolution) / float(min(raw_h, raw_w))
+    if scale > 1:
+        interpolation = cv2.INTER_CUBIC
+    else:
+        interpolation = cv2.INTER_AREA
+    target_h = int(np.round(float(raw_h) * scale))
+    target_w = int(np.round(float(raw_w) * scale))
+    resized = cv2.resize(img, (target_w, target_h), interpolation=interpolation)
+    pad_h = pad64(target_h)
+    pad_w = pad64(target_w)
+    padded = np.pad(resized, [[0, pad_h], [0, pad_w], [0, 0]], mode='edge')
+
+    def remove_pad(x):
+        cropped = x[:target_h, :target_w]
+        return safer_memory(cropped)
+
+    return safer_memory(padded), remove_pad
--- a/scripts/xyz_grid_support.py
+++ b/scripts/xyz_grid_support.py
@ -4,8 +4,9 @@ import numpy as np
 from modules import scripts, shared

 try:
-    from scripts.global_state import update_cn_models, cn_models_names, cn_preprocessor_modules
+    from scripts.global_state import update_cn_models, cn_models_names
    from scripts.external_code import ResizeMode, ControlMode
+    from scripts.supported_preprocessor import Preprocessor

 except (ImportError, NameError):
    import_error = True
@ -408,7 +409,7 @@ def add_axis_options(xyz_grid):
        return [e.value for e in ResizeMode]

    def choices_preprocessor():
-        return list(cn_preprocessor_modules)
+        return list(Preprocessor.all_processors.keys())

    def make_excluded_list():
        pattern = re.compile(r"\[(\w+)\]")
--- a/tests/cn_script/cn_script_test.py
+++ b/tests/cn_script/cn_script_test.py
@ -1,4 +1,3 @@
-from typing import Any, Dict, List
 import unittest
 from PIL import Image
 import numpy as np
@ -8,7 +7,7 @@ import importlib
 utils = importlib.import_module("extensions.sd-webui-controlnet.tests.utils", "utils")


-from scripts import external_code, processor
+from scripts import external_code
 from scripts.controlnet import prepare_mask, Script, set_numpy_seed
 from modules import processing

@ -122,25 +121,6 @@ class TestScript(unittest.TestCase):
        [[100, 200, 50], [150, 75, 225], [30, 120, 180]], dtype=np.uint8
    )

-    def test_bound_check_params(self):
-        def param_required(module: str, param: str) -> bool:
-            configs = processor.preprocessor_sliders_config[module]
-            config_index = ("processor_res", "threshold_a", "threshold_b").index(param)
-            return config_index < len(configs) and configs[config_index] is not None
-
-        for module in processor.preprocessor_sliders_config.keys():
-            for param in ("processor_res", "threshold_a", "threshold_b"):
-                with self.subTest(param=param, module=module):
-                    unit = external_code.ControlNetUnit(
-                        module=module,
-                        **{param: -100},
-                    )
-                    unit.bound_check_params()
-                    if param_required(module, param):
-                        self.assertGreaterEqual(getattr(unit, param), 0)
-                    else:
-                        self.assertEqual(getattr(unit, param), -100)
-
    def test_choose_input_image(self):
        with self.subTest(name="no image"):
            with self.assertRaises(ValueError):
--- a/tests/cn_script/global_state_test.py
+++ b/tests/cn_script/global_state_test.py
@ -1,67 +0,0 @@
-import importlib
-utils = importlib.import_module("extensions.sd-webui-controlnet.tests.utils", "utils")
-
-from scripts.global_state import select_control_type, ui_preprocessor_keys
-from scripts.enums import StableDiffusionVersion
-
-
-dummy_value = "dummy"
-cn_models = {
-    "None": dummy_value,
-    "canny_sd15": dummy_value,
-    "canny_sdxl": dummy_value,
-}
-
-
-# Tests for the select_control_type function
-class TestSelectControlType:
-    def test_all_control_type(self):
-        result = select_control_type("All", cn_models=cn_models)
-        assert result == (
-            [ui_preprocessor_keys, list(cn_models.keys()), "none", "None"]
-        ), "Expected all preprocessors and models"
-
-    def test_sd_version(self):
-        (_, filtered_model_list, _, default_model) = select_control_type(
-            "Canny", sd_version=StableDiffusionVersion.UNKNOWN, cn_models=cn_models
-        )
-        assert filtered_model_list == [
-            "None",
-            "canny_sd15",
-            "canny_sdxl",
-        ], "UNKNOWN sd version should match all models"
-        assert default_model == "canny_sd15"
-
-        (_, filtered_model_list, _, default_model) = select_control_type(
-            "Canny", sd_version=StableDiffusionVersion.SD1x, cn_models=cn_models
-        )
-        assert filtered_model_list == [
-            "None",
-            "canny_sd15",
-        ], "sd1x version should only sd1x"
-        assert default_model == "canny_sd15"
-
-        (_, filtered_model_list, _, default_model) = select_control_type(
-            "Canny", sd_version=StableDiffusionVersion.SDXL, cn_models=cn_models
-        )
-        assert filtered_model_list == [
-            "None",
-            "canny_sdxl",
-        ], "sdxl version should only sdxl"
-        assert default_model == "canny_sdxl"
-
-    def test_invert_preprocessor(self):
-        for control_type in ("Canny", "Lineart", "Scribble/Sketch", "MLSD"):
-            filtered_preprocessor_list, _, _, _ = select_control_type(
-                control_type, cn_models=cn_models
-            )
-            assert any(
-                "invert" in module.lower() for module in filtered_preprocessor_list
-            )
-
-    def test_no_module_available(self):
-        (_, filtered_model_list, _, default_model) = select_control_type(
-            "Depth", cn_models=cn_models
-        )
-        assert filtered_model_list == ["None"]
-        assert default_model == "None"
--- a/tests/web_api/control_types_test.py
+++ b/tests/web_api/control_types_test.py
@ -1,24 +0,0 @@
-import unittest
-import importlib
-import requests
-
-utils = importlib.import_module(
-    'extensions.sd-webui-controlnet.tests.utils', 'utils')
-
-
-from scripts.processor import preprocessor_filters
-
-
-class TestControlTypes(unittest.TestCase):
-    def test_fetching_control_types(self):
-        response = requests.get(utils.BASE_URL + "/controlnet/control_types")
-        self.assertEqual(response.status_code, 200)
-        result = response.json()
-        self.assertIn('control_types', result)
-
-        for control_type in preprocessor_filters:
-            self.assertIn(control_type, result['control_types'])
-
-
-if __name__ == "__main__":
-    unittest.main()
--- a/tests/web_api/generation_test.py
+++ b/tests/web_api/generation_test.py
@ -90,9 +90,11 @@ def test_invalid_param(gen_type, param_name):
            unit_overrides={param_name: -1},
            input_image=girl_img,
        ).exec()
-        assert log_context.is_in_console_logs([
-            f"[canny.{param_name}] Invalid value(-1), using default value",
-        ])
+        assert log_context.is_in_console_logs(
+            [
+                f"[canny.{param_name}] Invalid value(-1), using default value",
+            ]
+        )


@pytest.mark.parametrize("save_map", [True, False])
@ -285,3 +287,20 @@ def test_lama_outpaint():
            "resize_mode": "Resize and Fill",  # OUTER_FIT
        },
    ).exec()
+
+
+@disable_in_cq
+def test_ip_adapter_auto():
+    """Run txt2img with `ip-adapter-auto`; check the expected console log line."""
+    with console_log_context() as log_context:
+        unit = {
+            "image": girl_img,
+            "model": get_model("ip-adapter_sd15"),
+            "module": "ip-adapter-auto",
+        }
+        template = APITestTemplate(
+            "txt2img_ip_adapter_auto", "txt2img",
+            payload_overrides={}, unit_overrides=unit,
+        )
+        assert template.exec()
+        assert log_context.is_in_console_logs(["ip-adapter-auto => ip-adapter_clip_h"])
--- a/tests/web_api/modules_test.py
+++ b/tests/web_api/modules_test.py
@ -0,0 +1,172 @@
+import pytest
+import requests
+
+from .template import APITestTemplate
+
+
+expected_module_names = {  # must all appear in module_list for alias_names=false
+    "animal_openpose",
+    "anime_face_segment",
+    "blur_gaussian",
+    "canny",
+    "clip_vision",
+    "color",
+    "densepose",
+    "densepose_parula",
+    "depth",
+    "depth_anything",
+    "depth_hand_refiner",
+    "depth_leres",
+    "depth_leres++",
+    "depth_zoe",
+    "dw_openpose_full",
+    "hed",
+    "hed_safe",
+    "inpaint",
+    "inpaint_only",
+    "inpaint_only+lama",
+    "instant_id_face_embedding",
+    "instant_id_face_keypoints",
+    "invert",
+    "ip-adapter-auto",
+    "ip-adapter_clip_sd15",
+    "ip-adapter_clip_sdxl",
+    "ip-adapter_clip_sdxl_plus_vith",
+    "ip-adapter_face_id",
+    "ip-adapter_face_id_plus",
+    "lineart",
+    "lineart_anime",
+    "lineart_anime_denoise",
+    "lineart_coarse",
+    "lineart_standard",
+    "mediapipe_face",
+    "mlsd",
+    "none",
+    "normal_bae",
+    "normal_dsine",
+    "normal_map",
+    "oneformer_ade20k",
+    "oneformer_coco",
+    "openpose",
+    "openpose_face",
+    "openpose_faceonly",
+    "openpose_full",
+    "openpose_hand",
+    "pidinet",
+    "pidinet_safe",
+    "pidinet_scribble",
+    "pidinet_sketch",
+    "recolor_intensity",
+    "recolor_luminance",
+    "reference_adain",
+    "reference_adain+attn",
+    "reference_only",
+    "revision_clipvision",
+    "revision_ignore_prompt",
+    "scribble_hed",
+    "scribble_xdog",
+    "segmentation",
+    "shuffle",
+    "te_hed",
+    "threshold",
+    "tile_colorfix",
+    "tile_colorfix+sharp",
+    "tile_resample",
+}
+
+# Display names (labels); must all appear in module_list for alias_names=true.
+expected_module_alias = {
+    "animal_openpose",
+    "blur_gaussian",
+    "canny",
+    "densepose (pruple bg & purple torso)",  # NOTE(review): "pruple" presumably mirrors the served label - confirm before fixing
+    "densepose_parula (black bg & blue torso)",
+    "depth_anything",
+    "depth_hand_refiner",
+    "depth_leres",
+    "depth_leres++",
+    "depth_midas",
+    "depth_zoe",
+    "dw_openpose_full",
+    "inpaint_global_harmonious",
+    "inpaint_only",
+    "inpaint_only+lama",
+    "instant_id_face_embedding",
+    "instant_id_face_keypoints",
+    "invert (from white bg & black line)",
+    "ip-adapter-auto",
+    "ip-adapter_clip_g",
+    "ip-adapter_clip_h",
+    "ip-adapter_clip_sdxl_plus_vith",
+    "ip-adapter_face_id",
+    "ip-adapter_face_id_plus",
+    "lineart_anime",
+    "lineart_anime_denoise",
+    "lineart_coarse",
+    "lineart_realistic",
+    "lineart_standard (from white bg & black line)",
+    "mediapipe_face",
+    "mlsd",
+    "none",
+    "normal_bae",
+    "normal_dsine",
+    "normal_midas",
+    "openpose",
+    "openpose_face",
+    "openpose_faceonly",
+    "openpose_full",
+    "openpose_hand",
+    "recolor_intensity",
+    "recolor_luminance",
+    "reference_adain",
+    "reference_adain+attn",
+    "reference_only",
+    "revision_clipvision",
+    "revision_ignore_prompt",
+    "scribble_hed",
+    "scribble_pidinet",
+    "scribble_xdog",
+    "seg_anime_face",
+    "seg_ofade20k",
+    "seg_ofcoco",
+    "seg_ufade20k",
+    "shuffle",
+    "softedge_hed",
+    "softedge_hedsafe",
+    "softedge_pidinet",
+    "softedge_pidisafe",
+    "softedge_teed",
+    "t2ia_color_grid",
+    "t2ia_sketch_pidi",
+    "t2ia_style_clipvision",
+    "threshold",
+    "tile_colorfix",
+    "tile_colorfix+sharp",
+    "tile_resample",
+}
+
+
+@pytest.mark.parametrize("alias", ("true", "false"))
+def test_module_list(alias):
+    """Check `controlnet/module_list` names, detail keys and the canny sliders."""
+    url = APITestTemplate.BASE_URL + f"controlnet/module_list?alias_names={alias}"
+    json_resp = requests.get(url).json()
+    module_list, module_detail = json_resp["module_list"], json_resp["module_detail"]
+    listed = set(module_list)
+
+    # alias_names=true is compared with the alias set, anything else with the names.
+    expected = expected_module_names if alias != "true" else expected_module_alias
+    missing = expected - listed  # shown as the failure message
+    assert expected <= listed, missing
+    assert listed == set(module_detail)
+
+    def slider(name, value, lo, hi, step):
+        return {"name": name, "value": value, "min": lo, "max": hi, "step": step}
+
+    canny_sliders = [
+        slider("Resolution", 512, 64, 2048, 8),
+        slider("Low Threshold", 100, 1, 255, 1),
+        slider("High Threshold", 200, 1, 255, 1),
+    ]
+    expected_canny = {"model_free": False, "sliders": canny_sliders}
+    assert module_detail["canny"] == expected_canny