complete refactored to a InfZoomer class. none can read those chunks of parameters and irritating scopes

2023-05-10 23:28:17 +02:00 · 2023-05-10 23:28:17 +02:00 · 6abc11d3f8
parent 8bdf8549ae
commit 6abc11d3f8
2 changed files with 389 additions and 574 deletions
--- a/iz_helpers/run.py
+++ b/iz_helpers/run.py
@ -1,9 +1,12 @@
 import math, time, os
+from dataclasses import dataclass
 import numpy as np
-from PIL import Image, ImageFilter, ImageDraw
+from PIL import Image, ImageFilter, ImageOps, ImageDraw
+
 from modules.ui import plaintext_to_html
 import modules.shared as shared
 from modules.paths_internal import script_path
+
 from .helpers import (
    fix_env_Path_ffprobe,
    closest_upper_divisible_by_eight,
@ -14,602 +17,414 @@ from .sd_helpers import renderImg2Img, renderTxt2Img
 from .image import shrink_and_paste_on_blank
 from .video import ContinuousVideoWriter

-def crop_fethear_ellipse(image, feather_margin=30, width_offset=0, height_offset=0):
-    # Create a blank mask image with the same size as the original image
-    mask = Image.new("L", image.size, 0)
-    draw = ImageDraw.Draw(mask)
-
-    # Calculate the ellipse's bounding box
-    ellipse_box = (
-        width_offset,
-        height_offset,
-        image.width - width_offset,
-        image.height - height_offset,
-    )
-
-    # Draw the ellipse on the mask
-    draw.ellipse(ellipse_box, fill=255)
-
-    # Apply the mask to the original image
-    result = Image.new("RGBA", image.size)
-    result.paste(image, mask=mask)
-
-    # Crop the resulting image to the ellipse's bounding box
-    cropped_image = result.crop(ellipse_box)
-
-    # Create a new mask image with a black background (0)
-    mask = Image.new("L", cropped_image.size, 0)
-    draw = ImageDraw.Draw(mask)
-
-    # Draw an ellipse on the mask image
-    draw.ellipse(
-        (
-            0 + feather_margin,
-            0 + feather_margin,
-            cropped_image.width - feather_margin,
-            cropped_image.height - feather_margin,
-        ),
-        fill=255,
-        outline=0,
-    )
-
-    # Apply a Gaussian blur to the mask image
-    mask = mask.filter(ImageFilter.GaussianBlur(radius=feather_margin / 2))
-    cropped_image.putalpha(mask)
-    res = Image.new(cropped_image.mode, (image.width, image.height))
-    paste_pos = (
-        int((res.width - cropped_image.width) / 2),
-        int((res.height - cropped_image.height) / 2),
-    )
-    res.paste(cropped_image, paste_pos)
-
-    return res
-
-
-def outpaint_steps(
-    width,
-    height,
-    common_prompt_pre,
-    common_prompt_suf,
-    prompts,
-    negative_prompt,
-    seed,
-    sampler,
-    num_inference_steps,
-    guidance_scale,
-    inpainting_denoising_strength,
-    inpainting_mask_blur,
-    inpainting_fill_mode,
-    inpainting_full_res,
-    inpainting_padding,
-    init_img,
-    outpaint_steps,
-    out_config,
-    mask_width,
-    mask_height,
-    custom_exit_image,
-    overmask,
-    frame_correction=False,  # TODO: add frame_Correction in UI
-):
-    main_frames = [init_img.convert("RGB")]
-
-    for i in range(outpaint_steps):
-        print_out = (
-            "Outpaint step: "
-            + str(i + 1)
-            + " / "
-            + str(outpaint_steps)
-            + " Seed: "
-            + str(seed)
-        )
-        print(print_out)
-        current_image = main_frames[-1]
-        current_image = shrink_and_paste_on_blank(
-            current_image, mask_width, mask_height
-        )
-
-        mask_image = np.array(current_image.resize((current_image.width-overmask, current_image.height-overmask)))[:, :, 3]
-        mask_image = Image.fromarray(255 - mask_image).convert("RGB")
-        # create mask (black image with white mask_width width edges)
-
-        if custom_exit_image and ((i + 1) == outpaint_steps):
-            current_image = custom_exit_image.resize(
-                (width, height), resample=Image.LANCZOS
-            )
-            main_frames.append(current_image.convert("RGB"))
-            # print("using Custom Exit Image")
-            save2Collect(current_image, out_config, f"exit_img.png")
-        else:
-            pr = prompts[max(k for k in prompts.keys() if k <= i)]
-            processed, newseed = renderImg2Img(
-                f"{common_prompt_pre}\n{pr}\n{common_prompt_suf}".strip(),
-                negative_prompt,
-                sampler,
-                num_inference_steps,
-                guidance_scale,
-                seed,
-                width,
-                height,
-                current_image,
-                mask_image,
-                inpainting_denoising_strength,
-                inpainting_mask_blur,
-                inpainting_fill_mode,
-                inpainting_full_res,
-                inpainting_padding,
-            )
-
-            if len(processed.images) > 0:
-                main_frames.append(processed.images[0].convert("RGB"))
-                save2Collect(processed.images[0], out_config, f"outpain_step_{i}.png")
-            seed = newseed
-            # TODO: seed behavior
-
-        if frame_correction and inpainting_mask_blur > 0:
-            corrected_frame = crop_inner_image(
-                main_frames[i + 1], mask_width, mask_height
-            )
-
-            enhanced_img = crop_fethear_ellipse(
-                main_frames[i],
-                30,
-                inpainting_mask_blur / 3 // 2,
-                inpainting_mask_blur / 3 // 2,
-            )
-            save2Collect(main_frames[i], out_config, f"main_frame_{i}")
-            save2Collect(enhanced_img, out_config, f"main_frame_enhanced_{i}")
-            corrected_frame.paste(enhanced_img, mask=enhanced_img)
-            main_frames[i] = corrected_frame
-        # else :TEST
-        # current_image.paste(prev_image, mask=prev_image)
-    return main_frames, processed
-
-
-def outpaint_steps_cornerStrategy(
-    width,
-    height,
-    common_prompt_pre,
-    common_prompt_suf,
-    prompts,
-    negative_prompt,
-    seed,
-    sampler,
-    num_inference_steps,
-    guidance_scale,
-    inpainting_denoising_strength,
-    inpainting_mask_blur,
-    inpainting_fill_mode,
-    inpainting_full_res,
-    inpainting_padding,
-    init_img,
-    outpaint_steps,
-    out_config,
-    mask_width,
-    mask_height,
-    custom_exit_image,
-    overmask,
-    frame_correction=False,  # TODO: add frame_Correction in UI
-):
-    from PIL import Image, ImageOps, ImageDraw
-    main_frames = [init_img.convert("RGB")]
-
-    currentImage = main_frames[-1]
-
-    # Größe des ursprünglichen Bildes
-    original_width, original_height = currentImage.size
-
-    # Berechne die neue Größe des Bildes
-    new_width = original_width + mask_width
-    new_height = original_height + mask_height
-    left = top = int(mask_width/2)
-    right = bottom = int(mask_height/2)
-
-    corners = [
-        (0, 0),  # Oben links
-        (new_width - 512, 0),  # Oben rechts
-        (0, new_height - 512),  # Unten links
-        (new_width - 512, new_height - 512),  # Unten rechts
-    ]
-    masked_images = []
+@dataclass
+class InfZoomConfig():
+    common_prompt_pre:str
+    prompts_array:list[str]
+    common_prompt_suf:str
+    negative_prompt:str
+    num_outpainting_steps: int
+    guidance_scale:float
+    num_inference_steps:int
+    custom_init_image:Image
+    custom_exit_image:Image
+    video_frame_rate:int
+    video_zoom_mode:int
+    video_start_frame_dupe_amount:int
+    video_last_frame_dupe_amount:int
+    inpainting_mask_blur:int
+    inpainting_fill_mode:int
+    zoom_speed:float
+    seed:int
+    outputsizeW:int
+    outputsizeH:int
+    batchcount:int
+    sampler:str
+    upscale_do:bool
+    upscaler_name:str
+    upscale_by:float
+    overmask:int
+    inpainting_denoising_strength:float=1
+    inpainting_full_res:int =0
+    inpainting_padding:int=0
+    progress:any=None
    
-    for idx, corner in enumerate(corners):
-        white = Image.new("1", (new_width,new_height), 1)
-        draw = ImageDraw.Draw(white)
-        draw.rectangle([corner[0], corner[1], corner[0]+512, corner[1]+512], fill=0)
-        masked_images.append(white)
+class InfZoomer:
+    def __init__(self, config: InfZoomConfig) -> None:
+        self.C = config
+        self.prompts = {}

-   
-    for i in range(outpaint_steps):
-        print (f"Outpaint step: {str(i + 1)}/{str(outpaint_steps)} Seed: {str(seed)}")
-        currentImage = main_frames[-1]
+        for x in self.C.prompts_array:
+            try:
+                key = int(x[0])
+                value = str(x[1])
+                self.prompts[key] = value
+            except ValueError:
+                pass

-        if custom_exit_image and ((i + 1) == outpaint_steps):
-            currentImage = custom_exit_image.resize(
-                (width, height), resample=Image.LANCZOS
-            )
-            main_frames.append(currentImage.convert("RGB"))
-            # print("using Custom Exit Image")
-            save2Collect(currentImage, out_config, f"exit_img.png")
-        else:
-            expanded_image = ImageOps.expand(currentImage, (left, top, right, bottom), fill=(0, 0, 0))
-            pr = prompts[max(k for k in prompts.keys() if k <= i)]
-            
-            # outpaint 4 corners loop
-            for idx,cornermask in enumerate(masked_images):
-                processed, newseed = renderImg2Img(
-                    f"{common_prompt_pre}\n{pr}\n{common_prompt_suf}".strip(),
-                    negative_prompt,
-                    sampler,
-                    num_inference_steps,
-                    guidance_scale,
-                    seed,
-                    512,  #outpaintsizeW
-                    512,  #outpaintsizeH
-                    expanded_image,
-                    cornermask,
-                    1, #inpainting_denoising_strength,
-                    0, # inpainting_mask_blur,
-                    2, ## noise? fillmode
-                    True,  # only masked, not full, keep size of expandedimage!
-                    0 #inpainting_padding,
-                )
-                expanded_image = processed.images[0]
-            #
-            
-            if len(processed.images) > 0:
-                zoomed_img = expanded_image.resize((width,height), Image.Resampling.LANCZOS)
-                main_frames.append(zoomed_img)
-                processed.images[0]=main_frames[-1]
-                save2Collect(processed.images[0], out_config, f"outpaint_step_{i}.png")
-            seed = newseed
-            # TODO: seed behavior
+        assert len(self.C.prompts_array) > 0, "prompts is empty"

+        fix_env_Path_ffprobe()
+        self.out_config = self.prepare_output_path()

-    return main_frames, processed
-
-
-
-def create_zoom(
-    common_prompt_pre,
-    prompts_array,
-    common_prompt_suf,
-    negative_prompt,
-    num_outpainting_steps,
-    guidance_scale,
-    num_inference_steps,
-    custom_init_image,
-    custom_exit_image,
-    video_frame_rate,
-    video_zoom_mode,
-    video_start_frame_dupe_amount,
-    video_last_frame_dupe_amount,
-    inpainting_mask_blur,
-    inpainting_fill_mode,
-    zoom_speed,
-    seed,
-    outputsizeW,
-    outputsizeH,
-    batchcount,
-    sampler,
-    upscale_do,
-    upscaler_name,
-    upscale_by,
-    overmask,
-    inpainting_denoising_strength=1,
-    inpainting_full_res=0,
-    inpainting_padding=0,
-    progress=None,
-):
-    for i in range(batchcount):
-        print(f"Batch {i+1}/{batchcount}")
-        result = create_zoom_single(
-            common_prompt_pre,
-            prompts_array,
-            common_prompt_suf,
-            negative_prompt,
-            num_outpainting_steps,
-            guidance_scale,
-            num_inference_steps,
-            custom_init_image,
-            custom_exit_image,
-            video_frame_rate,
-            video_zoom_mode,
-            video_start_frame_dupe_amount,
-            video_last_frame_dupe_amount,
-            inpainting_mask_blur,
-            inpainting_fill_mode,
-            zoom_speed,
-            seed,
-            outputsizeW,
-            outputsizeH,
-            sampler,
-            upscale_do,
-            upscaler_name,
-            upscale_by,
-            overmask,
-            inpainting_denoising_strength,
-            inpainting_full_res,
-            inpainting_padding,
-            progress,
-        )
-    return result
-
-
-def prepare_output_path():
-    isCollect = shared.opts.data.get("infzoom_collectAllResources", False)
-    output_path = shared.opts.data.get("infzoom_outpath", "outputs")
-
-    save_path = os.path.join(
-        output_path, shared.opts.data.get("infzoom_outSUBpath", "infinite-zooms")
-    )
-
-    if isCollect:
-        save_path = os.path.join(save_path, "iz_collect" + str(int(time.time())))
-
-    if not os.path.exists(save_path):
-        os.makedirs(save_path)
-
-    video_filename = os.path.join(
-        save_path, "infinite_zoom_" + str(int(time.time())) + ".mp4"
-    )
-
-    return {
-        "isCollect": isCollect,
-        "save_path": save_path,
-        "video_filename": video_filename,
-    }
-
-
-def save2Collect(img, out_config, name):
-    if out_config["isCollect"]:
-        img.save(f'{out_config["save_path"]}/{name}.png')
-
-
-def frame2Collect(all_frames, out_config):
-    save2Collect(all_frames[-1], out_config, f"frame_{len(all_frames)}")
-
-
-def frames2Collect(all_frames, out_config):
-    for i, f in enumerate(all_frames):
-        save2Collect(f, out_config, f"frame_{i}")
-
-
-def crop_inner_image(outpainted_img, width_offset, height_offset):
-    width, height = outpainted_img.size
-
-    center_x, center_y = int(width / 2), int(height / 2)
-
-    # Crop the image to the center
-    cropped_img = outpainted_img.crop(
-        (
-            center_x - width_offset,
-            center_y - height_offset,
-            center_x + width_offset,
-            center_y + height_offset,
-        )
-    )
-    prev_step_img = cropped_img.resize((width, height), resample=Image.LANCZOS)
-    # resized_img = resized_img.filter(ImageFilter.SHARPEN)
-
-    return prev_step_img
-
-
-def create_zoom_single(
-    common_prompt_pre,
-    prompts_array,
-    common_prompt_suf,
-    negative_prompt,
-    num_outpainting_steps,
-    guidance_scale,
-    num_inference_steps,
-    custom_init_image,
-    custom_exit_image,
-    video_frame_rate,
-    video_zoom_mode,
-    video_start_frame_dupe_amount,
-    video_last_frame_dupe_amount,
-    inpainting_mask_blur,
-    inpainting_fill_mode,
-    zoom_speed,
-    seed,
-    outputsizeW,
-    outputsizeH,
-    sampler,
-    upscale_do,
-    upscaler_name,
-    upscale_by,
-    overmask,
-    inpainting_denoising_strength,
-    inpainting_full_res,
-    inpainting_padding,
-    progress,
-):
-    # try:
-    #     if gr.Progress() is not None:
-    #         progress = gr.Progress()
-    #         progress(0, desc="Preparing Initial Image")
-    # except Exception:
-    #     pass
-    fix_env_Path_ffprobe()
-    out_config = prepare_output_path()
-
+    out_config = {}
    prompts = {}
+    main_frames:Image = []

-    for x in prompts_array:
-        try:
-            key = int(x[0])
-            value = str(x[1])
-            prompts[key] = value
-        except ValueError:
-            pass
+    mask_width: int
+    mask_height: int
+    current_seed: int
+    contVW: ContinuousVideoWriter

-    assert len(prompts_array) > 0, "prompts is empty"
+    def create_zoom(self):
+        for i in range(self.C.batchcount):
+            print(f"Batch {i+1}/{self.C.batchcount}")
+            result = self.create_zoom_single()
+        return result

-    width = closest_upper_divisible_by_eight(outputsizeW)
-    height = closest_upper_divisible_by_eight(outputsizeH)
+    def create_zoom_single(self):
+        # try:
+        #     if gr.Progress() is not None:
+        #         progress = gr.Progress()
+        #         progress(0, desc="Preparing Initial Image")
+        # except Exception:
+        #     pass

-    current_image = Image.new(mode="RGBA", size=(width, height))
-    mask_image = np.array(current_image)[:, :, 3]
-    mask_image = Image.fromarray(255 - mask_image).convert("RGB")
-    current_image = current_image.convert("RGB")
-    current_seed = seed
+        self.width = closest_upper_divisible_by_eight(self.C.outputsizeW)
+        self.height = closest_upper_divisible_by_eight(self.C.outputsizeH)

-    if custom_init_image:
-        current_image = custom_init_image.resize(
-            (width, height), resample=Image.LANCZOS
-        )
-        save2Collect(current_image, out_config, f"init_custom.png")
+        self.current_seed = self.C.seed
+
+        if self.C.custom_init_image:
+            current_image = Image.new(mode="RGBA", size=(self.width, self.height))
+            current_image = current_image.convert("RGB")
+            current_image = self.C.custom_init_image.resize(
+                (self.width, self.height), resample=Image.LANCZOS
+            )
+            self.save2Collect(current_image, f"init_custom.png")
+
+        else:
+            load_model_from_setting(
+                "infzoom_txt2img_model", self.C.progress, "Loading Model for txt2img: "
+            )
+
+            processed, newseed = self.renderFirstFrame()
+
+            if len(processed.images) > 0:
+                current_image = processed.images[0]
+                self.save2Collect(current_image, f"init_txt2img.png")
+            self.current_seed = newseed
+
+        self.mask_width = math.trunc(self.width / 4)  # was initially 512px => 128px
+        self.mask_height = math.trunc(self.height / 4)  # was initially 512px => 128px
+
+        self.num_interpol_frames = round(self.C.video_frame_rate * self.C.zoom_speed)

-    else:
        load_model_from_setting(
-            "infzoom_txt2img_model", progress, "Loading Model for txt2img: "
+            "infzoom_inpainting_model", self.C.progress, "Loading Model for inpainting/img2img: "
+        )
+        self.main_frames.append(current_image) # init or first txt2img
+        self.main_frames, processed = self.outpaint_steps_cornerStrategy()
+        
+        if (self.C.upscale_do):
+            for idx,mf in enumerate(self.main_frames):
+                print (f"\033[KInfZoom: Upscaling mainframe: {idx}   \r")
+                self.main_frames[idx]=do_upscaleImg(mf, self.C.upscale_do, self.C.upscaler_name, self.C.upscale_by)
+
+            self.width  = self.main_frames[0].width
+            self.height = self.main_frames[0].height
+            self.mask_width = self.width/4
+            self.mask_height = self.height/4
+
+        if self.C.video_zoom_mode:
+            self.main_frames = self.main_frames[::-1]
+
+        self.contVW = ContinuousVideoWriter(self.out_config["video_filename"], self.main_frames[0],self.C.video_frame_rate,int(self.C.video_start_frame_dupe_amount))
+        
+        self.interpolateFrames()
+
+        self.contVW.finish(self.main_frames[-1],int(self.C.video_last_frame_dupe_amount))
+
+        print("Video saved in: " + os.path.join(script_path, self.out_config["video_filename"]))
+
+        return (
+            self.out_config["video_filename"],
+            self.main_frames,
+            processed.js(),
+            plaintext_to_html(processed.info),
+            plaintext_to_html(""),
        )

-        pr = prompts[min(k for k in prompts.keys() if k >= 0)]
-        processed, newseed = renderTxt2Img(
-            f"{common_prompt_pre}\n{pr}\n{common_prompt_suf}".strip(),
-            negative_prompt,
-            sampler,
-            num_inference_steps,
-            guidance_scale,
-            current_seed,
-            width,
-            height,
+    def renderFirstFrame(self):
+        pr = self.getInitialPrompt()
+
+        return renderTxt2Img(
+                f"{self.C.common_prompt_pre}\n{pr}\n{self.C.common_prompt_suf}".strip(),
+                self.C.negative_prompt,
+                self.C.sampler,
+                self.C.num_inference_steps,
+                self.C.guidance_scale,
+                self.current_seed,
+                self.width,
+                self.height
+            )
+
+    def getInitialPrompt(self):
+        return self.prompts[min(k for k in self.prompts.keys() if k >= 0)]
+    
+    def outpaint_steps_cornerStrategy(self):
+        currentImage = self.main_frames[-1]
+
+        original_width, original_height = currentImage.size
+
+        new_width = original_width + self.mask_width*2
+        new_height = original_height + self.mask_height*2
+        left = right = int(self.mask_width)
+        top = bottom = int(self.mask_height)
+
+        corners = [
+            (0, 0),  
+            (new_width - 512, 0),  
+            (0, new_height - 512),  
+            (new_width - 512, new_height - 512),  
+        ]
+        masked_images = []
+        
+        for idx, corner in enumerate(corners):
+            white = Image.new("1", (new_width,new_height), 1)
+            draw = ImageDraw.Draw(white)
+            draw.rectangle([corner[0], corner[1], corner[0]+512, corner[1]+512], fill=0)
+            masked_images.append(white)
+
+        outpaint_steps=len(self.prompts) 
+        for i in range(outpaint_steps):
+            print (f"Outpaint step: {str(i + 1)}/{str(outpaint_steps)} Seed: {str(self.current_seed)}")
+            currentImage = self.main_frames[-1]
+
+            if self.C.custom_exit_image and ((i + 1) == outpaint_steps):
+                currentImage = self.C.custom_exit_image.resize(
+                    (self.C.width, self.C.height), resample=Image.LANCZOS
+                )
+                self.main_frames.append(currentImage.convert("RGB"))
+                # print("using Custom Exit Image")
+                self.save2Collect(currentImage, self.out_config, f"exit_img.png")
+            else:
+                expanded_image = ImageOps.expand(currentImage, (left, top, right, bottom), fill=(0, 0, 0))
+                pr = self.prompts[max(k for k in self.prompts.keys() if k <= i)]
+                
+                # outpaint 4 corners loop
+                for idx,cornermask in enumerate(masked_images):
+                    processed, newseed = renderImg2Img(
+                        f"{self.C.common_prompt_pre}\n{pr}\n{self.C.common_prompt_suf}".strip(),
+                        self.C.negative_prompt,
+                        self.C.sampler,
+                        self.C.num_inference_steps,
+                        self.C.guidance_scale,
+                        self.current_seed,
+                        512,  #outpaintsizeW
+                        512,  #outpaintsizeH
+                        expanded_image,
+                        cornermask,
+                        1, #inpainting_denoising_strength,
+                        0, # inpainting_mask_blur,
+                        2, ## noise? fillmode
+                        True,  # only masked, not full, keep size of expandedimage!
+                        0 #inpainting_padding,
+                    )
+                    expanded_image = processed.images[0]
+                #
+                
+                if len(processed.images) > 0:
+                    zoomed_img = expanded_image.resize((self.width,self.height), Image.Resampling.LANCZOS)
+                    self.main_frames.append(zoomed_img)
+                    processed.images[0]=self.main_frames[-1]
+                    self.save2Collect(processed.images[0], f"outpaint_step_{i}.png")
+                seed = newseed
+                # TODO: seed behavior
+
+        return self.main_frames, processed
+
+    def interpolateFrames(self):
+        for i in range(len(self.main_frames) - 1):
+            # interpolation steps between 2 inpainted images (=sequential zoom and crop)
+            for j in range(self.num_interpol_frames - 1):
+
+                print (f"\033[KInfZoom: Interpolate frame: main/inter: {i}/{j}   \r")
+                #todo: howto zoomIn when writing each frame; self.main_frames are inverted, howto interpolate?
+                if self.C.video_zoom_mode:
+                    current_image = self.main_frames[i + 1]
+                else:
+                    current_image = self.main_frames[i + 1]
+                    
+                interpol_image = current_image
+                self.save2Collect(interpol_image, f"interpol_img_{i}_{j}].png")
+
+                interpol_width = math.ceil(
+                    ( 1 - (1 - 2 * self.mask_width / self.width) **(1 - (j + 1) / self.num_interpol_frames) ) 
+                    * self.width / 2
+                )
+
+                interpol_height = math.ceil(
+                    ( 1 - (1 - 2 * self.mask_height / self.height) ** (1 - (j + 1) / self.num_interpol_frames) )
+                    * self.height/2
+                )
+
+                interpol_image = interpol_image.crop(
+                    (
+                        interpol_width,
+                        interpol_height,
+                        self.width - interpol_width,
+                        self.height - interpol_height,
+                    )
+                )
+
+                interpol_image = interpol_image.resize((self.width, self.height))
+                self.save2Collect(interpol_image, f"interpol_resize_{i}_{j}.png")
+
+                # paste the higher resolution previous image in the middle to avoid drop in quality caused by zooming
+                interpol_width2 = math.ceil(
+                    (1 - (self.width - 2 * self.mask_width) / (self.width - 2 * interpol_width))
+                    / 2 * self.width
+                )
+
+                interpol_height2 = math.ceil(
+                    (1 - (self.height - 2 * self.mask_height) / (self.height - 2 * interpol_height))
+                    / 2 * self.height
+                )
+
+                prev_image_fix_crop = shrink_and_paste_on_blank(
+                    self.main_frames[i], interpol_width2, interpol_height2
+                )
+
+                interpol_image.paste(prev_image_fix_crop, mask=prev_image_fix_crop)
+                self.save2Collect(interpol_image, f"interpol_prevcrop_{i}_{j}.png")
+
+                self.contVW.append([interpol_image])
+
+            self.contVW.append([current_image])
+
+
+    def prepare_output_path(self):
+        isCollect = shared.opts.data.get("infzoom_collectAllResources", False)
+        output_path = shared.opts.data.get("infzoom_outpath", "outputs")
+
+        save_path = os.path.join(
+            output_path, shared.opts.data.get("infzoom_outSUBpath", "infinite-zooms")
        )
-        if len(processed.images) > 0:
-            current_image = processed.images[0]
-            save2Collect(current_image, out_config, f"init_txt2img.png")
-        current_seed = newseed

-    mask_width = math.trunc(width / 4)  # was initially 512px => 128px
-    mask_height = math.trunc(height / 4)  # was initially 512px => 128px
+        if isCollect:
+            save_path = os.path.join(save_path, "iz_collect" + str(int(time.time())))

-    num_interpol_frames = round(video_frame_rate * zoom_speed)
+        if not os.path.exists(save_path):
+            os.makedirs(save_path)

-    load_model_from_setting(
-        "infzoom_inpainting_model", progress, "Loading Model for inpainting/img2img: "
-    )
-    main_frames, processed = outpaint_steps_cornerStrategy(
-        width,
-        height,
+        video_filename = os.path.join(
+            save_path, "infinite_zoom_" + str(int(time.time())) + ".mp4"
+        )
+
+        return {
+            "isCollect": isCollect,
+            "save_path": save_path,
+            "video_filename": video_filename,
+        }
+
+
+    def save2Collect(self, img, name):
+        if self.out_config["isCollect"]:
+            img.save(f'{self.out_config["save_path"]}/{name}.png')
+
+
+    def frame2Collect(self,all_frames):
+        self.save2Collect(all_frames[-1], self.out_config, f"frame_{len(all_frames)}")
+
+
+    def frames2Collect(self, all_frames):
+        for i, f in enumerate(all_frames):
+            self.save2Collect(f, self.out_config, f"frame_{i}")
+
+
+    def crop_inner_image(self, outpainted_img, width_offset, height_offset):
+        width, height = outpainted_img.size
+
+        center_x, center_y = int(width / 2), int(height / 2)
+
+        # Crop the image to the center
+        cropped_img = outpainted_img.crop(
+            (
+                center_x - width_offset,
+                center_y - height_offset,
+                center_x + width_offset,
+                center_y + height_offset,
+            )
+        )
+        prev_step_img = cropped_img.resize((width, height), resample=Image.LANCZOS)
+        # resized_img = resized_img.filter(ImageFilter.SHARPEN)
+
+        return prev_step_img
+
+
+
+# to be called from Gradio or other client
+def createZoom(
+    common_prompt_pre:str,
+    prompts_array:list[str],
+    common_prompt_suf:str,
+    negative_prompt:str,
+    num_outpainting_steps: int,
+    guidance_scale:float,
+    num_inference_steps:int,
+    custom_init_image:Image,
+    custom_exit_image:Image,
+    video_frame_rate:int,
+    video_zoom_mode:int,
+    video_start_frame_dupe_amount:int,
+    video_last_frame_dupe_amount:int,
+    inpainting_mask_blur:int,
+    inpainting_fill_mode:int,
+    zoom_speed:float,
+    seed:int,
+    outputsizeW:int,
+    outputsizeH:int,
+    batchcount:int,
+    sampler:str,
+    upscale_do:bool,
+    upscaler_name:str,
+    upscale_by:float,
+    overmask:int,
+    inpainting_denoising_strength:float=1,
+    inpainting_full_res:int =0,
+    inpainting_padding:int=0,
+    progress:any=None
+):
+    iz = InfZoomConfig(
        common_prompt_pre,
+        prompts_array,
        common_prompt_suf,
-        prompts,
        negative_prompt,
-        seed,
-        sampler,
-        num_inference_steps,
+        num_outpainting_steps,
        guidance_scale,
-        inpainting_denoising_strength,
+        num_inference_steps,
+        custom_init_image,
+        custom_exit_image,
+        video_frame_rate,
+        video_zoom_mode,
+        video_start_frame_dupe_amount,
+        video_last_frame_dupe_amount,
        inpainting_mask_blur,
        inpainting_fill_mode,
+        zoom_speed,
+        seed,
+        outputsizeW,
+        outputsizeH,
+        batchcount,
+        sampler,
+        upscale_do,
+        upscaler_name,
+        upscale_by,
+        overmask,
+        inpainting_denoising_strength,
        inpainting_full_res,
        inpainting_padding,
-        current_image,
-        num_outpainting_steps,
-        out_config,
-        mask_width,
-        mask_height,
-        custom_exit_image,
-        overmask
+        progress
    )
-    
-    if (upscale_do):
-        for idx,mf in enumerate(main_frames):
-            print (f"\033[KInfZoom: Upscaling mainframe: {idx}   \r")
-            main_frames[idx]=do_upscaleImg(mf, upscale_do, upscaler_name, upscale_by)
-
-        width  = main_frames[0].width
-        height = main_frames[0].height
-        mask_width = width/4
-        mask_height = height/4
-
-    if video_zoom_mode:
-        main_frames = main_frames[::-1]
-
-    contVW = ContinuousVideoWriter(out_config["video_filename"], main_frames[0],video_frame_rate,int(video_start_frame_dupe_amount))
-    
-    interpolateFrames(out_config, width, height, mask_width, mask_height, num_interpol_frames, contVW, main_frames, video_zoom_mode)
-
-    contVW.finish(main_frames[-1],int(video_last_frame_dupe_amount))
-
-    print("Video saved in: " + os.path.join(script_path, out_config["video_filename"]))
-
-    return (
-        out_config["video_filename"],
-        main_frames,
-        processed.js(),
-        plaintext_to_html(processed.info),
-        plaintext_to_html(""),
-    )
-
-def interpolateFrames(out_config, width, height, mask_width, mask_height, num_interpol_frames, contVW, main_frames, zoomIn):
-    for i in range(len(main_frames) - 1):
-        # interpolation steps between 2 inpainted images (=sequential zoom and crop)
-        for j in range(num_interpol_frames - 1):
-
-            print (f"\033[KInfZoom: Interpolate frame: main/inter: {i}/{j}   \r")
-            #todo: howto zoomIn when writing each frame; main_frames are inverted, howto interpolate?
-            if zoomIn:
-                current_image = main_frames[i + 1]
-            else:
-                current_image = main_frames[i + 1]
-                
-            interpol_image = current_image
-            save2Collect(interpol_image, out_config, f"interpol_img_{i}_{j}].png")
-
-            interpol_width = math.ceil(
-                (
-                    1
-                    - (1 - 2 * mask_width / width)
-                    ** (1 - (j + 1) / num_interpol_frames)
-                )
-                * width
-                / 2
-            )
-
-            interpol_height = math.ceil(
-                (
-                    1
-                    - (1 - 2 * mask_height / height)
-                    ** (1 - (j + 1) / num_interpol_frames)
-                )
-                * height
-                / 2
-            )
-
-            interpol_image = interpol_image.crop(
-                (
-                    interpol_width,
-                    interpol_height,
-                    width - interpol_width,
-                    height - interpol_height,
-                )
-            )
-
-            interpol_image = interpol_image.resize((width, height))
-            save2Collect(interpol_image, out_config, f"interpol_resize_{i}_{j}.png")
-
-            # paste the higher resolution previous image in the middle to avoid drop in quality caused by zooming
-            interpol_width2 = math.ceil(
-                (1 - (width - 2 * mask_width) / (width - 2 * interpol_width))
-                / 2
-                * width
-            )
-
-            interpol_height2 = math.ceil(
-                (1 - (height - 2 * mask_height) / (height - 2 * interpol_height))
-                / 2
-                * height
-            )
-
-            prev_image_fix_crop = shrink_and_paste_on_blank(
-                main_frames[i], interpol_width2, interpol_height2
-            )
-
-            #interpol_image.paste(prev_image_fix_crop, mask=prev_image_fix_crop)
-            save2Collect(interpol_image, out_config, f"interpol_prevcrop_{i}_{j}.png")
-
-            contVW.append([interpol_image])
-
-        contVW.append([current_image])
+    return InfZoomer(iz).create_zoom()
--- a/iz_helpers/ui.py
+++ b/iz_helpers/ui.py
@ -1,5 +1,5 @@
 import gradio as gr
-from .run import create_zoom
+from .run import createZoom
 import modules.shared as shared
 from webui import wrap_gradio_gpu_call
 from modules.ui import create_output_panel
@ -273,7 +273,7 @@ Our best experience and trade-off is the R-ERSGAn4x upscaler.
                )

        generate_btn.click(
-            fn=wrap_gradio_gpu_call(create_zoom, extra_outputs=[None, "", ""]),
+            fn=wrap_gradio_gpu_call(createZoom, extra_outputs=[None, "", ""]),
            inputs=[
                main_common_prompt_pre,
                main_prompts,