import modules.scripts as scripts
|
|
import gradio as gr
|
|
import os
|
|
|
|
from modules.processing import process_images, Processed
|
|
from modules.paths import models_path
|
|
from modules.textual_inversion import autocrop
|
|
import cv2
|
|
import copy
|
|
import numpy as np
|
|
from PIL import Image
|
|
import glob
|
|
|
|
|
|
def x_ceiling(value, step):
    """Round *value* up to the nearest multiple of *step*."""
    quotient, remainder = divmod(value, step)
    if remainder:
        quotient += 1
    return quotient * step
|
|
|
|
def remove_pngs_in_dir(path):
    """Delete every .png file directly inside *path*.

    Silently does nothing when *path* is not an existing directory.
    """
    if not os.path.isdir(path):
        return
    for png_path in glob.glob(os.path.join(path, "*.png")):
        os.remove(png_path)
|
|
|
|
|
|
def resize_img(img, w, h):
    """Resize image array *img* to (w, h).

    Picks cv2.INTER_CUBIC when the target is larger than the source
    (sum-of-sides heuristic) and cv2.INTER_AREA when shrinking — the
    conventional best-quality choice for each direction.

    Fixed: the original used an accidental chained assignment
    (`interpolation = interpolation=cv2.INTER_CUBIC`), which parsed as
    `a = a = value`; harmless but misleading.
    """
    if img.shape[0] + img.shape[1] < h + w:
        interpolation = cv2.INTER_CUBIC   # upscaling
    else:
        interpolation = cv2.INTER_AREA    # downscaling

    return cv2.resize(img, (w, h), interpolation=interpolation)
|
|
|
|
|
|
class Script(scripts.Script):
    """ebsynth utility img2img batch script.

    Runs img2img over every key frame PNG in <project_dir>/video_key and
    writes the results to <project_dir>/img2img_key, optionally applying a
    per-frame mask from <project_dir>/video_mask. With "Face Crop img2img"
    enabled, each detected face is additionally re-rendered at ~512px and
    blended back into the frame for better facial detail.
    """

    # cv2.FaceDetectorYN instance, created lazily on first use and reused.
    face_detector = None
    # File name of the cached elliptical blend mask (written in scripts dir).
    face_merge_mask_filename = "face_crop_img2img_mask.png"
    # Blend mask as a float array scaled to [0, 1]; cached after first load.
    face_merge_mask_image = None

    def title(self):
        """Name displayed in the script dropdown menu."""
        return "ebsynth utility"

    def show(self, is_img2img):
        """Show this script only on the img2img tab."""
        return is_img2img

    def ui(self, is_img2img):
        """Build the Gradio UI; the returned components' values are passed
        to run() as positional parameters, in this order."""
        project_dir = gr.Textbox(label='Project directory', lines=1)

        with gr.Group():
            is_facecrop = gr.Checkbox(False, label="use Face Crop img2img")
            max_crop_size = gr.Slider(minimum=0, maximum=2048, step=1, value=1024, label="Max Crop Size")
            face_denoising_strength = gr.Slider(minimum=0.00, maximum=1.00, step=0.01, value=0.5, label="Face Denoising Strength")
            face_area_magnification = gr.Slider(minimum=1.00, maximum=3.00, step=0.01, value=1.5, label="Face Area Magnification")

            with gr.Column():
                enable_face_prompt = gr.Checkbox(False, label="Enable Face Prompt")
                face_prompt = gr.Textbox(label="Face Prompt", show_label=False, lines=2,
                                        placeholder="Prompt for Face",
                                        value = "face close up,"
                                        )

        return [project_dir, is_facecrop, max_crop_size, face_denoising_strength, face_area_magnification, enable_face_prompt, face_prompt]

    def detect_face(self, img_array):
        """Detect faces in a uint8 image array.

        Returns the (retval, faces) tuple from cv2.FaceDetectorYN.detect();
        ``faces`` is None when nothing is detected (callers check for None).
        The YuNet ONNX model is downloaded and cached on first use.
        """
        if not self.face_detector:
            dnn_model_path = autocrop.download_and_cache_models(os.path.join(models_path, "opencv"))
            self.face_detector = cv2.FaceDetectorYN.create(dnn_model_path, "", (0, 0))

        # Drop a possible alpha channel; the detector expects 3 channels.
        img_array = img_array[:,:,:3]

        self.face_detector.setInputSize((img_array.shape[1], img_array.shape[0]))
        return self.face_detector.detect(img_array)

    def get_mask(self):
        """Return the elliptical face-blend mask as a float array in [0, 1].

        Generated once on disk (soft-edged white ellipse on black, 512x512)
        and cached in memory afterwards.
        """
        def create_mask( output, x_rate, y_rate, k_size ):
            img = np.zeros((512, 512, 3))
            # Filled white ellipse covering x_rate/y_rate of the canvas.
            img = cv2.ellipse(img, ((256, 256), (int(512 * x_rate), int(512 * y_rate)), 0), (255, 255, 255), thickness=-1)
            # Gaussian blur softens the edge so the pasted face blends in.
            img = cv2.GaussianBlur(img, (k_size, k_size), 0)
            cv2.imwrite(output, img)

        if self.face_merge_mask_image is None:
            mask_file_path = os.path.join( scripts.basedir(), self.face_merge_mask_filename )
            if not os.path.isfile(mask_file_path):
                create_mask( mask_file_path, 0.9, 0.9, 91)

            # Normalize 0-255 pixel values to a 0-1 float blend factor.
            self.face_merge_mask_image = cv2.imread( mask_file_path ) / 255

        return self.face_merge_mask_image

    def face_crop_img2img(self, p, max_crop_size, face_denoising_strength, face_area_magnification, enable_face_prompt, face_prompt):
        """img2img the whole frame, then img2img each detected face crop
        separately and blend the results back over the frame.

        Returns the Processed object of the base pass with images[0]
        replaced by the face-merged composite. Falls back to a plain
        process_images(p) when no usable face is found.

        Fixed: the face-prompt prefix was prepended to face_p.prompt inside
        the per-face loop, so with multiple faces the prefix accumulated
        ("close-up face ,close-up face ,..."); it is now built from the
        original p.prompt each iteration.
        """

        def img_crop( img, face_coords,face_area_magnification,max_crop_size):
            # Crop each face box (grown by face_area_magnification around its
            # center and clamped to the image), then resize so the short side
            # is 512 and the long side is rounded up to a multiple of 64.
            img_array = np.array(img)
            face_imgs =[]
            new_coords = []

            for face in face_coords:
                x = int(face[0])
                y = int(face[1])
                w = int(face[2])
                h = int(face[3])
                print([x,y,w,h])

                # Faces larger than the configured limit are left untouched.
                if max(w,h) > max_crop_size:
                    print("ignore big face")
                    continue

                cx = x + int(w/2)
                cy = y + int(h/2)

                # Grow around the center, clamping each edge to the image.
                x = cx - int(w*face_area_magnification / 2)
                x = x if x > 0 else 0
                w = cx + int(w*face_area_magnification / 2) - x
                w = w if x+w < img.width else img.width - x

                y = cy - int(h*face_area_magnification / 2)
                y = y if y > 0 else 0
                h = cy + int(h*face_area_magnification / 2) - y
                h = h if y+h < img.height else img.height - y

                print([x,y,w,h])

                face_imgs.append( img_array[y: y+h, x: x+w] )
                new_coords.append( [x,y,w,h] )

            resized = []
            for face_img in face_imgs:
                if face_img.shape[1] < face_img.shape[0]:
                    re_w = 512
                    re_h = int(x_ceiling( (512 / face_img.shape[1]) * face_img.shape[0] , 64))
                else:
                    re_w = int(x_ceiling( (512 / face_img.shape[0]) * face_img.shape[1] , 64))
                    re_h = 512
                face_img = resize_img(face_img, re_w, re_h)
                resized.append( Image.fromarray(face_img))

            return resized, new_coords

        def merge_face(img, face_img, face_coord, base_img_size, mask):
            # Paste an img2img-ed face back onto img, alpha-blended with the
            # soft elliptical mask. Coordinates are rescaled in case the base
            # pass produced a different output resolution.
            x_rate = img.width / base_img_size[0]
            y_rate = img.height / base_img_size[1]

            img_array = np.array(img)
            x = int(face_coord[0] * x_rate)
            y = int(face_coord[1] * y_rate)
            w = int(face_coord[2] * x_rate)
            h = int(face_coord[3] * y_rate)

            face_array = np.array(face_img)
            face_array = resize_img(face_array, w, h)
            mask = resize_img(mask, w, h)

            bg = img_array[y: y+h, x: x+w]
            # mask is in [0, 1]: 1 keeps the new face, 0 keeps the background.
            img_array[y: y+h, x: x+w] = mask * face_array + (1-mask)*bg

            return Image.fromarray(img_array)

        def detect_face(img, mask):
            # Detect faces, optionally restricted to the white area of the
            # inpaint mask so masked-out regions cannot contribute faces.
            img_array = np.array(img)

            if mask is None:
                return self.detect_face(img_array)

            # NOTE(review): assumes the mask broadcasts against the image
            # (same channel layout); a single-channel mask of different
            # shape would fail here — confirm what callers pass in.
            mask_array = np.array(mask)/255

            img_array = mask_array * img_array

            return self.detect_face(img_array.astype(np.uint8))

        ### face detect in base img
        base_img = p.init_images[0]
        base_img_size = (base_img.width, base_img.height)

        _, face_coords = detect_face(base_img, p.image_mask)

        if face_coords is None:
            print("no face detected")
            return process_images(p)

        print(face_coords)
        face_imgs, new_coords = img_crop(base_img, face_coords, face_area_magnification, max_crop_size)

        # All detected faces may have been skipped as too large.
        if not face_imgs:
            return process_images(p)

        # Copy before the base pass: process_images may mutate p in place.
        face_p = copy.copy(p)

        ### img2img base img
        proc = process_images(p)

        ### img2img for each face
        face_img2img_results = []

        for face, coord in zip(face_imgs, new_coords):
            face_p.init_images = [face]
            face_p.width = face.width
            face_p.height = face.height
            face_p.denoising_strength = face_denoising_strength

            if enable_face_prompt:
                face_p.prompt = face_prompt
            else:
                # Build from the ORIGINAL prompt so the prefix does not
                # accumulate across faces (bug in the previous version).
                face_p.prompt = "close-up face ," + p.prompt

            if p.image_mask is not None:
                # Restrict the face pass to the matching crop of the mask.
                x,y,w,h = coord
                face_p.image_mask = Image.fromarray( np.array(p.image_mask)[y: y+h, x: x+w] )

            face_proc = process_images(face_p)
            face_img2img_results.append((face_proc.images[0], coord))

        ### merge faces
        bg = proc.images[0]
        mask = self.get_mask()

        for face_img, coord in face_img2img_results:
            bg = merge_face(bg, face_img, coord, base_img_size, mask)

        proc.images[0] = bg

        return proc

    def run(self, p, project_dir, is_facecrop, max_crop_size, face_denoising_strength, face_area_magnification, enable_face_prompt, face_prompt):
        """Entry point called with the values returned by ui().

        Iterates over every key frame in <project_dir>/video_key, runs
        img2img (plain or face-crop) on each with a copy of *p*, and saves
        the result under the same file name in <project_dir>/img2img_key.
        Returns the Processed object of the last frame.

        Fixed: when video_key contained no PNGs, the loop body never ran and
        `return proc` raised NameError on an unbound local; that case now
        falls back to a plain process_images(p) like the other early exits.
        """

        if not os.path.isdir(project_dir):
            print("project_dir not found")
            return process_images(p)

        frame_mask_path = os.path.join(project_dir, "video_mask")
        org_key_path = os.path.join(project_dir, "video_key")
        img2img_key_path = os.path.join(project_dir, "img2img_key")

        # Start from a clean output directory so stale frames never survive.
        remove_pngs_in_dir(img2img_key_path)
        os.makedirs(img2img_key_path, exist_ok=True)

        imgs = glob.glob( os.path.join(org_key_path ,"*.png") )
        if not imgs:
            # Previously fell through to `return proc` with proc unbound.
            print("no key frames found in " + org_key_path)
            return process_images(p)

        for img in imgs:

            image = Image.open(img)

            img_basename = os.path.basename(img)
            # A per-frame mask is optional; use it only when the file exists.
            mask_path = os.path.join( frame_mask_path , img_basename )

            mask = None
            if os.path.isfile( mask_path ):
                mask = Image.open(mask_path)

            # Shallow copy so per-frame init_images/image_mask do not leak
            # into subsequent frames.
            _p = copy.copy(p)

            _p.init_images=[image]
            _p.image_mask = mask

            if is_facecrop:
                proc = self.face_crop_img2img(_p, max_crop_size, face_denoising_strength, face_area_magnification, enable_face_prompt, face_prompt)
            else:
                proc = process_images(_p)

            proc.images[0].save( os.path.join( img2img_key_path , img_basename ) )

        return proc
|