SHARK-Studio/apps/shark_studio/web/ui/sd.py

import os
import json
import gradio as gr
import numpy as np
from inspect import signature
from PIL import Image
from pathlib import Path
from datetime import datetime as dt
from gradio.components.image_editor import (
    EditorValue,
)
from apps.shark_studio.web.utils.file_utils import (
    get_generated_imgs_path,
    get_checkpoints_path,
    get_checkpoints,
    get_configs_path,
    get_configs,
    write_default_sd_configs,
)
from apps.shark_studio.api.sd import (
    shark_sd_fn_dict_input,
    cancel_sd,
    unload_sd,
)
from apps.shark_studio.api.controlnet import (
    cnet_preview,
)
from apps.shark_studio.modules.schedulers import (
    scheduler_model_map,
)
from apps.shark_studio.modules.img_processing import (
    resampler_list,
    resize_stencil,
)
from apps.shark_studio.modules.shared_cmd_opts import cmd_opts
from apps.shark_studio.web.ui.utils import (
    amdlogo_loc,
    none_to_str_none,
    str_none_to_none,
)
from apps.shark_studio.web.utils.state import (
    status_label,
)
from apps.shark_studio.web.ui.common_events import lora_changed
from apps.shark_studio.modules import logger
import apps.shark_studio.web.utils.globals as global_obj

# Disabled some models for demo purposes
sd_default_models = [
    # "runwayml/stable-diffusion-v1-5",
    # "stabilityai/stable-diffusion-2-1-base",
    # "stabilityai/stable-diffusion-2-1",
    # "stabilityai/stable-diffusion-xl-base-1.0",
    # "stabilityai/sdxl-turbo",
]
sd_default_models.extend(get_checkpoints(model_type="scripts"))


def view_json_file(file_path):
    content = ""
    with open(file_path, "r") as fopen:
        content = fopen.read()
    return content


def submit_to_cnet_config(
    stencil: str,
    preprocessed_hint: str,
    cnet_strength: int,
    control_mode: str,
    curr_config: dict,
):
    if any(i in [None, ""] for i in [stencil, preprocessed_hint]):
        return gr.update()
    if curr_config is not None:
        if "controlnets" in curr_config:
            curr_config["controlnets"]["control_mode"] = control_mode
            curr_config["controlnets"]["model"].append(stencil)
            curr_config["controlnets"]["hint"].append(preprocessed_hint)
            curr_config["controlnets"]["strength"].append(cnet_strength)
            return curr_config

    cnet_map = {}
    cnet_map["controlnets"] = {
        "control_mode": control_mode,
        "model": [stencil],
        "hint": [preprocessed_hint],
        "strength": [cnet_strength],
    }
    return cnet_map


def update_embeddings_json(embedding):
    return {"embeddings": [embedding]}


def submit_to_main_config(input_cfg: dict, main_cfg: dict):
    if main_cfg in [None, "", {}]:
        return input_cfg

    for base_key in input_cfg:
        main_cfg[base_key] = input_cfg[base_key]
    return main_cfg


def pull_sd_configs(
    prompt,
    negative_prompt,
    sd_init_image,
    height,
    width,
    steps,
    strength,
    guidance_scale,
    seed,
    batch_count,
    batch_size,
    scheduler,
    base_model_id,
    custom_weights,
    custom_vae,
    precision,
    device,
    target_triple,
    ondemand,
    compiled_pipeline,
    resample_type,
    controlnets,
    embeddings,
):
    sd_args = str_none_to_none(locals())
    sd_cfg = {}
    for arg in sd_args:
        if arg in [
            "prompt",
            "negative_prompt",
            "sd_init_image",
        ]:
            sd_cfg[arg] = [sd_args[arg]]
        elif arg in ["controlnets", "embeddings"]:
            if isinstance(arg, dict):
                sd_cfg[arg] = json.loads(sd_args[arg])
            else:
                sd_cfg[arg] = {}
        else:
            sd_cfg[arg] = sd_args[arg]

    return json.dumps(sd_cfg)


def load_sd_cfg(sd_json: dict, load_sd_config: str):
    if os.path.exists(load_sd_config):
        config = load_sd_config
    elif os.path.exists(os.path.join(get_configs_path(), load_sd_config)):
        config = os.path.join(get_configs_path(), load_sd_config)
    else:
        print(
            "Default config not found as absolute path or in configs folder. Using sdxl-turbo as default config."
        )
        config = sd_json
    new_sd_config = none_to_str_none(json.loads(view_json_file(config)))
    if sd_json:
        for key in new_sd_config:
            sd_json[key] = new_sd_config[key]
    else:
        sd_json = new_sd_config
    for i in sd_json["sd_init_image"]:
        if i is not None:
            if os.path.isfile(i):
                sd_image = [Image.open(i, mode="r")]
    else:
        sd_image = None
    if not sd_json["device"]:
        sd_json["device"] = gr.update()

    return [
        sd_json["prompt"][0],
        sd_json["negative_prompt"][0],
        sd_image,
        sd_json["height"],
        sd_json["width"],
        gr.update(),
        sd_json["strength"],
        sd_json["guidance_scale"],
        sd_json["seed"],
        sd_json["batch_count"],
        sd_json["batch_size"],
        sd_json["scheduler"],
        sd_json["base_model_id"],
        sd_json["custom_weights"],
        sd_json["custom_vae"],
        sd_json["precision"],
        sd_json["device"],
        sd_json["target_triple"],
        sd_json["ondemand"],
        sd_json["compiled_pipeline"],
        sd_json["resample_type"],
        sd_json["controlnets"],
        sd_json["embeddings"],
        sd_json,
    ]


def save_sd_cfg(config: dict, save_name: str):
    if os.path.exists(save_name):
        filepath = save_name
    elif cmd_opts.configs_path:
        filepath = os.path.join(cmd_opts.configs_path, save_name)
    else:
        filepath = os.path.join(get_configs_path(), save_name)
    if ".json" not in filepath:
        filepath += ".json"
    with open(filepath, mode="w") as f:
        f.write(json.dumps(config))
    return save_name


def create_canvas(width, height):
    data = Image.fromarray(
        np.zeros(
            shape=(height, width, 3),
            dtype=np.uint8,
        )
        + 255
    )
    img_dict = {
        "background": data,
        "layers": [],
        "composite": None,
    }
    return EditorValue(img_dict)


def import_original(original_img, width, height):
    if original_img is None:
        resized_img = create_canvas(width, height)
        return resized_img
    else:
        resized_img, _, _ = resize_stencil(original_img, width, height)
        img_dict = {
            "background": resized_img,
            "layers": [],
            "composite": None,
        }
        return EditorValue(img_dict)


def base_model_changed(base_model_id):
    new_choices = get_checkpoints(
        os.path.join("checkpoints", os.path.basename(str(base_model_id)))
    ) + get_checkpoints(model_type="checkpoints")
    if "turbo" in base_model_id:
        new_steps = gr.Dropdown(
            value=2,
            choices=[1, 2],
            label="\U0001F3C3\U0000FE0F Steps",
            allow_custom_value=True,
        )
    if "stable-diffusion-xl-base-1.0" in base_model_id:
        new_steps = gr.Dropdown(
            value=40,
            choices=[20, 25, 30, 35, 40, 45, 50],
            label="\U0001F3C3\U0000FE0F Steps",
            allow_custom_value=True,
        )
    elif ".py" in base_model_id:
        new_steps = gr.Dropdown(
            value=20,
            choices=[10, 15, 20],
            label="\U0001F3C3\U0000FE0F Steps",
            allow_custom_value=True,
        )
    else:
        new_steps = gr.Dropdown(
            value=20,
            choices=[10, 20, 30, 40, 50],
            label="\U0001F3C3\U0000FE0F Steps",
            allow_custom_value=True,
        )

    return [
        gr.Dropdown(
            value=new_choices[0] if len(new_choices) > 0 else "None",
            choices=["None"] + new_choices,
        ),
        new_steps,
    ]


init_config = global_obj.get_init_config()
init_config = none_to_str_none(json.loads(view_json_file(init_config)))

with gr.Blocks(title="Stable Diffusion") as sd_element:
    with gr.Column(elem_id="ui_body"):
        with gr.Row():
            with gr.Column(scale=2, min_width=600):
                with gr.Group(elem_id="prompt_box_outer"):
                    prompt = gr.Textbox(
                        label="\U00002795\U0000FE0F Prompt",
                        value=init_config["prompt"][0],
                        lines=4,
                        elem_id="prompt_box",
                        show_copy_button=True,
                    )
                    negative_prompt = gr.Textbox(
                        label="\U00002796\U0000FE0F Negative Prompt",
                        value=init_config["negative_prompt"][0],
                        lines=4,
                        elem_id="negative_prompt_box",
                        show_copy_button=True,
                    )
                with gr.Accordion(
                    label="\U0001F4D0\U0000FE0F Advanced Settings", open=False
                ):
                    with gr.Accordion(label="Device Settings", open=False):
                        device = gr.Dropdown(
                            elem_id="device",
                            label="Device",
                            value=(
                                init_config["device"]
                                if init_config["device"]
                                else "rocm"
                            ),
                            choices=global_obj.get_device_list(),
                            allow_custom_value=True,
                        )
                        target_triple = gr.Textbox(
                            elem_id="target_triple",
                            label="Architecture",
                            value=init_config["target_triple"],
                        )
                        with gr.Row():
                            ondemand = gr.Checkbox(
                                value=init_config["ondemand"],
                                label="Low VRAM",
                                interactive=True,
                                visible=False,
                            )
                            precision = gr.Radio(
                                label="Precision",
                                value=init_config["precision"],
                                choices=[
                                    "fp16",
                                    "fp32",
                                ],
                                visible=False,
                            )
                    with gr.Row():
                        height = gr.Slider(
                            512,
                            1024,
                            value=512,
                            step=512,
                            label="\U00002195\U0000FE0F Height",
                            interactive=False,  # DEMO
                            visible=False,  # DEMO
                        )
                        width = gr.Slider(
                            512,
                            1024,
                            value=512,
                            step=512,
                            label="\U00002194\U0000FE0F Width",
                            interactive=False,  # DEMO
                            visible=False,  # DEMO
                        )

                    with gr.Accordion(
                        label="\U0001F9EA\U0000FE0F Input Image Processing",
                        open=False,
                        visible=False,
                    ):
                        strength = gr.Slider(
                            0,
                            1,
                            value=init_config["strength"],
                            step=0.01,
                            label="Denoising Strength",
                        )
                        resample_type = gr.Dropdown(
                            value=init_config["resample_type"],
                            choices=resampler_list,
                            label="Resample Type",
                            allow_custom_value=True,
                        )
                    with gr.Row():
                        sd_model_info = (
                            f"Checkpoint Path: {str(get_checkpoints_path())}"
                        )
                        base_model_id = gr.Dropdown(
                            label="\U000026F0\U0000FE0F Base Model",
                            info="Select or enter HF model ID",
                            elem_id="custom_model",
                            value=init_config["base_model_id"],
                            choices=sd_default_models,
                            allow_custom_value=True,
                        )  # base_model_id
                    with gr.Row(equal_height=True):
                        seed = gr.Textbox(
                            value=init_config["seed"],
                            label="\U0001F331\U0000FE0F Seed",
                            info="An integer, -1 for random",
                            show_copy_button=True,
                        )
                        scheduler = gr.Dropdown(
                            elem_id="scheduler",
                            label="\U0001F4C5\U0000FE0F Scheduler",
                            info="\U000E0020",  # forces same height as seed
                            value=init_config["scheduler"],
                            choices=scheduler_model_map.keys(),
                            allow_custom_value=False,
                            visible=False,
                        )
                    with gr.Row():
                        steps = gr.Dropdown(
                            value=20,
                            choices=[10, 15, 20],
                            label="\U0001F3C3\U0000FE0F Steps",
                            allow_custom_value=True,
                        )
                        guidance_scale = gr.Slider(
                            0,
                            5,  # DEMO
                            value=4,
                            step=0.1,
                            label="\U0001F5C3\U0000FE0F CFG Scale",
                            visible=False,
                        )
                    with gr.Row():
                        batch_count = gr.Slider(
                            1,
                            100,
                            value=init_config["batch_count"],
                            step=1,
                            label="Batch Count",
                            interactive=True,
                            visible=False,
                        )
                        batch_size = gr.Slider(
                            1,
                            4,
                            value=init_config["batch_size"],
                            step=1,
                            label="Batch Size",
                            interactive=False,  # DEMO
                            visible=False,
                        )
                        compiled_pipeline = gr.Checkbox(
                            value=init_config["compiled_pipeline"],
                            label="Faster txt2img (SDXL only)",
                            visible=False,  # DEMO
                        )
                    with gr.Row(elem_classes=["fill"], visible=False):
                        Path(get_configs_path()).mkdir(parents=True, exist_ok=True)
                        write_default_sd_configs(get_configs_path())
                        default_config_file = global_obj.get_init_config()
                        sd_json = gr.JSON(
                            elem_classes=["fill"],
                            value=view_json_file(default_config_file),
                        )
                    with gr.Row(visible=False):
                        with gr.Row():
                            load_sd_config = gr.Dropdown(
                                label="Load Config",
                                value=cmd_opts.defaults,
                                choices=get_configs(),
                                allow_custom_value=True,
                                visible=False,
                            )
                        with gr.Row():
                            save_sd_config = gr.Button(value="Save Config", size="sm")
                            clear_sd_config = gr.ClearButton(
                                value="Clear Config",
                                size="sm",
                                components=sd_json,
                            )
                            # with gr.Row():
                            sd_config_name = gr.Textbox(
                                value="Config Name",
                                info="Name of the file this config will be saved to.",
                                interactive=True,
                                show_label=False,
                            )
                with gr.Accordion(
                    label="\U00002696\U0000FE0F Model Weights",
                    open=False,
                    visible=False,  # DEMO
                ):
                    with gr.Column():
                        custom_weights = gr.Dropdown(
                            label="Checkpoint Weights",
                            info="Select or enter HF model ID",
                            elem_id="custom_model",
                            value=init_config["custom_weights"],
                            allow_custom_value=True,
                            choices=["None"]
                            + get_checkpoints(os.path.basename(str(base_model_id))),
                        )  # custom_weights
                        sd_vae_info = (str(get_checkpoints_path("vae"))).replace(
                            "\\", "\n\\"
                        )
                        sd_vae_info = f"VAE Path: {sd_vae_info}"
                        custom_vae = gr.Dropdown(
                            label=f"VAE Model",
                            info=sd_vae_info,
                            elem_id="custom_model",
                            value=init_config["custom_vae"],
                            choices=["None"] + get_checkpoints("vae"),
                            allow_custom_value=True,
                            scale=1,
                        )
                        sd_lora_info = (str(get_checkpoints_path("loras"))).replace(
                            "\\", "\n\\"
                        )
                        lora_opt = gr.Dropdown(
                            allow_custom_value=True,
                            label=f"Standalone LoRA Weights",
                            info=sd_lora_info,
                            elem_id="lora_weights",
                            value=(
                                init_config["embeddings"][0]
                                if (len(init_config["embeddings"].keys()) > 1)
                                else "None"
                            ),
                            multiselect=True,
                            choices=[] + get_checkpoints("lora"),
                            scale=2,
                        )
                        lora_tags = gr.HTML(
                            value="<div><i>No LoRA selected</i></div>",
                            elem_classes="lora-tags",
                        )
                        embeddings_config = gr.JSON(
                            label="Embeddings Options", min_width=50, scale=1
                        )
                        gr.on(
                            triggers=[lora_opt.change],
                            fn=lora_changed,
                            inputs=[lora_opt],
                            outputs=[lora_tags],
                            queue=True,
                            show_progress=False,
                        ).then(
                            fn=update_embeddings_json,
                            inputs=[lora_opt],
                            outputs=[embeddings_config],
                            show_progress=False,
                        )
                with gr.Accordion(
                    label="Controlnet Options",
                    open=False,
                    visible=False,
                ):
                    preprocessed_hints = gr.State([])
                    with gr.Column():
                        sd_cnet_info = (
                            str(get_checkpoints_path("controlnet"))
                        ).replace("\\", "\n\\")
                    with gr.Row():
                        cnet_config = gr.JSON()
                        with gr.Column():
                            clear_config = gr.ClearButton(
                                value="Clear Controlnet Config",
                                size="sm",
                                components=cnet_config,
                            )
                            control_mode = gr.Radio(
                                choices=["Prompt", "Balanced", "Controlnet"],
                                value="Balanced",
                                label="Control Mode",
                            )
                    with gr.Row():
                        with gr.Column(scale=1):
                            cnet_model = gr.Dropdown(
                                allow_custom_value=True,
                                label=f"Controlnet Model",
                                info=sd_cnet_info,
                                value="None",
                                choices=[
                                    "None",
                                    "canny",
                                    "openpose",
                                    "scribble",
                                    "zoedepth",
                                ]
                                + get_checkpoints("controlnet"),
                            )
                            cnet_strength = gr.Slider(
                                label="Controlnet Strength",
                                minimum=0,
                                maximum=100,
                                value=50,
                                step=1,
                            )
                            with gr.Row():
                                canvas_width = gr.Slider(
                                    label="Canvas Width",
                                    minimum=512,
                                    maximum=1024,
                                    value=512,
                                    step=512,
                                )
                                canvas_height = gr.Slider(
                                    label="Canvas Height",
                                    minimum=512,
                                    maximum=1024,
                                    value=512,
                                    step=512,
                                )
                            make_canvas = gr.Button(
                                value="Make Canvas!",
                            )
                            use_input_img = gr.Button(
                                value="Use Original Image",
                                size="sm",
                            )
                        cnet_input = gr.Image(
                            value=None,
                            type="pil",
                            image_mode="RGB",
                            interactive=True,
                        )
                        with gr.Column(scale=1):
                            cnet_output = gr.Image(
                                value=None,
                                visible=True,
                                label="Preprocessed Hint",
                                interactive=False,
                                show_label=True,
                            )
                            cnet_gen = gr.Button(
                                value="Preprocess controlnet input",
                            )
                            use_result = gr.Button(
                                "Submit",
                                size="sm",
                            )
                        make_canvas.click(
                            fn=create_canvas,
                            inputs=[canvas_width, canvas_height],
                            outputs=[cnet_input],
                            queue=False,
                        )
                        cnet_gen.click(
                            fn=cnet_preview,
                            inputs=[
                                cnet_model,
                                cnet_input,
                            ],
                            outputs=[
                                cnet_output,
                                preprocessed_hints,
                            ],
                        )
                        use_result.click(
                            fn=submit_to_cnet_config,
                            inputs=[
                                cnet_model,
                                cnet_output,
                                cnet_strength,
                                control_mode,
                                cnet_config,
                            ],
                            outputs=[
                                cnet_config,
                            ],
                            queue=False,
                        )
            with gr.Column(scale=3, min_width=600):
                with gr.Tabs() as sd_tabs:
                    sd_element.load(
                        # Workaround for Gradio issue #7085
                        # TODO: revert to setting selected= in gr.Tabs declaration
                        # once this is resolved in Gradio
                        lambda: gr.Tabs(selected=101),
                        outputs=[sd_tabs],
                    )
                    with gr.Tab(
                        label="Input Image", id=100, visible=False
                    ) as sd_tab_init_image:  # DEMO
                        with gr.Column(elem_classes=["sd-right-panel"]):
                            with gr.Row(elem_classes=["fill"]):
                                # TODO: make this import image prompt info if it exists
                                sd_init_image = gr.Image(
                                    type="pil",
                                    interactive=True,
                                    show_label=False,
                                )
                                use_input_img.click(
                                    fn=import_original,
                                    inputs=[
                                        sd_init_image,
                                        canvas_width,
                                        canvas_height,
                                    ],
                                    outputs=[cnet_input],
                                    queue=False,
                                )
                    with gr.Tab(label="Generate Images", id=101) as sd_tab_gallery:
                        with gr.Column(elem_classes=["sd-right-panel"]):
                            with gr.Row(elem_classes=["fill"]):
                                sd_gallery = gr.Gallery(
                                    label="Generated images",
                                    show_label=False,
                                    elem_id="gallery",
                                    columns=2,
                                    object_fit="fit",
                                    preview=True,
                                )
                            with gr.Row():
                                stable_diffusion = gr.Button("Start")
                                unload = gr.Button("Unload Models")
                                unload.click(
                                    fn=unload_sd,
                                    queue=False,
                                    show_progress=False,
                                )
                                stop_batch = gr.Button("Stop", visible=False)
                    # with gr.Tab(label="Config", id=102) as sd_tab_config:
                    #     with gr.Group():#elem_classes=["sd-right-panel"]):
                    #         with gr.Row(elem_classes=["fill"], visible=False):
                    #             Path(get_configs_path()).mkdir(
                    #                 parents=True, exist_ok=True
                    #             )
                    #             write_default_sd_configs(get_configs_path())
                    #             default_config_file = global_obj.get_init_config()
                    #             sd_json = gr.JSON(
                    #                 elem_classes=["fill"],
                    #                 value=view_json_file(default_config_file),
                    #             )
                    #         with gr.Row():
                    #             with gr.Row():
                    #                 load_sd_config = gr.Dropdown(
                    #                     label="Load Config",
                    #                     value=cmd_opts.defaults,
                    #                     choices=get_configs(),
                    #                     allow_custom_value=True,
                    #                 )
                    #             with gr.Row():
                    #                 save_sd_config = gr.Button(
                    #                     value="Save Config", size="sm"
                    #                 )
                    #                 clear_sd_config = gr.ClearButton(
                    #                     value="Clear Config",
                    #                     size="sm",
                    #                     components=sd_json,
                    #                 )
                    #                 # with gr.Row():
                    #                 sd_config_name = gr.Textbox(
                    #                     value="Config Name",
                    #                     info="Name of the file this config will be saved to.",
                    #                     interactive=True,
                    #                     show_label=False,
                    #                 )
                    with gr.Tab(label="Log", id=103, visible=False) as sd_tab_log:
                        with gr.Row():
                            std_output = gr.Textbox(
                                value=f"{sd_model_info}\n"
                                f"Images will be saved at "
                                f"{get_generated_imgs_path()}",
                                lines=2,
                                elem_id="std_output",
                                show_label=True,
                                label="Log",
                                show_copy_button=True,
                            )
                            sd_element.load(
                                logger.read_sd_logs, None, std_output, every=1
                            )
                            sd_status = gr.Textbox(visible=False)
    base_model_id.change(
        fn=base_model_changed,
        inputs=[base_model_id],
        outputs=[custom_weights, steps],
    )
    load_sd_config.change(
        fn=load_sd_cfg,
        inputs=[sd_json, load_sd_config],
        outputs=[
            prompt,
            negative_prompt,
            sd_init_image,
            height,
            width,
            steps,
            strength,
            guidance_scale,
            seed,
            batch_count,
            batch_size,
            scheduler,
            base_model_id,
            custom_weights,
            custom_vae,
            precision,
            device,
            target_triple,
            ondemand,
            compiled_pipeline,
            resample_type,
            cnet_config,
            embeddings_config,
            sd_json,
        ],
    )
    save_sd_config.click(
        fn=save_sd_cfg,
        inputs=[sd_json, sd_config_name],
        outputs=[sd_config_name],
    )
    pull_kwargs = dict(
        fn=pull_sd_configs,
        inputs=[
            prompt,
            negative_prompt,
            sd_init_image,
            height,
            width,
            steps,
            strength,
            guidance_scale,
            seed,
            batch_count,
            batch_size,
            scheduler,
            base_model_id,
            custom_weights,
            custom_vae,
            precision,
            device,
            target_triple,
            ondemand,
            compiled_pipeline,
            resample_type,
            cnet_config,
            embeddings_config,
        ],
        outputs=[
            sd_json,
        ],
    )

    status_kwargs = dict(
        fn=lambda bc, bs: status_label("Stable Diffusion", 0, bc, bs),
        inputs=[batch_count, batch_size],
        outputs=sd_status,
    )

    gen_kwargs = dict(
        fn=shark_sd_fn_dict_input,
        inputs=[sd_json],
        outputs=[
            sd_gallery,
            sd_status,
        ],
    )

    prompt_submit = prompt.submit(**status_kwargs).then(**pull_kwargs)
    neg_prompt_submit = negative_prompt.submit(**status_kwargs).then(**pull_kwargs)
    generate_click = (
        stable_diffusion.click(**status_kwargs).then(**pull_kwargs).then(**gen_kwargs)
    )
    stop_batch.click(
        fn=cancel_sd,
        cancels=[prompt_submit, neg_prompt_submit, generate_click],
    )