2023-01-28 23:09:19 +00:00
|
|
|
from logging import getLogger
|
2023-11-19 00:13:13 +00:00
|
|
|
from typing import Callable, Optional, Tuple
|
2023-01-28 14:19:40 +00:00
|
|
|
|
2023-02-05 23:24:08 +00:00
|
|
|
import numpy as np
|
2023-02-05 23:55:04 +00:00
|
|
|
import torch
|
2023-07-09 05:02:27 +00:00
|
|
|
from PIL import Image
|
2023-02-05 13:53:26 +00:00
|
|
|
|
2023-04-23 20:03:11 +00:00
|
|
|
from ..diffusers.load import load_pipeline
|
2023-07-10 04:49:34 +00:00
|
|
|
from ..diffusers.utils import (
|
|
|
|
encode_prompt,
|
|
|
|
get_latents_from_seed,
|
|
|
|
get_tile_latents,
|
|
|
|
parse_prompt,
|
|
|
|
)
|
2023-07-09 05:02:27 +00:00
|
|
|
from ..image import mask_filter_none, noise_source_histogram
|
2023-02-05 13:53:26 +00:00
|
|
|
from ..output import save_image
|
2023-02-12 00:10:36 +00:00
|
|
|
from ..params import Border, ImageParams, Size, SizeChart, StageParams
|
2023-02-26 05:49:39 +00:00
|
|
|
from ..server import ServerContext
|
2023-02-19 02:28:21 +00:00
|
|
|
from ..utils import is_debug
|
2023-02-26 20:15:30 +00:00
|
|
|
from ..worker import ProgressCallback, WorkerContext
|
2023-11-18 23:18:23 +00:00
|
|
|
from .base import BaseStage
|
2023-11-19 00:08:38 +00:00
|
|
|
from .result import StageResult
|
2023-01-28 14:19:40 +00:00
|
|
|
|
2023-01-28 23:09:19 +00:00
|
|
|
logger = getLogger(__name__)
|
|
|
|
|
2023-01-28 14:19:40 +00:00
|
|
|
|
2023-07-02 23:21:21 +00:00
|
|
|
class UpscaleOutpaintStage(BaseStage):
    """
    Stage that outpaints/inpaints each source image by running an inpaint
    diffusion pipeline over the regions selected by ``tile_mask``.

    NOTE(review): several keyword parameters (``border``, ``fill_color``,
    ``mask_filter``, ``noise_source``, ``stage_source``, ``stage_mask``)
    are accepted but never referenced in this body — presumably required by
    the shared stage ``run`` interface; confirm against ``BaseStage`` and
    the stage runner before removing.
    """

    # Maximum tile size this stage will accept from the tiler.
    max_tile = SizeChart.max

    def run(
        self,
        worker: WorkerContext,
        server: ServerContext,
        stage: StageParams,
        params: ImageParams,
        sources: StageResult,
        *,
        border: Border,
        dims: Tuple[int, int, int],
        tile_mask: Image.Image,
        fill_color: str = "white",
        mask_filter: Callable = mask_filter_none,
        noise_source: Callable = noise_source_histogram,
        latents: Optional[np.ndarray] = None,
        callback: Optional[ProgressCallback] = None,
        stage_source: Optional[Image.Image] = None,
        stage_mask: Optional[Image.Image] = None,
        **kwargs,
    ) -> StageResult:
        """
        Inpaint every image in ``sources`` using ``tile_mask`` as the mask.

        Parameters
        ----------
        worker:
            Worker context; only used here to select the execution device.
        server:
            Server context, passed through to pipeline loading and debug
            image output.
        stage, params:
            Stage and image parameters; ``params`` supplies the pipeline
            type, seed, step count, CFG scale, batch size and tile size.
        sources:
            Input images (and their metadata) from the previous stage.
        dims:
            Tile coordinates used when slicing an existing latent window
            via ``get_tile_latents``.
        tile_mask:
            Mask for the current tile; white regions are (re)painted.
        latents:
            Optional pre-generated latents to slice per-tile; when ``None``
            fresh latents are generated from ``params.seed``.
        callback:
            Optional per-step progress callback forwarded to the pipeline.

        Returns
        -------
        StageResult
            The painted images, carrying forward the source metadata.
        """
        prompt_pairs, loras, inversions, (prompt, negative_prompt) = parse_prompt(
            params
        )

        # Resolve a pipeline type compatible with inpainting, then load it
        # (with any LoRA weights / embeddings) on the worker's device.
        pipe_type = params.get_valid_pipeline("inpaint", params.pipeline)
        pipe = load_pipeline(
            server,
            params,
            pipe_type,
            worker.get_device(),
            embeddings=inversions,
            loras=loras,
        )

        outputs = []
        for source in sources.as_images():
            if is_debug():
                save_image(server, "tile-source.png", source)
                save_image(server, "tile-mask.png", tile_mask)

            # if the tile mask is all black, skip processing this tile
            # (PIL's getbbox() returns None when the image has no non-zero
            # pixels, so nothing would be painted).
            if not tile_mask.getbbox():
                outputs.append(source)
                continue

            # Clamp the latent size to the UNet tile size so the pipeline
            # never runs on a region larger than one tile.
            tile_size = params.unet_tile
            size = Size(*source.size)
            latent_size = size.min(tile_size, tile_size)

            # generate new latents or slice existing
            # NOTE(review): `latents` is reassigned here, so after the first
            # source the `else` branch slices the previously generated (or
            # previously sliced) latents rather than the caller's original
            # array — confirm this carryover across loop iterations is
            # intentional.
            if latents is None:
                latents = get_latents_from_seed(params.seed, latent_size, params.batch)
            else:
                latents = get_tile_latents(latents, params.seed, latent_size, dims)

            if params.is_lpw():
                # Long-prompt-weighting pipeline: torch generator, and the
                # dedicated `inpaint` entry point with (source, mask, prompt)
                # positional order.
                logger.debug("using LPW pipeline for inpaint")
                rng = torch.manual_seed(params.seed)
                result = pipe.inpaint(
                    source,
                    tile_mask,
                    prompt,
                    negative_prompt=negative_prompt,
                    height=latent_size.height,
                    width=latent_size.width,
                    num_inference_steps=params.steps,
                    guidance_scale=params.cfg,
                    generator=rng,
                    latents=latents,
                    callback=callback,
                )
            else:
                # encode and record alternative prompts outside of LPW
                # (skipped for SDXL, which handles prompt encoding itself).
                if not params.is_xl():
                    prompt_embeds = encode_prompt(
                        pipe, prompt_pairs, params.batch, params.do_cfg()
                    )
                    # Side effect: installs the encoded prompts on the UNet
                    # wrapper before the pipeline call below uses them.
                    pipe.unet.set_prompts(prompt_embeds)

                # Non-LPW path uses a numpy RNG and the default pipeline
                # call with (prompt, source, mask) positional order.
                rng = np.random.RandomState(params.seed)
                result = pipe(
                    prompt,
                    source,
                    tile_mask,
                    negative_prompt=negative_prompt,
                    height=latent_size.height,
                    width=latent_size.width,
                    num_inference_steps=params.steps,
                    guidance_scale=params.cfg,
                    generator=rng,
                    latents=latents,
                    callback=callback,
                )

            outputs.extend(result.images)

        # Preserve the incoming metadata alongside the painted images.
        return StageResult(images=outputs, metadata=sources.metadata)
|