# onnx-web/api/onnx_web/chain/blend_img2img.py

from logging import getLogger
from typing import List, Optional

import numpy as np
import torch
from PIL import Image

from ..diffusers.load import load_pipeline
from ..diffusers.utils import encode_prompt, parse_prompt, slice_prompt
from ..params import ImageParams, SizeChart, StageParams
from ..server import ServerContext
from ..worker import ProgressCallback, WorkerContext
from .stage import BaseStage

# Module-level logger, named after this module via __name__.
logger = getLogger(__name__)


class BlendImg2ImgStage(BaseStage):
    """Chain stage that passes every source image through an img2img pipeline.

    The pipeline is loaded once per call to ``run`` and then invoked once for
    each source image; all images produced are collected into a single list.
    """

    # this stage places no upper bound on the tile size
    max_tile = SizeChart.unlimited

    def run(
        self,
        worker: WorkerContext,
        server: ServerContext,
        _stage: StageParams,
        params: ImageParams,
        sources: List[Image.Image],
        *,
        strength: float,
        callback: Optional[ProgressCallback] = None,
        stage_source: Optional[Image.Image] = None,
        prompt_index: Optional[int] = None,
        **kwargs,
    ) -> List[Image.Image]:
        """Run img2img over each image in ``sources`` and return the results.

        Args:
            worker: Supplies the device on which the pipeline is loaded.
            server: Server context forwarded to ``load_pipeline``.
            _stage: Stage parameters; not used by this stage.
            params: Image parameters. Any extra ``kwargs`` are applied on top
                of them with ``with_args`` before anything else happens.
            sources: Images to process, one pipeline invocation per image.
            strength: Passed to the pipeline under a keyword that depends on
                the pipeline type: ``image_guidance_scale`` for pix2pix,
                ``controlnet_conditioning_scale`` for control pipelines, and
                ``strength`` for everything else.
            callback: Optional progress callback forwarded to the pipeline.
            stage_source: Accepted for signature compatibility; not used here.
            prompt_index: When given, the prompt is narrowed with
                ``slice_prompt`` so this stage uses its own part of a
                multi-stage prompt.
            **kwargs: Overrides applied to ``params``.

        Returns:
            The images from every pipeline result, in source order.
        """
        params = params.with_args(**kwargs)

        # multi-stage prompting: pick out the prompt that belongs to this stage
        if prompt_index is not None:
            stage_prompt = slice_prompt(params.prompt, prompt_index)
            params = params.with_args(prompt=stage_prompt)

        logger.info(
            "blending image using img2img, %s steps: %s", params.steps, params.prompt
        )

        parsed = parse_prompt(params)
        prompt_pairs, loras, inversions, (prompt, negative_prompt) = parsed

        pipe = load_pipeline(
            server,
            params,
            params.get_valid_pipeline("img2img"),
            worker.get_device(),
            inversions=inversions,
            loras=loras,
        )

        # the same strength value goes by a different keyword per pipeline type
        if params.is_pix2pix():
            strength_key = "image_guidance_scale"
        elif params.is_control():
            strength_key = "controlnet_conditioning_scale"
        else:
            strength_key = "strength"

        # keyword arguments common to both the LPW and the regular invocation
        shared_args = {
            "guidance_scale": params.cfg,
            "negative_prompt": negative_prompt,
            "num_inference_steps": params.steps,
            "callback": callback,
            strength_key: strength,
        }

        images: List[Image.Image] = []
        for source in sources:
            if not params.is_lpw():
                # encode and record alternative prompts outside of LPW; this is
                # deliberately repeated for every source image
                prompt_embeds = encode_prompt(
                    pipe, prompt_pairs, params.batch, params.do_cfg()
                )

                if not params.is_xl():
                    pipe.unet.set_prompts(prompt_embeds)

                # regular pipelines are given a numpy random state, re-seeded
                # for each source image
                rng = np.random.RandomState(params.seed)
                result = pipe(
                    prompt,
                    generator=rng,
                    image=source,
                    **shared_args,
                )
            else:
                logger.debug("using LPW pipeline for img2img")
                # the LPW pipeline is given a torch generator instead
                rng = torch.manual_seed(params.seed)
                result = pipe.img2img(
                    source,
                    prompt,
                    generator=rng,
                    **shared_args,
                )

            images.extend(result.images)

        return images

    def steps(
        self,
        params: ImageParams,
        *args,
    ) -> int:
        """Return the step count for this stage: ``params.steps`` as-is."""
        # TODO: multiply by strength
        return params.steps

    def outputs(
        self,
        params: ImageParams,
        sources: int,
    ) -> int:
        """Return the output image count for ``sources`` inputs: ``sources + 1``."""
        # NOTE(review): run() only collects the images produced for each
        # source, so the extra +1 looks unexpected - confirm against the caller
        return sources + 1
feat(api): switch to python logging 2023-01-28 23:09:19 +00:00			`from logging import getLogger`
feat(api): make pipeline stages support multiple images 2023-07-04 18:29:58 +00:00			`from typing import List, Optional`
feat(api): synthesize a mask for outpaint stages 2023-01-28 14:37:17 +00:00
fix(api): switch RNG based on LPW parameter 2023-02-05 23:24:08 +00:00			`import numpy as np`
apply lint fixes again 2023-02-05 23:55:04 +00:00			`import torch`
lint(api): apply black and isort style 2023-02-05 13:53:26 +00:00			`from PIL import Image`

fix(api): correct imports 2023-03-05 04:25:49 +00:00			`from ..diffusers.load import load_pipeline`
feat(api): add an experimental multi-prompt syntax 2023-08-26 04:31:43 +00:00			`from ..diffusers.utils import encode_prompt, parse_prompt, slice_prompt`
fix(api): remove tile size limit for img2img and outpaint stages 2023-07-05 22:16:30 +00:00			`from ..params import ImageParams, SizeChart, StageParams`
background workers, logger 2023-02-26 05:49:39 +00:00			`from ..server import ServerContext`
lint all the new stuff 2023-02-26 20:15:30 +00:00			`from ..worker import ProgressCallback, WorkerContext`
lint(api): make all other stages inherit from base stage 2023-07-02 23:21:21 +00:00			`from .stage import BaseStage`
feat(api): synthesize a mask for outpaint stages 2023-01-28 14:37:17 +00:00
feat(api): switch to python logging 2023-01-28 23:09:19 +00:00			`logger = getLogger(__name__)`

feat(api): synthesize a mask for outpaint stages 2023-01-28 14:37:17 +00:00
lint(api): make all other stages inherit from base stage 2023-07-02 23:21:21 +00:00			`class BlendImg2ImgStage(BaseStage):`
fix(api): remove tile size limit for img2img and outpaint stages 2023-07-05 22:16:30 +00:00			`max_tile = SizeChart.unlimited`

feat(api): make chain stages into classes with max tile size and step count estimate 2023-07-01 12:10:53 +00:00			`def run(`
			`self,`
lint(api): use more accurate worker name throughout 2023-07-15 23:54:54 +00:00			`worker: WorkerContext,`
feat(api): make chain stages into classes with max tile size and step count estimate 2023-07-01 12:10:53 +00:00			`server: ServerContext,`
			`_stage: StageParams,`
			`params: ImageParams,`
feat(api): make pipeline stages support multiple images 2023-07-04 18:29:58 +00:00			`sources: List[Image.Image],`
feat(api): make chain stages into classes with max tile size and step count estimate 2023-07-01 12:10:53 +00:00			`*,`
			`strength: float,`
			`callback: Optional[ProgressCallback] = None,`
			`stage_source: Optional[Image.Image] = None,`
feat(api): allow a different prompt for each highres stage 2023-08-30 01:53:16 +00:00			`prompt_index: Optional[int] = None,`
feat(api): make chain stages into classes with max tile size and step count estimate 2023-07-01 12:10:53 +00:00			`**kwargs,`
feat(api): make pipeline stages support multiple images 2023-07-04 18:29:58 +00:00			`) -> List[Image.Image]:`
feat(api): make chain stages into classes with max tile size and step count estimate 2023-07-01 12:10:53 +00:00			`params = params.with_args(**kwargs)`
feat(api): add an experimental multi-prompt syntax 2023-08-26 04:31:43 +00:00
feat(api): allow a different prompt for each highres stage 2023-08-30 01:53:16 +00:00			`# multi-stage prompting`
			`if prompt_index is not None:`
			`params = params.with_args(prompt=slice_prompt(params.prompt, prompt_index))`
feat(api): add an experimental multi-prompt syntax 2023-08-26 04:31:43 +00:00
feat(api): make chain stages into classes with max tile size and step count estimate 2023-07-01 12:10:53 +00:00			`logger.info(`
			`"blending image using img2img, %s steps: %s", params.steps, params.prompt`
			`)`
feat(api): synthesize a mask for outpaint stages 2023-01-28 14:37:17 +00:00
fix(api): keep network tokens while replacing wildcards in the saved prompt 2023-07-07 01:39:08 +00:00			`prompt_pairs, loras, inversions, (prompt, negative_prompt) = parse_prompt(`
			`params`
			`)`
feat(api): start using chain pipelines for all images 2023-06-30 04:06:36 +00:00
feat(api): make chain stages into classes with max tile size and step count estimate 2023-07-01 12:10:53 +00:00			`pipe_type = params.get_valid_pipeline("img2img")`
			`pipe = load_pipeline(`
			`server,`
			`params,`
			`pipe_type,`
lint(api): use more accurate worker name throughout 2023-07-15 23:54:54 +00:00			`worker.get_device(),`
feat(api): make chain stages into classes with max tile size and step count estimate 2023-07-01 12:10:53 +00:00			`inversions=inversions,`
			`loras=loras,`
			`)`
feat(api): start using chain pipelines for all images 2023-06-30 04:06:36 +00:00
feat(api): make chain stages into classes with max tile size and step count estimate 2023-07-01 12:10:53 +00:00			`pipe_params = {}`
feat(api): support for SDXL LoRAs 2023-08-26 04:33:41 +00:00			`if params.is_pix2pix():`
			`pipe_params["image_guidance_scale"] = strength`
			`elif params.is_control():`
feat(api): make chain stages into classes with max tile size and step count estimate 2023-07-01 12:10:53 +00:00			`pipe_params["controlnet_conditioning_scale"] = strength`
feat(api): support for SDXL LoRAs 2023-08-26 04:33:41 +00:00			`else:`
fix(api): pass strength to LPW pipe from img2img blend 2023-07-03 13:27:37 +00:00			`pipe_params["strength"] = strength`
feat(api): start using chain pipelines for all images 2023-06-30 04:06:36 +00:00
feat(api): make pipeline stages support multiple images 2023-07-04 18:29:58 +00:00			`outputs = []`
			`for source in sources:`
skip loading component models for XL 2023-08-21 03:28:08 +00:00			`if params.is_lpw():`
feat(api): make pipeline stages support multiple images 2023-07-04 18:29:58 +00:00			`logger.debug("using LPW pipeline for img2img")`
			`rng = torch.manual_seed(params.seed)`
			`result = pipe.img2img(`
			`source,`
fix(api): keep network tokens while replacing wildcards in the saved prompt 2023-07-07 01:39:08 +00:00			`prompt,`
feat(api): make pipeline stages support multiple images 2023-07-04 18:29:58 +00:00			`generator=rng,`
			`guidance_scale=params.cfg,`
fix(api): keep network tokens while replacing wildcards in the saved prompt 2023-07-07 01:39:08 +00:00			`negative_prompt=negative_prompt,`
feat(api): make pipeline stages support multiple images 2023-07-04 18:29:58 +00:00			`num_inference_steps=params.steps,`
			`callback=callback,`
			`**pipe_params,`
			`)`
			`else:`
			`# encode and record alternative prompts outside of LPW`
			`prompt_embeds = encode_prompt(`
			`pipe, prompt_pairs, params.batch, params.do_cfg()`
			`)`
skip loading component models for XL 2023-08-21 03:28:08 +00:00
make highres work with SDXL and use a full-size txt2img stage 2023-08-22 01:46:05 +00:00			`if not params.is_xl():`
skip loading component models for XL 2023-08-21 03:28:08 +00:00			`pipe.unet.set_prompts(prompt_embeds)`
feat(api): start using chain pipelines for all images 2023-06-30 04:06:36 +00:00
feat(api): make pipeline stages support multiple images 2023-07-04 18:29:58 +00:00			`rng = np.random.RandomState(params.seed)`
			`result = pipe(`
fix(api): keep network tokens while replacing wildcards in the saved prompt 2023-07-07 01:39:08 +00:00			`prompt,`
feat(api): make pipeline stages support multiple images 2023-07-04 18:29:58 +00:00			`generator=rng,`
			`guidance_scale=params.cfg,`
			`image=source,`
fix(api): keep network tokens while replacing wildcards in the saved prompt 2023-07-07 01:39:08 +00:00			`negative_prompt=negative_prompt,`
feat(api): make pipeline stages support multiple images 2023-07-04 18:29:58 +00:00			`num_inference_steps=params.steps,`
			`callback=callback,`
			`**pipe_params,`
			`)`
feat(api): synthesize a mask for outpaint stages 2023-01-28 14:37:17 +00:00
feat(api): make pipeline stages support multiple images 2023-07-04 18:29:58 +00:00			`outputs.extend(result.images)`
feat(api): synthesize a mask for outpaint stages 2023-01-28 14:37:17 +00:00
feat(api): make pipeline stages support multiple images 2023-07-04 18:29:58 +00:00			`return outputs`
feat(api): attempt to calculate total steps for chain pipelines 2023-09-12 23:16:16 +00:00
			`def steps(`
			`self,`
			`params: ImageParams,`
			`*args,`
			`) -> int:`
			`return params.steps # TODO: multiply by strength`

			`def outputs(`
			`self,`
			`params: ImageParams,`
			`sources: int,`
			`) -> int:`
			`return sources + 1`