onnx-web/api/onnx_web/chain/source_txt2img.py

from logging import getLogger
from typing import Optional, Tuple

import numpy as np
import torch
from PIL import Image

from ..diffusers.load import load_pipeline
from ..diffusers.utils import encode_prompt, get_latents_from_seed, get_tile_latents, parse_prompt
from ..params import ImageParams, Size, SizeChart, StageParams
from ..server import ServerContext
from ..worker import ProgressCallback, WorkerContext
from .stage import BaseStage

logger = getLogger(__name__)


class SourceTxt2ImgStage(BaseStage):
    """Chain stage that produces images from a text prompt (txt2img).

    Any source image handed to this stage is ignored; the output is created
    purely from the prompt, the seed, and (optionally) pre-generated latents.
    """

    # this stage declares no upper bound on its tile size
    max_tile = SizeChart.unlimited

    def run(
        self,
        job: WorkerContext,
        server: ServerContext,
        _stage: StageParams,
        params: ImageParams,
        _source: Image.Image,
        *,
        dims: Tuple[int, int, int],
        size: Size,
        callback: Optional[ProgressCallback] = None,
        latents: Optional[np.ndarray] = None,
        **kwargs,
    ) -> Image.Image:
        """Run the txt2img pipeline for a single tile or image.

        Args:
            job: worker context; supplies the device the pipeline is loaded on.
            server: server context passed through to ``load_pipeline``.
            _stage: stage parameters (unused by this stage).
            params: image parameters; overridden with any matching ``kwargs``
                through ``params.with_args``.
            _source: source image (unused, txt2img has no input image).
            dims: tile dimensions, forwarded to ``get_tile_latents`` when
                existing ``latents`` are being sliced.
            size: requested output size; overridden with any matching
                ``kwargs`` through ``size.with_args``.
            callback: optional progress callback forwarded to the pipeline.
            latents: optional pre-generated latents. When omitted, new latents
                are generated from ``params.seed``; otherwise the provided
                latents are sliced for this tile.
            **kwargs: extra stage arguments. A ``stage_source`` key only
                triggers a warning, since the source image is discarded.

        Returns:
            ``result.images`` from the pipeline call.
            NOTE(review): the annotation says ``Image.Image`` but the pipeline
            result attribute is plural and is presumably a list of images;
            confirm against callers before tightening the annotation.
        """
        params = params.with_args(**kwargs)
        size = size.with_args(**kwargs)

        logger.info(
            "generating image using txt2img, %s steps: %s", params.steps, params.prompt
        )

        if "stage_source" in kwargs:
            # Logger.warn is a deprecated alias, use Logger.warning instead
            logger.warning(
                "a source image was passed to a txt2img stage, and will be discarded"
            )

        prompt_pairs, loras, inversions, (prompt, negative_prompt) = parse_prompt(
            params
        )

        # presumably limits both dimensions to the tile size; confirm in Size.min
        tile_size = params.tiles
        latent_size = size.min(tile_size, tile_size)

        # generate new latents or slice existing
        if latents is None:
            latents = get_latents_from_seed(params.seed, latent_size, params.batch)
        else:
            latents = get_tile_latents(latents, dims, latent_size)

        pipe_type = params.get_valid_pipeline("txt2img")
        pipe = load_pipeline(
            server,
            params,
            pipe_type,
            job.get_device(),
            inversions=inversions,
            loras=loras,
        )

        # keyword arguments shared by both pipeline variants, built once so
        # the LPW and regular branches cannot drift apart
        pipe_args = dict(
            height=latent_size.height,
            width=latent_size.width,
            guidance_scale=params.cfg,
            latents=latents,
            negative_prompt=negative_prompt,
            num_images_per_prompt=params.batch,
            num_inference_steps=params.steps,
            eta=params.eta,
            callback=callback,
        )

        if params.lpw():
            logger.debug("using LPW pipeline for txt2img")
            # the LPW pipeline is seeded through torch
            rng = torch.manual_seed(params.seed)
            result = pipe.text2img(prompt, generator=rng, **pipe_args)
        else:
            # encode and record alternative prompts outside of LPW
            prompt_embeds = encode_prompt(
                pipe, prompt_pairs, params.batch, params.do_cfg()
            )
            pipe.unet.set_prompts(prompt_embeds)

            # the regular pipeline is seeded through a numpy random state
            rng = np.random.RandomState(params.seed)
            result = pipe(prompt, generator=rng, **pipe_args)

        return result.images
feat(api): switch to python logging 2023-01-28 23:09:19 +00:00			`from logging import getLogger`
fix(api): generate latents before tiling 2023-07-10 03:19:02 +00:00			`from typing import Optional, Tuple`
feat(api): synthesize a mask for outpaint stages 2023-01-28 14:37:17 +00:00
fix(api): switch RNG based on LPW parameter 2023-02-05 23:24:08 +00:00			`import numpy as np`
apply lint fixes again 2023-02-05 23:55:04 +00:00			`import torch`
lint(api): apply black and isort style 2023-02-05 13:53:26 +00:00			`from PIL import Image`

feat(api): parse alternative groups in prompts 2023-04-23 20:03:11 +00:00			`from ..diffusers.load import load_pipeline`
fix(api): improve handling of non-square images around tile size 2023-07-10 22:41:08 +00:00			`from ..diffusers.utils import encode_prompt, get_latents_from_seed, get_tile_latents, parse_prompt`
feat(api): pass tile size param to most pipeline stages 2023-07-02 23:54:10 +00:00			`from ..params import ImageParams, Size, SizeChart, StageParams`
background workers, logger 2023-02-26 05:49:39 +00:00			`from ..server import ServerContext`
lint all the new stuff 2023-02-26 20:15:30 +00:00			`from ..worker import ProgressCallback, WorkerContext`
lint(api): make all other stages inherit from base stage 2023-07-02 23:21:21 +00:00			`from .stage import BaseStage`
feat(api): synthesize a mask for outpaint stages 2023-01-28 14:37:17 +00:00
feat(api): switch to python logging 2023-01-28 23:09:19 +00:00			`logger = getLogger(__name__)`

feat(api): synthesize a mask for outpaint stages 2023-01-28 14:37:17 +00:00
lint(api): make all other stages inherit from base stage 2023-07-02 23:21:21 +00:00			`class SourceTxt2ImgStage(BaseStage):`
feat(api): pass tile size param to most pipeline stages 2023-07-02 23:54:10 +00:00			`max_tile = SizeChart.unlimited`

feat(api): make chain stages into classes with max tile size and step count estimate 2023-07-01 12:10:53 +00:00			`def run(`
			`self,`
			`job: WorkerContext,`
			`server: ServerContext,`
			`_stage: StageParams,`
			`params: ImageParams,`
			`_source: Image.Image,`
			`*,`
fix(api): generate latents before tiling 2023-07-10 03:19:02 +00:00			`dims: Tuple[int, int, int],`
feat(api): make chain stages into classes with max tile size and step count estimate 2023-07-01 12:10:53 +00:00			`size: Size,`
			`callback: Optional[ProgressCallback] = None,`
fix(api): generate latents before tiling 2023-07-10 03:19:02 +00:00			`latents: Optional[np.ndarray] = None,`
feat(api): make chain stages into classes with max tile size and step count estimate 2023-07-01 12:10:53 +00:00			`**kwargs,`
			`) -> Image.Image:`
			`params = params.with_args(**kwargs)`
			`size = size.with_args(**kwargs)`
linting 2023-07-09 05:02:27 +00:00
feat(api): make chain stages into classes with max tile size and step count estimate 2023-07-01 12:10:53 +00:00			`logger.info(`
			`"generating image using txt2img, %s steps: %s", params.steps, params.prompt`
lint(api): apply black and isort style 2023-02-05 13:53:26 +00:00			`)`
feat(api): synthesize a mask for outpaint stages 2023-01-28 14:37:17 +00:00
feat(api): make chain stages into classes with max tile size and step count estimate 2023-07-01 12:10:53 +00:00			`if "stage_source" in kwargs:`
			`logger.warn(`
			`"a source image was passed to a txt2img stage, and will be discarded"`
			`)`
feat(api): start using chain pipelines for all images 2023-06-30 04:06:36 +00:00
fix(api): keep network tokens while replacing wildcards in the saved prompt 2023-07-07 01:39:08 +00:00			`prompt_pairs, loras, inversions, (prompt, negative_prompt) = parse_prompt(`
			`params`
			`)`
linting 2023-07-09 05:02:27 +00:00
tiling in txt2img, subtiling in txt2img and img2img 2023-07-09 00:48:40 +00:00			`tile_size = params.tiles`
fix(api): improve handling of non-square images around tile size 2023-07-10 22:41:08 +00:00			`latent_size = size.min(tile_size, tile_size)`
use tile size when completing partial latents 2023-07-10 04:49:34 +00:00
fix(api): generate latents before tiling 2023-07-10 03:19:02 +00:00			`# generate new latents or slice existing`
			`if latents is None:`
tiling in txt2img, subtiling in txt2img and img2img 2023-07-09 00:48:40 +00:00			`latents = get_latents_from_seed(params.seed, latent_size, params.batch)`
linting 2023-07-09 05:02:27 +00:00			`else:`
fix(api): improve handling of non-square images around tile size 2023-07-10 22:41:08 +00:00			`latents = get_tile_latents(latents, dims, latent_size)`
linting 2023-07-09 05:02:27 +00:00
feat(api): make chain stages into classes with max tile size and step count estimate 2023-07-01 12:10:53 +00:00			`pipe_type = params.get_valid_pipeline("txt2img")`
			`pipe = load_pipeline(`
			`server,`
			`params,`
			`pipe_type,`
			`job.get_device(),`
			`inversions=inversions,`
			`loras=loras,`
fix(api): fully switch between LPW and regular ONNX pipelines 2023-02-05 23:36:00 +00:00			`)`
feat(api): start using chain pipelines for all images 2023-06-30 04:06:36 +00:00
feat(api): make chain stages into classes with max tile size and step count estimate 2023-07-01 12:10:53 +00:00			`if params.lpw():`
			`logger.debug("using LPW pipeline for txt2img")`
			`rng = torch.manual_seed(params.seed)`
			`result = pipe.text2img(`
fix(api): keep network tokens while replacing wildcards in the saved prompt 2023-07-07 01:39:08 +00:00			`prompt,`
fix(api): improve handling of non-square images around tile size 2023-07-10 22:41:08 +00:00			`height=latent_size.height,`
			`width=latent_size.width,`
feat(api): make chain stages into classes with max tile size and step count estimate 2023-07-01 12:10:53 +00:00			`generator=rng,`
			`guidance_scale=params.cfg,`
			`latents=latents,`
fix(api): keep network tokens while replacing wildcards in the saved prompt 2023-07-07 01:39:08 +00:00			`negative_prompt=negative_prompt,`
fix(api): pass batch size and eta params to txt2img stage 2023-07-04 22:24:37 +00:00			`num_images_per_prompt=params.batch,`
feat(api): make chain stages into classes with max tile size and step count estimate 2023-07-01 12:10:53 +00:00			`num_inference_steps=params.steps,`
fix(api): pass batch size and eta params to txt2img stage 2023-07-04 22:24:37 +00:00			`eta=params.eta,`
feat(api): make chain stages into classes with max tile size and step count estimate 2023-07-01 12:10:53 +00:00			`callback=callback,`
			`)`
			`else:`
			`# encode and record alternative prompts outside of LPW`
			`prompt_embeds = encode_prompt(`
			`pipe, prompt_pairs, params.batch, params.do_cfg()`
			`)`
			`pipe.unet.set_prompts(prompt_embeds)`

			`rng = np.random.RandomState(params.seed)`
			`result = pipe(`
fix(api): keep network tokens while replacing wildcards in the saved prompt 2023-07-07 01:39:08 +00:00			`prompt,`
fix(api): improve handling of non-square images around tile size 2023-07-10 22:41:08 +00:00			`height=latent_size.height,`
			`width=latent_size.width,`
feat(api): make chain stages into classes with max tile size and step count estimate 2023-07-01 12:10:53 +00:00			`generator=rng,`
			`guidance_scale=params.cfg,`
			`latents=latents,`
fix(api): keep network tokens while replacing wildcards in the saved prompt 2023-07-07 01:39:08 +00:00			`negative_prompt=negative_prompt,`
fix(api): pass batch size and eta params to txt2img stage 2023-07-04 22:24:37 +00:00			`num_images_per_prompt=params.batch,`
feat(api): make chain stages into classes with max tile size and step count estimate 2023-07-01 12:10:53 +00:00			`num_inference_steps=params.steps,`
fix(api): pass batch size and eta params to txt2img stage 2023-07-04 22:24:37 +00:00			`eta=params.eta,`
feat(api): make chain stages into classes with max tile size and step count estimate 2023-07-01 12:10:53 +00:00			`callback=callback,`
			`)`
feat(api): synthesize a mask for outpaint stages 2023-01-28 14:37:17 +00:00
feat(api): add support for wildcards 2023-07-04 21:41:54 +00:00			`return result.images`