From bea5a3c935ab822d0d46c5efa55617dee1a70407 Mon Sep 17 00:00:00 2001 From: BZLibby Date: Tue, 5 Sep 2023 18:56:00 -0500 Subject: [PATCH 001/240] rebase diffuser change --- api/onnx_web/models/cnet.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/api/onnx_web/models/cnet.py b/api/onnx_web/models/cnet.py index 1c9a9a02..71c4b4d0 100644 --- a/api/onnx_web/models/cnet.py +++ b/api/onnx_web/models/cnet.py @@ -24,7 +24,7 @@ import torch.nn as nn import torch.utils.checkpoint from diffusers.configuration_utils import ConfigMixin, register_to_config from diffusers.loaders import UNet2DConditionLoadersMixin -from diffusers.models.cross_attention import AttnProcessor +from diffusers.models.attention_processor import AttnProcessor from diffusers.models.embeddings import ( GaussianFourierProjection, TimestepEmbedding, From 0fa03e77ad175b0f8756b138ddc2ed2b793655b9 Mon Sep 17 00:00:00 2001 From: Sean Sube Date: Sun, 10 Sep 2023 11:26:18 -0500 Subject: [PATCH 002/240] feat: add panorama pipeline for SDXL --- api/onnx_web/diffusers/load.py | 33 +- api/onnx_web/diffusers/patches/vae.py | 4 +- .../diffusers/pipelines/panorama_xl.py | 664 ++++++++++++++++++ api/onnx_web/params.py | 6 +- gui/src/strings/de.ts | 1 + gui/src/strings/en.ts | 1 + gui/src/strings/es.ts | 1 + gui/src/strings/fr.ts | 1 + 8 files changed, 693 insertions(+), 18 deletions(-) create mode 100644 api/onnx_web/diffusers/pipelines/panorama_xl.py diff --git a/api/onnx_web/diffusers/load.py b/api/onnx_web/diffusers/load.py index 78123449..36a35b7a 100644 --- a/api/onnx_web/diffusers/load.py +++ b/api/onnx_web/diffusers/load.py @@ -24,6 +24,7 @@ from .patches.vae import VAEWrapper from .pipelines.controlnet import OnnxStableDiffusionControlNetPipeline from .pipelines.lpw import OnnxStableDiffusionLongPromptWeightingPipeline from .pipelines.panorama import OnnxStableDiffusionPanoramaPipeline +from .pipelines.panorama_xl import ORTStableDiffusionXLPanoramaPipeline from .pipelines.pix2pix import OnnxStableDiffusionInstructPix2PixPipeline from .version_safe_diffusers import ( DDIMScheduler, @@ -58,6 +59,7 @@ available_pipelines = { # "inpaint-sdxl": ORTStableDiffusionXLInpaintPipeline, "lpw": OnnxStableDiffusionLongPromptWeightingPipeline, "panorama": OnnxStableDiffusionPanoramaPipeline, + "panorama-sdxl": ORTStableDiffusionXLPanoramaPipeline, "pix2pix": OnnxStableDiffusionInstructPix2PixPipeline, "txt2img-sdxl": ORTStableDiffusionXLPipeline, "txt2img": OnnxStableDiffusionPipeline, @@ -399,7 +401,6 @@ def load_pipeline( ) # make sure XL models are actually being used - # TODO: why is this needed? 
if "text_encoder_session" in components: logger.info( "text encoder matches: %s, %s", @@ -424,23 +425,23 @@ def load_pipeline( pipe.unet.session == components["unet_session"], type(pipe.unet), ) + pipe.unet = None + run_gc([device]) pipe.unet = ORTModelUnet(unet_session, unet_model) if not server.show_progress: pipe.set_progress_bar_config(disable=True) optimize_pipeline(server, pipe) - - if not params.is_xl(): - patch_pipeline(server, pipe, pipeline, pipeline_class, params) + patch_pipeline(server, pipe, pipeline_class, params) server.cache.set(ModelTypes.diffusion, pipe_key, pipe) server.cache.set(ModelTypes.scheduler, scheduler_key, components["scheduler"]) - if not params.is_xl() and hasattr(pipe, "vae_decoder"): + if hasattr(pipe, "vae_decoder"): pipe.vae_decoder.set_tiled(tiled=params.tiled_vae) - if not params.is_xl() and hasattr(pipe, "vae_encoder"): + if hasattr(pipe, "vae_encoder"): pipe.vae_encoder.set_tiled(tiled=params.tiled_vae) # update panorama params @@ -514,17 +515,18 @@ def optimize_pipeline( def patch_pipeline( server: ServerContext, pipe: StableDiffusionPipeline, - pipe_type: str, pipeline: Any, params: ImageParams, ) -> None: logger.debug("patching SD pipeline") - if pipe_type != "lpw": + if params.is_lpw(): pipe._encode_prompt = expand_prompt.__get__(pipe, pipeline) - original_unet = pipe.unet - pipe.unet = UNetWrapper(server, original_unet) + if not params.is_xl(): + original_unet = pipe.unet + pipe.unet = UNetWrapper(server, original_unet) + logger.debug("patched UNet with wrapper") if hasattr(pipe, "vae_decoder"): original_decoder = pipe.vae_decoder @@ -535,6 +537,9 @@ def patch_pipeline( window=params.tiles, overlap=params.overlap, ) + logger.debug("patched VAE decoder with wrapper") + + if hasattr(pipe, "vae_encoder"): original_encoder = pipe.vae_encoder pipe.vae_encoder = VAEWrapper( server, @@ -543,7 +548,7 @@ def patch_pipeline( window=params.tiles, overlap=params.overlap, ) - elif hasattr(pipe, "vae"): - pass # TODO: current wrapper does not work with upscaling VAE - else: - logger.debug("no VAE found to patch") + logger.debug("patched VAE encoder with wrapper") + + if hasattr(pipe, "vae"): + logger.warning("not patching single VAE, tiled VAE may not work") diff --git a/api/onnx_web/diffusers/patches/vae.py b/api/onnx_web/diffusers/patches/vae.py index c5fd6936..48e9358e 100644 --- a/api/onnx_web/diffusers/patches/vae.py +++ b/api/onnx_web/diffusers/patches/vae.py @@ -39,11 +39,13 @@ class VAEWrapper(object): self.tile_overlap_factor = overlap def __call__(self, latent_sample=None, sample=None, **kwargs): + model = self.wrapped.model if hasattr(self.wrapped, "model") else self.wrapped.session + # set timestep dtype to input type sample_dtype = next( ( input.type - for input in self.wrapped.model.get_inputs() + for input in model.get_inputs() if input.name == "sample" or input.name == "latent_sample" ), "tensor(float)", diff --git a/api/onnx_web/diffusers/pipelines/panorama_xl.py b/api/onnx_web/diffusers/pipelines/panorama_xl.py new file mode 100644 index 00000000..5092cae0 --- /dev/null +++ b/api/onnx_web/diffusers/pipelines/panorama_xl.py @@ -0,0 +1,664 @@ +from optimum.onnxruntime.modeling_diffusion import ORTStableDiffusionXLPipelineBase +from optimum.pipelines.diffusers.pipeline_stable_diffusion_xl_img2img import StableDiffusionXLImg2ImgPipelineMixin +from optimum.pipelines.diffusers.pipeline_utils import preprocess, rescale_noise_cfg +from diffusers.pipelines.stable_diffusion_xl import StableDiffusionXLPipelineOutput +import logging +from typing import 
Any, Optional, List, Union, Tuple, Callable, Dict
+import torch
+import numpy as np
+import PIL
+import inspect
+
+logger = logging.getLogger(__name__)
+
+
+DEFAULT_WINDOW = 64
+DEFAULT_STRIDE = 16
+
+
+class StableDiffusionXLPanoramaPipelineMixin(StableDiffusionXLImg2ImgPipelineMixin):
+    def __init__(
+        self,
+        *args,
+        window: int = DEFAULT_WINDOW,
+        stride: int = DEFAULT_STRIDE,
+        **kwargs,
+    ):
+        super().__init__(*args, **kwargs)
+
+        self.window = window
+        self.stride = stride
+
+
+    def set_window_size(self, window: int, stride: int):
+        self.window = window
+        self.stride = stride
+
+
+    def get_views(self, panorama_height, panorama_width, window_size, stride):
+        # Here, we define the mappings F_i (see Eq. 7 in the MultiDiffusion paper https://arxiv.org/abs/2302.08113)
+        panorama_height /= 8
+        panorama_width /= 8
+
+        num_blocks_height = abs((panorama_height - window_size) // stride) + 1
+        num_blocks_width = abs((panorama_width - window_size) // stride) + 1
+        total_num_blocks = int(num_blocks_height * num_blocks_width)
+        logger.debug(
+            "panorama generated %s views, %s by %s blocks",
+            total_num_blocks,
+            num_blocks_height,
+            num_blocks_width,
+        )
+
+        views = []
+        for i in range(total_num_blocks):
+            h_start = int((i // num_blocks_width) * stride)
+            h_end = h_start + window_size
+            w_start = int((i % num_blocks_width) * stride)
+            w_end = w_start + window_size
+            views.append((h_start, h_end, w_start, w_end))
+
+        return views
+
+
+    # Adapted from diffusers.pipelines.stable_diffusion.pipeline_stable_diffusion.StableDiffusionPipeline.prepare_latents
+    def prepare_latents_img2img(self, image, timestep, batch_size, num_images_per_prompt, dtype, generator=None):
+        batch_size = batch_size * num_images_per_prompt
+
+        if image.shape[1] == 4:
+            init_latents = image
+        else:
+            init_latents = self.vae_encoder(sample=image)[0] * self.vae_decoder.config.get("scaling_factor", 0.18215)
+
+        if batch_size > init_latents.shape[0] and batch_size % init_latents.shape[0] == 0:
+            # expand init_latents for batch_size
+            additional_image_per_prompt = batch_size // init_latents.shape[0]
+            init_latents = np.concatenate([init_latents] * additional_image_per_prompt, axis=0)
+        elif batch_size > init_latents.shape[0] and batch_size % init_latents.shape[0] != 0:
+            raise ValueError(
+                f"Cannot duplicate `image` of batch size {init_latents.shape[0]} to {batch_size} text prompts."
+            )
+        else:
+            init_latents = np.concatenate([init_latents], axis=0)
+
+        # add noise to latents using the timesteps
+        noise = generator.randn(*init_latents.shape).astype(dtype)
+        init_latents = self.scheduler.add_noise(
+            torch.from_numpy(init_latents), torch.from_numpy(noise), torch.from_numpy(timestep)
+        )
+        return init_latents.numpy()
+
+
+    # Adapted from diffusers.pipelines.stable_diffusion.pipeline_stable_diffusion.StableDiffusionPipeline.prepare_latents
+    def prepare_latents_text2img(self, batch_size, num_channels_latents, height, width, dtype, generator, latents=None):
+        shape = (batch_size, num_channels_latents, height // self.vae_scale_factor, width // self.vae_scale_factor)
+        if isinstance(generator, list) and len(generator) != batch_size:
+            raise ValueError(
+                f"You have passed a list of generators of length {len(generator)}, but requested an effective batch"
+                f" size of {batch_size}. Make sure the batch size matches the length of the generators."
+ ) + + if latents is None: + latents = generator.randn(*shape).astype(dtype) + elif latents.shape != shape: + raise ValueError(f"Unexpected latents shape, got {latents.shape}, expected {shape}") + + # scale the initial noise by the standard deviation required by the scheduler + latents = latents * np.float64(self.scheduler.init_noise_sigma) + + return latents + + + # Adapted from diffusers.pipelines.stable_diffusion.pipeline_stable_diffusion.StableDiffusionPipeline.prepare_extra_step_kwargs + def prepare_extra_step_kwargs(self, generator, eta): + # prepare extra kwargs for the scheduler step, since not all schedulers have the same signature + # eta (η) is only used with the DDIMScheduler, it will be ignored for other schedulers. + # eta corresponds to η in DDIM paper: https://arxiv.org/abs/2010.02502 + # and should be between [0, 1] + + extra_step_kwargs = {} + + accepts_eta = "eta" in set(inspect.signature(self.scheduler.step).parameters.keys()) + if accepts_eta: + extra_step_kwargs["eta"] = eta + + return extra_step_kwargs + + + # Adapted from diffusers.pipelines.stable_diffusion_xl.pipeline_stable_diffusion_xl.StableDiffusionXLPipeline.__call__ + def text2img( + self, + prompt: Optional[Union[str, List[str]]] = None, + height: Optional[int] = None, + width: Optional[int] = None, + num_inference_steps: int = 50, + guidance_scale: float = 5.0, + negative_prompt: Optional[Union[str, List[str]]] = None, + num_images_per_prompt: int = 1, + eta: float = 0.0, + generator: Optional[np.random.RandomState] = None, + latents: Optional[np.ndarray] = None, + prompt_embeds: Optional[np.ndarray] = None, + negative_prompt_embeds: Optional[np.ndarray] = None, + pooled_prompt_embeds: Optional[np.ndarray] = None, + negative_pooled_prompt_embeds: Optional[np.ndarray] = None, + output_type: str = "pil", + return_dict: bool = True, + callback: Optional[Callable[[int, int, np.ndarray], None]] = None, + callback_steps: int = 1, + cross_attention_kwargs: Optional[Dict[str, Any]] = None, + guidance_rescale: float = 0.0, + original_size: Optional[Tuple[int, int]] = None, + crops_coords_top_left: Tuple[int, int] = (0, 0), + target_size: Optional[Tuple[int, int]] = None, + ): + r""" + Function invoked when calling the pipeline for generation. + + Args: + prompt (`Optional[Union[str, List[str]]]`, defaults to None): + The prompt or prompts to guide the image generation. If not defined, one has to pass `prompt_embeds`. + instead. + height (`Optional[int]`, defaults to None): + The height in pixels of the generated image. + width (`Optional[int]`, defaults to None): + The width in pixels of the generated image. + num_inference_steps (`int`, defaults to 50): + The number of denoising steps. More denoising steps usually lead to a higher quality image at the + expense of slower inference. + guidance_scale (`float`, defaults to 5): + Guidance scale as defined in [Classifier-Free Diffusion Guidance](https://arxiv.org/abs/2207.12598). + `guidance_scale` is defined as `w` of equation 2. of [Imagen + Paper](https://arxiv.org/pdf/2205.11487.pdf). Guidance scale is enabled by setting `guidance_scale > + 1`. Higher guidance scale encourages to generate images that are closely linked to the text `prompt`, + usually at the expense of lower image quality. + negative_prompt (`Optional[Union[str, list]]`): + The prompt or prompts not to guide the image generation. If not defined, one has to pass + `negative_prompt_embeds`. instead. Ignored when not using guidance (i.e., ignored if `guidance_scale` + is less than `1`). 
+ num_images_per_prompt (`int`, defaults to 1): + The number of images to generate per prompt. + eta (`float`, defaults to 0.0): + Corresponds to parameter eta (η) in the DDIM paper: https://arxiv.org/abs/2010.02502. Only applies to + [`schedulers.DDIMScheduler`], will be ignored for others. + generator (`Optional[np.random.RandomState]`, defaults to `None`):: + A np.random.RandomState to make generation deterministic. + latents (`Optional[np.ndarray]`, defaults to `None`): + Pre-generated noisy latents, sampled from a Gaussian distribution, to be used as inputs for image + generation. Can be used to tweak the same generation with different prompts. If not provided, a latents + tensor will ge generated by sampling using the supplied random `generator`. + prompt_embeds (`Optional[np.ndarray]`, defaults to `None`): + Pre-generated text embeddings. Can be used to easily tweak text inputs, *e.g.* prompt weighting. If not + provided, text embeddings will be generated from `prompt` input argument. + negative_prompt_embeds (`Optional[np.ndarray]`, defaults to `None`): + Pre-generated negative text embeddings. Can be used to easily tweak text inputs, *e.g.* prompt + weighting. If not provided, negative_prompt_embeds will be generated from `negative_prompt` input + argument. + output_type (`str`, defaults to `"pil"`): + The output format of the generate image. Choose between + [PIL](https://pillow.readthedocs.io/en/stable/): `PIL.Image.Image` or `np.array`. + return_dict (`bool`, defaults to `True`): + Whether or not to return a [`~pipelines.stable_diffusion.StableDiffusionXLPipelineOutput`] instead of a + plain tuple. + callback (Optional[Callable], defaults to `None`): + A function that will be called every `callback_steps` steps during inference. The function will be + called with the following arguments: `callback(step: int, timestep: int, latents: torch.FloatTensor)`. + callback_steps (`int`, defaults to 1): + The frequency at which the `callback` function will be called. If not specified, the callback will be + called at every step. + guidance_rescale (`float`, defaults to 0.7): + Guidance rescale factor proposed by [Common Diffusion Noise Schedules and Sample Steps are + Flawed](https://arxiv.org/pdf/2305.08891.pdf) `guidance_scale` is defined as `φ` in equation 16. of + [Common Diffusion Noise Schedules and Sample Steps are Flawed](https://arxiv.org/pdf/2305.08891.pdf). + Guidance rescale factor should fix overexposure when using zero terminal SNR. + + Returns: + [`~pipelines.stable_diffusion.StableDiffusionXLPipelineOutput`] or `tuple`: + [`~pipelines.stable_diffusion.StableDiffusionXLPipelineOutput`] if `return_dict` is True, otherwise a `tuple. + When returning a tuple, the first element is a list with the generated images, and the second element is a + list of `bool`s denoting whether the corresponding generated image likely represents "not-safe-for-work" + (nsfw) content, according to the `safety_checker`. + """ + + # 0. Default height and width to unet + height = height or self.unet.config["sample_size"] * self.vae_scale_factor + width = width or self.unet.config["sample_size"] * self.vae_scale_factor + + original_size = original_size or (height, width) + target_size = target_size or (height, width) + + # 1. Check inputs. Raise error if not correct + self.check_inputs( + prompt, + 1.0, + callback_steps, + negative_prompt, + prompt_embeds, + negative_prompt_embeds, + ) + + # 2. 
Define call parameters + if isinstance(prompt, str): + batch_size = 1 + elif isinstance(prompt, list): + batch_size = len(prompt) + else: + batch_size = prompt_embeds.shape[0] + + if generator is None: + generator = np.random + + # here `guidance_scale` is defined analog to the guidance weight `w` of equation (2) + # of the Imagen paper: https://arxiv.org/pdf/2205.11487.pdf . `guidance_scale = 1` + # corresponds to doing no classifier free guidance. + do_classifier_free_guidance = guidance_scale > 1.0 + + # 3. Encode input prompt + ( + prompt_embeds, + negative_prompt_embeds, + pooled_prompt_embeds, + negative_pooled_prompt_embeds, + ) = self._encode_prompt( + prompt, + num_images_per_prompt, + do_classifier_free_guidance, + negative_prompt, + prompt_embeds=prompt_embeds, + negative_prompt_embeds=negative_prompt_embeds, + pooled_prompt_embeds=pooled_prompt_embeds, + negative_pooled_prompt_embeds=negative_pooled_prompt_embeds, + ) + + # 4. Prepare timesteps + self.scheduler.set_timesteps(num_inference_steps) + timesteps = self.scheduler.timesteps + + # 5. Prepare latent variables + latents = self.prepare_latents_text2img( + batch_size * num_images_per_prompt, + self.unet.config.get("in_channels", 4), + height, + width, + prompt_embeds.dtype, + generator, + latents, + ) + + # 6. Prepare extra step kwargs + extra_step_kwargs = self.prepare_extra_step_kwargs(generator, eta) + + # 7. Prepare added time ids & embeddings + add_text_embeds = pooled_prompt_embeds + add_time_ids = (original_size + crops_coords_top_left + target_size,) + add_time_ids = np.array(add_time_ids, dtype=prompt_embeds.dtype) + + if do_classifier_free_guidance: + prompt_embeds = np.concatenate((negative_prompt_embeds, prompt_embeds), axis=0) + add_text_embeds = np.concatenate((negative_pooled_prompt_embeds, add_text_embeds), axis=0) + add_time_ids = np.concatenate((add_time_ids, add_time_ids), axis=0) + add_time_ids = np.repeat(add_time_ids, batch_size * num_images_per_prompt, axis=0) + + # Adapted from diffusers to extend it for other runtimes than ORT + timestep_dtype = self.unet.input_dtype.get("timestep", np.float32) + + # 8. Panorama additions + views = self.get_views(height, width, self.window, self.stride) + count = np.zeros_like(latents) + value = np.zeros_like(latents) + + # 8. Denoising loop + num_warmup_steps = len(timesteps) - num_inference_steps * self.scheduler.order + for i, t in enumerate(self.progress_bar(timesteps)): + count.fill(0) + value.fill(0) + + for h_start, h_end, w_start, w_end in views: + # get the latents corresponding to the current view coordinates + latents_for_view = latents[:, :, h_start:h_end, w_start:w_end] + + # expand the latents if we are doing classifier free guidance + latent_model_input = np.concatenate([latents_for_view] * 2) if do_classifier_free_guidance else latents_for_view + latent_model_input = self.scheduler.scale_model_input(torch.from_numpy(latent_model_input), t) + latent_model_input = latent_model_input.cpu().numpy() + + # predict the noise residual + timestep = np.array([t], dtype=timestep_dtype) + noise_pred = self.unet( + sample=latent_model_input, + timestep=timestep, + encoder_hidden_states=prompt_embeds, + text_embeds=add_text_embeds, + time_ids=add_time_ids, + ) + noise_pred = noise_pred[0] + + # perform guidance + if do_classifier_free_guidance: + noise_pred_uncond, noise_pred_text = np.split(noise_pred, 2) + noise_pred = noise_pred_uncond + guidance_scale * (noise_pred_text - noise_pred_uncond) + if guidance_rescale > 0.0: + # Based on 3.4. 
in https://arxiv.org/pdf/2305.08891.pdf
+                        noise_pred = rescale_noise_cfg(noise_pred, noise_pred_text, guidance_rescale=guidance_rescale)
+
+                # compute the previous noisy sample x_t -> x_t-1
+                scheduler_output = self.scheduler.step(
+                    torch.from_numpy(noise_pred), t, torch.from_numpy(latents_for_view), **extra_step_kwargs
+                )
+                latents_view_denoised = scheduler_output.prev_sample.numpy()
+
+                value[:, :, h_start:h_end, w_start:w_end] += latents_view_denoised
+                count[:, :, h_start:h_end, w_start:w_end] += 1
+
+            # take the MultiDiffusion step. Eq. 5 in MultiDiffusion paper: https://arxiv.org/abs/2302.08113
+            latents = np.where(count > 0, value / count, value)
+
+            # call the callback, if provided
+            if i == len(timesteps) - 1 or ((i + 1) > num_warmup_steps and (i + 1) % self.scheduler.order == 0):
+                if callback is not None and i % callback_steps == 0:
+                    callback(i, t, latents)
+
+        if output_type == "latent":
+            image = latents
+        else:
+            latents = latents / self.vae_decoder.config.get("scaling_factor", 0.18215)
+            # it seems like there is a strange result for using half-precision vae decoder if batchsize>1
+            image = np.concatenate(
+                [self.vae_decoder(latent_sample=latents[i : i + 1])[0] for i in range(latents.shape[0])]
+            )
+            image = self.watermark.apply_watermark(image)
+
+        # TODO: add image_processor
+        image = np.clip(image / 2 + 0.5, 0, 1).transpose((0, 2, 3, 1))
+
+        if output_type == "pil":
+            image = self.numpy_to_pil(image)
+
+        if not return_dict:
+            return (image,)
+
+        return StableDiffusionXLPipelineOutput(images=image)
+
+
+    # Adapted from diffusers.pipelines.stable_diffusion_xl.pipeline_stable_diffusion_xl.StableDiffusionXLPipeline.__call__
+    def img2img(
+        self,
+        prompt: Optional[Union[str, List[str]]] = None,
+        image: Union[np.ndarray, PIL.Image.Image] = None,
+        strength: float = 0.3,
+        num_inference_steps: int = 50,
+        guidance_scale: float = 5.0,
+        negative_prompt: Optional[Union[str, List[str]]] = None,
+        num_images_per_prompt: int = 1,
+        eta: float = 0.0,
+        generator: Optional[np.random.RandomState] = None,
+        latents: Optional[np.ndarray] = None,
+        prompt_embeds: Optional[np.ndarray] = None,
+        negative_prompt_embeds: Optional[np.ndarray] = None,
+        pooled_prompt_embeds: Optional[np.ndarray] = None,
+        negative_pooled_prompt_embeds: Optional[np.ndarray] = None,
+        output_type: str = "pil",
+        return_dict: bool = True,
+        callback: Optional[Callable[[int, int, np.ndarray], None]] = None,
+        callback_steps: int = 1,
+        cross_attention_kwargs: Optional[Dict[str, Any]] = None,
+        guidance_rescale: float = 0.0,
+        original_size: Optional[Tuple[int, int]] = None,
+        crops_coords_top_left: Tuple[int, int] = (0, 0),
+        target_size: Optional[Tuple[int, int]] = None,
+        aesthetic_score: float = 6.0,
+        negative_aesthetic_score: float = 2.5,
+    ):
+        r"""
+        Function invoked when calling the pipeline for generation.
+
+        Args:
+            prompt (`Optional[Union[str, List[str]]]`, defaults to None):
+                The prompt or prompts to guide the image generation. If not defined, one has to pass `prompt_embeds`
+                instead.
+            image (`Union[np.ndarray, PIL.Image.Image]`):
+                `Image`, or tensor representing an image batch, which will be used as the starting point for the process.
+            strength (`float`, defaults to 0.3):
+                Conceptually, indicates how much to transform the reference `image`. Must be between 0 and 1. `image`
+                will be used as a starting point, adding more noise to it the larger the `strength`. The number of
+                denoising steps depends on the amount of noise initially added.
When `strength` is 1, added noise will + be maximum and the denoising process will run for the full number of iterations specified in + `num_inference_steps`. A value of 1, therefore, essentially ignores `image`. + num_inference_steps (`int`, defaults to 50): + The number of denoising steps. More denoising steps usually lead to a higher quality image at the + expense of slower inference. + guidance_scale (`float`, defaults to 5): + Guidance scale as defined in [Classifier-Free Diffusion Guidance](https://arxiv.org/abs/2207.12598). + `guidance_scale` is defined as `w` of equation 2. of [Imagen + Paper](https://arxiv.org/pdf/2205.11487.pdf). Guidance scale is enabled by setting `guidance_scale > + 1`. Higher guidance scale encourages to generate images that are closely linked to the text `prompt`, + usually at the expense of lower image quality. + negative_prompt (`Optional[Union[str, list]]`): + The prompt or prompts not to guide the image generation. If not defined, one has to pass + `negative_prompt_embeds`. instead. Ignored when not using guidance (i.e., ignored if `guidance_scale` + is less than `1`). + num_images_per_prompt (`int`, defaults to 1): + The number of images to generate per prompt. + eta (`float`, defaults to 0.0): + Corresponds to parameter eta (η) in the DDIM paper: https://arxiv.org/abs/2010.02502. Only applies to + [`schedulers.DDIMScheduler`], will be ignored for others. + generator (`Optional[np.random.RandomState]`, defaults to `None`):: + A np.random.RandomState to make generation deterministic. + latents (`Optional[np.ndarray]`, defaults to `None`): + Pre-generated noisy latents, sampled from a Gaussian distribution, to be used as inputs for image + generation. Can be used to tweak the same generation with different prompts. If not provided, a latents + tensor will ge generated by sampling using the supplied random `generator`. + prompt_embeds (`Optional[np.ndarray]`, defaults to `None`): + Pre-generated text embeddings. Can be used to easily tweak text inputs, *e.g.* prompt weighting. If not + provided, text embeddings will be generated from `prompt` input argument. + negative_prompt_embeds (`Optional[np.ndarray]`, defaults to `None`): + Pre-generated negative text embeddings. Can be used to easily tweak text inputs, *e.g.* prompt + weighting. If not provided, negative_prompt_embeds will be generated from `negative_prompt` input + argument. + output_type (`str`, defaults to `"pil"`): + The output format of the generate image. Choose between + [PIL](https://pillow.readthedocs.io/en/stable/): `PIL.Image.Image` or `np.array`. + return_dict (`bool`, defaults to `True`): + Whether or not to return a [`~pipelines.stable_diffusion.StableDiffusionXLPipelineOutput`] instead of a + plain tuple. + callback (Optional[Callable], defaults to `None`): + A function that will be called every `callback_steps` steps during inference. The function will be + called with the following arguments: `callback(step: int, timestep: int, latents: torch.FloatTensor)`. + callback_steps (`int`, defaults to 1): + The frequency at which the `callback` function will be called. If not specified, the callback will be + called at every step. + guidance_rescale (`float`, defaults to 0.7): + Guidance rescale factor proposed by [Common Diffusion Noise Schedules and Sample Steps are + Flawed](https://arxiv.org/pdf/2305.08891.pdf) `guidance_scale` is defined as `φ` in equation 16. of + [Common Diffusion Noise Schedules and Sample Steps are Flawed](https://arxiv.org/pdf/2305.08891.pdf). 
+ Guidance rescale factor should fix overexposure when using zero terminal SNR. + + Returns: + [`~pipelines.stable_diffusion.StableDiffusionXLPipelineOutput`] or `tuple`: + [`~pipelines.stable_diffusion.StableDiffusionXLPipelineOutput`] if `return_dict` is True, otherwise a `tuple. + When returning a tuple, the first element is a list with the generated images, and the second element is a + list of `bool`s denoting whether the corresponding generated image likely represents "not-safe-for-work" + (nsfw) content, according to the `safety_checker`. + """ + # 0. Check inputs. Raise error if not correct + self.check_inputs(prompt, strength, callback_steps, negative_prompt, prompt_embeds, negative_prompt_embeds) + + # 1. Define call parameters + if isinstance(prompt, str): + batch_size = 1 + elif isinstance(prompt, list): + batch_size = len(prompt) + else: + batch_size = prompt_embeds.shape[0] + + if generator is None: + generator = np.random + + # here `guidance_scale` is defined analog to the guidance weight `w` of equation (2) + # of the Imagen paper: https://arxiv.org/pdf/2205.11487.pdf . `guidance_scale = 1` + # corresponds to doing no classifier free guidance. + do_classifier_free_guidance = guidance_scale > 1.0 + + # 2. Encode input prompt + ( + prompt_embeds, + negative_prompt_embeds, + pooled_prompt_embeds, + negative_pooled_prompt_embeds, + ) = self._encode_prompt( + prompt, + num_images_per_prompt, + do_classifier_free_guidance, + negative_prompt, + prompt_embeds=prompt_embeds, + negative_prompt_embeds=negative_prompt_embeds, + pooled_prompt_embeds=pooled_prompt_embeds, + negative_pooled_prompt_embeds=negative_pooled_prompt_embeds, + ) + + # 3. Preprocess image + image = preprocess(image) + + # 4. Prepare timesteps + self.scheduler.set_timesteps(num_inference_steps) + + timesteps, num_inference_steps = self.get_timesteps(num_inference_steps, strength) + latent_timestep = np.repeat(timesteps[:1], batch_size * num_images_per_prompt, axis=0) + timestep_dtype = self.unet.input_dtype.get("timestep", np.float32) + + latents_dtype = prompt_embeds.dtype + image = image.astype(latents_dtype) + + # 5. Prepare latent variables + latents = self.prepare_latents_img2img( + image, latent_timestep, batch_size, num_images_per_prompt, latents_dtype, generator + ) + + # 6. Prepare extra step kwargs + extra_step_kwargs = {} + accepts_eta = "eta" in set(inspect.signature(self.scheduler.step).parameters.keys()) + if accepts_eta: + extra_step_kwargs["eta"] = eta + + height, width = latents.shape[-2:] + height = height * self.vae_scale_factor + width = width * self.vae_scale_factor + original_size = original_size or (height, width) + target_size = target_size or (height, width) + + # 8. Prepare added time ids & embeddings + add_text_embeds = pooled_prompt_embeds + add_time_ids, add_neg_time_ids = self._get_add_time_ids( + original_size, + crops_coords_top_left, + target_size, + aesthetic_score, + negative_aesthetic_score, + dtype=prompt_embeds.dtype, + ) + + if do_classifier_free_guidance: + prompt_embeds = np.concatenate((negative_prompt_embeds, prompt_embeds), axis=0) + add_text_embeds = np.concatenate((negative_pooled_prompt_embeds, add_text_embeds), axis=0) + add_time_ids = np.concatenate((add_time_ids, add_time_ids), axis=0) + add_time_ids = np.repeat(add_time_ids, batch_size * num_images_per_prompt, axis=0) + + # 8. Panorama additions + views = self.get_views(height, width, self.window, self.stride) + count = np.zeros_like(latents) + value = np.zeros_like(latents) + + # 8. 
Denoising loop + num_warmup_steps = len(timesteps) - num_inference_steps * self.scheduler.order + for i, t in enumerate(self.progress_bar(timesteps)): + count.fill(0) + value.fill(0) + + for h_start, h_end, w_start, w_end in views: + # get the latents corresponding to the current view coordinates + latents_for_view = latents[:, :, h_start:h_end, w_start:w_end] + + # expand the latents if we are doing classifier free guidance + latent_model_input = np.concatenate([latents_for_view] * 2) if do_classifier_free_guidance else latents_for_view + latent_model_input = self.scheduler.scale_model_input(torch.from_numpy(latent_model_input), t) + latent_model_input = latent_model_input.cpu().numpy() + + # predict the noise residual + timestep = np.array([t], dtype=timestep_dtype) + noise_pred = self.unet( + sample=latent_model_input, + timestep=timestep, + encoder_hidden_states=prompt_embeds, + text_embeds=add_text_embeds, + time_ids=add_time_ids, + ) + noise_pred = noise_pred[0] + + # perform guidance + if do_classifier_free_guidance: + noise_pred_uncond, noise_pred_text = np.split(noise_pred, 2) + noise_pred = noise_pred_uncond + guidance_scale * (noise_pred_text - noise_pred_uncond) + if guidance_rescale > 0.0: + # Based on 3.4. in https://arxiv.org/pdf/2305.08891.pdf + noise_pred = rescale_noise_cfg(noise_pred, noise_pred_text, guidance_rescale=guidance_rescale) + + # compute the previous noisy sample x_t -> x_t-1 + scheduler_output = self.scheduler.step( + torch.from_numpy(noise_pred), t, torch.from_numpy(latents_for_view), **extra_step_kwargs + ) + latents_view_denoised = scheduler_output.prev_sample.numpy() + + value[:, :, h_start:h_end, w_start:w_end] += latents_view_denoised + count[:, :, h_start:h_end, w_start:w_end] += 1 + + # take the MultiDiffusion step. Eq. 
5 in MultiDiffusion paper: https://arxiv.org/abs/2302.08113 + latents = np.where(count > 0, value / count, value) + + # call the callback, if provided + if i == len(timesteps) - 1 or ((i + 1) > num_warmup_steps and (i + 1) % self.scheduler.order == 0): + if callback is not None and i % callback_steps == 0: + callback(i, t, latents) + + if output_type == "latent": + image = latents + else: + latents = latents / self.vae_decoder.config.get("scaling_factor", 0.18215) + # it seems likes there is a strange result for using half-precision vae decoder if batchsize>1 + image = np.concatenate( + [self.vae_decoder(latent_sample=latents[i : i + 1])[0] for i in range(latents.shape[0])] + ) + image = self.watermark.apply_watermark(image) + + # TODO: add image_processor + image = np.clip(image / 2 + 0.5, 0, 1).transpose((0, 2, 3, 1)) + + if output_type == "pil": + image = self.numpy_to_pil(image) + + if not return_dict: + return (image,) + + return StableDiffusionXLPipelineOutput(images=image) + + + def __call__( + self, + *args, + **kwargs, + ): + if "image" in kwargs or ( + len(args) > 1 + and ( + isinstance(args[1], np.ndarray) or isinstance(args[1], PIL.Image.Image) + ) + ): + logger.debug("running img2img panorama XL pipeline") + return self.img2img(*args, **kwargs) + else: + logger.debug("running txt2img panorama XL pipeline") + return self.text2img(*args, **kwargs) + + +class ORTStableDiffusionXLPanoramaPipeline(ORTStableDiffusionXLPipelineBase, StableDiffusionXLPanoramaPipelineMixin): + def __call__(self, *args, **kwargs): + return StableDiffusionXLPanoramaPipelineMixin.__call__(self, *args, **kwargs) diff --git a/api/onnx_web/params.py b/api/onnx_web/params.py index 28825ad4..0ceb99e6 100644 --- a/api/onnx_web/params.py +++ b/api/onnx_web/params.py @@ -259,7 +259,7 @@ class ImageParams: # otherwise, check for additional allowed pipelines if group == "img2img": - if pipeline in ["controlnet", "img2img-sdxl", "lpw", "panorama", "pix2pix"]: + if pipeline in ["controlnet", "img2img-sdxl", "lpw", "panorama", "panorama-sdxl", "pix2pix"]: return pipeline elif pipeline == "txt2img-sdxl": return "img2img-sdxl" @@ -267,7 +267,7 @@ class ImageParams: if pipeline in ["controlnet", "lpw", "panorama"]: return pipeline elif group == "txt2img": - if pipeline in ["lpw", "panorama", "txt2img-sdxl"]: + if pipeline in ["lpw", "panorama", "panorama-sdxl", "txt2img-sdxl"]: return pipeline logger.debug("pipeline %s is not valid for %s", pipeline, group) @@ -280,7 +280,7 @@ class ImageParams: return self.pipeline == "lpw" def is_panorama(self): - return self.pipeline == "panorama" + return self.pipeline in ["panorama", "panorama-sdxl"] def is_pix2pix(self): return self.pipeline == "pix2pix" diff --git a/gui/src/strings/de.ts b/gui/src/strings/de.ts index 922ff27d..fb324301 100644 --- a/gui/src/strings/de.ts +++ b/gui/src/strings/de.ts @@ -188,6 +188,7 @@ export const I18N_STRINGS_DE = { 'inpaint-sdxl': '', 'lpw': '', 'panorama': '', + 'panorama-sdxl': '', 'pix2pix': '', 'txt2img': '', 'txt2img-sdxl': '', diff --git a/gui/src/strings/en.ts b/gui/src/strings/en.ts index b7fe2cc6..fc2eb448 100644 --- a/gui/src/strings/en.ts +++ b/gui/src/strings/en.ts @@ -242,6 +242,7 @@ export const I18N_STRINGS_EN = { 'inpaint-sdxl': 'SDXL Inpaint', 'lpw': 'Long Prompt Weighting', 'panorama': 'Panorama', + 'panorama-sdxl': 'SDXL Panorama', 'pix2pix': 'Instruct Pix2Pix', 'txt2img': 'Txt2Img', 'txt2img-sdxl': 'SDXL Txt2Img', diff --git a/gui/src/strings/es.ts b/gui/src/strings/es.ts index 8bd6d792..e2b572e0 100644 --- 
a/gui/src/strings/es.ts
+++ b/gui/src/strings/es.ts
@@ -188,6 +188,7 @@ export const I18N_STRINGS_ES = {
     'inpaint-sdxl': '',
     'lpw': '',
     'panorama': '',
+    'panorama-sdxl': '',
     'pix2pix': '',
     'txt2img': '',
     'txt2img-sdxl': '',
diff --git a/gui/src/strings/fr.ts b/gui/src/strings/fr.ts
index 38afb2e1..589cf85f 100644
--- a/gui/src/strings/fr.ts
+++ b/gui/src/strings/fr.ts
@@ -188,6 +188,7 @@ export const I18N_STRINGS_FR = {
     'inpaint-sdxl': '',
     'lpw': '',
     'panorama': '',
+    'panorama-sdxl': '',
     'pix2pix': '',
     'txt2img': '',
     'txt2img-sdxl': '',

From 78f834a67852a92f6b7967bcda8d5da8a94f9cb1 Mon Sep 17 00:00:00 2001
From: Sean Sube
Date: Sun, 10 Sep 2023 11:26:55 -0500
Subject: [PATCH 003/240] apply lint

---
 api/onnx_web/diffusers/patches/vae.py  |   6 +-
 .../diffusers/pipelines/panorama_xl.py | 211 +++++++++++++-----
 api/onnx_web/params.py                 |   9 +-
 3 files changed, 168 insertions(+), 58 deletions(-)

diff --git a/api/onnx_web/diffusers/patches/vae.py b/api/onnx_web/diffusers/patches/vae.py
index 48e9358e..1b46e505 100644
--- a/api/onnx_web/diffusers/patches/vae.py
+++ b/api/onnx_web/diffusers/patches/vae.py
@@ -39,7 +39,11 @@ class VAEWrapper(object):
         self.tile_overlap_factor = overlap

     def __call__(self, latent_sample=None, sample=None, **kwargs):
-        model = self.wrapped.model if hasattr(self.wrapped, "model") else self.wrapped.session
+        model = (
+            self.wrapped.model
+            if hasattr(self.wrapped, "model")
+            else self.wrapped.session
+        )

         # set timestep dtype to input type
         sample_dtype = next(
diff --git a/api/onnx_web/diffusers/pipelines/panorama_xl.py b/api/onnx_web/diffusers/pipelines/panorama_xl.py
index 5092cae0..fed65722 100644
--- a/api/onnx_web/diffusers/pipelines/panorama_xl.py
+++ b/api/onnx_web/diffusers/pipelines/panorama_xl.py
@@ -1,13 +1,16 @@
-from optimum.onnxruntime.modeling_diffusion import ORTStableDiffusionXLPipelineBase
-from optimum.pipelines.diffusers.pipeline_stable_diffusion_xl_img2img import StableDiffusionXLImg2ImgPipelineMixin
-from optimum.pipelines.diffusers.pipeline_utils import preprocess, rescale_noise_cfg
-from diffusers.pipelines.stable_diffusion_xl import StableDiffusionXLPipelineOutput
+import inspect
 import logging
-from typing import Any, Optional, List, Union, Tuple, Callable, Dict
+from typing import Any, Callable, Dict, List, Optional, Tuple, Union
+
+import numpy as np
+import PIL
+import torch
+from diffusers.pipelines.stable_diffusion_xl import StableDiffusionXLPipelineOutput
+from optimum.onnxruntime.modeling_diffusion import ORTStableDiffusionXLPipelineBase
+from optimum.pipelines.diffusers.pipeline_stable_diffusion_xl_img2img import (
+    StableDiffusionXLImg2ImgPipelineMixin,
+)
+from optimum.pipelines.diffusers.pipeline_utils import preprocess, rescale_noise_cfg

 logger = logging.getLogger(__name__)

@@ -18,23 +21,21 @@ DEFAULT_STRIDE = 16

 class StableDiffusionXLPanoramaPipelineMixin(StableDiffusionXLImg2ImgPipelineMixin):
     def __init__(
-        self,
-        *args,
-        window: int = DEFAULT_WINDOW,
-        stride: int = DEFAULT_STRIDE,
-        **kwargs,
+        self,
+        *args,
+        window: int = DEFAULT_WINDOW,
+        stride: int = DEFAULT_STRIDE,
+        **kwargs,
     ):
         super().__init__(*args, **kwargs)

         self.window = window
         self.stride = stride

-
     def set_window_size(self, window: int, stride: int):
         self.window = window
         self.stride = stride

-
     def get_views(self, panorama_height, panorama_width, window_size, stride):
         # Here, we define the mappings F_i (see Eq.
7 in the MultiDiffusion paper https://arxiv.org/abs/2302.08113) panorama_height /= 8 @@ -60,21 +61,32 @@ class StableDiffusionXLPanoramaPipelineMixin(StableDiffusionXLImg2ImgPipelineMix return views - # Adapted from diffusers.pipelines.stable_diffusion.pipeline_stable_diffusion.StableDiffusionPipeline.prepare_latents - def prepare_latents_img2img(self, image, timestep, batch_size, num_images_per_prompt, dtype, generator=None): + def prepare_latents_img2img( + self, image, timestep, batch_size, num_images_per_prompt, dtype, generator=None + ): batch_size = batch_size * num_images_per_prompt if image.shape[1] == 4: init_latents = image else: - init_latents = self.vae_encoder(sample=image)[0] * self.vae_decoder.config.get("scaling_factor", 0.18215) + init_latents = self.vae_encoder(sample=image)[ + 0 + ] * self.vae_decoder.config.get("scaling_factor", 0.18215) - if batch_size > init_latents.shape[0] and batch_size % init_latents.shape[0] == 0: + if ( + batch_size > init_latents.shape[0] + and batch_size % init_latents.shape[0] == 0 + ): # expand init_latents for batch_size additional_image_per_prompt = batch_size // init_latents.shape[0] - init_latents = np.concatenate([init_latents] * additional_image_per_prompt, axis=0) - elif batch_size > init_latents.shape[0] and batch_size % init_latents.shape[0] != 0: + init_latents = np.concatenate( + [init_latents] * additional_image_per_prompt, axis=0 + ) + elif ( + batch_size > init_latents.shape[0] + and batch_size % init_latents.shape[0] != 0 + ): raise ValueError( f"Cannot duplicate `image` of batch size {init_latents.shape[0]} to {batch_size} text prompts." ) @@ -84,14 +96,29 @@ class StableDiffusionXLPanoramaPipelineMixin(StableDiffusionXLImg2ImgPipelineMix # add noise to latents using the timesteps noise = generator.randn(*init_latents.shape).astype(dtype) init_latents = self.scheduler.add_noise( - torch.from_numpy(init_latents), torch.from_numpy(noise), torch.from_numpy(timestep) + torch.from_numpy(init_latents), + torch.from_numpy(noise), + torch.from_numpy(timestep), ) return init_latents.numpy() - # Adapted from diffusers.pipelines.stable_diffusion.pipeline_stable_diffusion.StableDiffusionPipeline.prepare_latents - def prepare_latents_text2img(self, batch_size, num_channels_latents, height, width, dtype, generator, latents=None): - shape = (batch_size, num_channels_latents, height // self.vae_scale_factor, width // self.vae_scale_factor) + def prepare_latents_text2img( + self, + batch_size, + num_channels_latents, + height, + width, + dtype, + generator, + latents=None, + ): + shape = ( + batch_size, + num_channels_latents, + height // self.vae_scale_factor, + width // self.vae_scale_factor, + ) if isinstance(generator, list) and len(generator) != batch_size: raise ValueError( f"You have passed a list of generators of length {len(generator)}, but requested an effective batch" @@ -101,14 +128,15 @@ class StableDiffusionXLPanoramaPipelineMixin(StableDiffusionXLImg2ImgPipelineMix if latents is None: latents = generator.randn(*shape).astype(dtype) elif latents.shape != shape: - raise ValueError(f"Unexpected latents shape, got {latents.shape}, expected {shape}") + raise ValueError( + f"Unexpected latents shape, got {latents.shape}, expected {shape}" + ) # scale the initial noise by the standard deviation required by the scheduler latents = latents * np.float64(self.scheduler.init_noise_sigma) return latents - # Adapted from diffusers.pipelines.stable_diffusion.pipeline_stable_diffusion.StableDiffusionPipeline.prepare_extra_step_kwargs def 
prepare_extra_step_kwargs(self, generator, eta): # prepare extra kwargs for the scheduler step, since not all schedulers have the same signature @@ -118,13 +146,14 @@ class StableDiffusionXLPanoramaPipelineMixin(StableDiffusionXLImg2ImgPipelineMix extra_step_kwargs = {} - accepts_eta = "eta" in set(inspect.signature(self.scheduler.step).parameters.keys()) + accepts_eta = "eta" in set( + inspect.signature(self.scheduler.step).parameters.keys() + ) if accepts_eta: extra_step_kwargs["eta"] = eta return extra_step_kwargs - # Adapted from diffusers.pipelines.stable_diffusion_xl.pipeline_stable_diffusion_xl.StableDiffusionXLPipeline.__call__ def text2img( self, @@ -294,10 +323,16 @@ class StableDiffusionXLPanoramaPipelineMixin(StableDiffusionXLImg2ImgPipelineMix add_time_ids = np.array(add_time_ids, dtype=prompt_embeds.dtype) if do_classifier_free_guidance: - prompt_embeds = np.concatenate((negative_prompt_embeds, prompt_embeds), axis=0) - add_text_embeds = np.concatenate((negative_pooled_prompt_embeds, add_text_embeds), axis=0) + prompt_embeds = np.concatenate( + (negative_prompt_embeds, prompt_embeds), axis=0 + ) + add_text_embeds = np.concatenate( + (negative_pooled_prompt_embeds, add_text_embeds), axis=0 + ) add_time_ids = np.concatenate((add_time_ids, add_time_ids), axis=0) - add_time_ids = np.repeat(add_time_ids, batch_size * num_images_per_prompt, axis=0) + add_time_ids = np.repeat( + add_time_ids, batch_size * num_images_per_prompt, axis=0 + ) # Adapted from diffusers to extend it for other runtimes than ORT timestep_dtype = self.unet.input_dtype.get("timestep", np.float32) @@ -318,8 +353,14 @@ class StableDiffusionXLPanoramaPipelineMixin(StableDiffusionXLImg2ImgPipelineMix latents_for_view = latents[:, :, h_start:h_end, w_start:w_end] # expand the latents if we are doing classifier free guidance - latent_model_input = np.concatenate([latents_for_view] * 2) if do_classifier_free_guidance else latents_for_view - latent_model_input = self.scheduler.scale_model_input(torch.from_numpy(latent_model_input), t) + latent_model_input = ( + np.concatenate([latents_for_view] * 2) + if do_classifier_free_guidance + else latents_for_view + ) + latent_model_input = self.scheduler.scale_model_input( + torch.from_numpy(latent_model_input), t + ) latent_model_input = latent_model_input.cpu().numpy() # predict the noise residual @@ -336,14 +377,23 @@ class StableDiffusionXLPanoramaPipelineMixin(StableDiffusionXLImg2ImgPipelineMix # perform guidance if do_classifier_free_guidance: noise_pred_uncond, noise_pred_text = np.split(noise_pred, 2) - noise_pred = noise_pred_uncond + guidance_scale * (noise_pred_text - noise_pred_uncond) + noise_pred = noise_pred_uncond + guidance_scale * ( + noise_pred_text - noise_pred_uncond + ) if guidance_rescale > 0.0: # Based on 3.4. 
in https://arxiv.org/pdf/2305.08891.pdf - noise_pred = rescale_noise_cfg(noise_pred, noise_pred_text, guidance_rescale=guidance_rescale) + noise_pred = rescale_noise_cfg( + noise_pred, + noise_pred_text, + guidance_rescale=guidance_rescale, + ) # compute the previous noisy sample x_t -> x_t-1 scheduler_output = self.scheduler.step( - torch.from_numpy(noise_pred), t, torch.from_numpy(latents_for_view), **extra_step_kwargs + torch.from_numpy(noise_pred), + t, + torch.from_numpy(latents_for_view), + **extra_step_kwargs, ) latents_view_denoised = scheduler_output.prev_sample.numpy() @@ -354,7 +404,9 @@ class StableDiffusionXLPanoramaPipelineMixin(StableDiffusionXLImg2ImgPipelineMix latents = np.where(count > 0, value / count, value) # call the callback, if provided - if i == len(timesteps) - 1 or ((i + 1) > num_warmup_steps and (i + 1) % self.scheduler.order == 0): + if i == len(timesteps) - 1 or ( + (i + 1) > num_warmup_steps and (i + 1) % self.scheduler.order == 0 + ): if callback is not None and i % callback_steps == 0: callback(i, t, latents) @@ -364,7 +416,10 @@ class StableDiffusionXLPanoramaPipelineMixin(StableDiffusionXLImg2ImgPipelineMix latents = latents / self.vae_decoder.config.get("scaling_factor", 0.18215) # it seems likes there is a strange result for using half-precision vae decoder if batchsize>1 image = np.concatenate( - [self.vae_decoder(latent_sample=latents[i : i + 1])[0] for i in range(latents.shape[0])] + [ + self.vae_decoder(latent_sample=latents[i : i + 1])[0] + for i in range(latents.shape[0]) + ] ) image = self.watermark.apply_watermark(image) @@ -379,7 +434,6 @@ class StableDiffusionXLPanoramaPipelineMixin(StableDiffusionXLImg2ImgPipelineMix return StableDiffusionXLPipelineOutput(images=image) - # Adapted from diffusers.pipelines.stable_diffusion_xl.pipeline_stable_diffusion_xl.StableDiffusionXLPipeline.__call__ def img2img( self, @@ -481,7 +535,14 @@ class StableDiffusionXLPanoramaPipelineMixin(StableDiffusionXLImg2ImgPipelineMix (nsfw) content, according to the `safety_checker`. """ # 0. Check inputs. Raise error if not correct - self.check_inputs(prompt, strength, callback_steps, negative_prompt, prompt_embeds, negative_prompt_embeds) + self.check_inputs( + prompt, + strength, + callback_steps, + negative_prompt, + prompt_embeds, + negative_prompt_embeds, + ) # 1. Define call parameters if isinstance(prompt, str): @@ -522,8 +583,12 @@ class StableDiffusionXLPanoramaPipelineMixin(StableDiffusionXLImg2ImgPipelineMix # 4. Prepare timesteps self.scheduler.set_timesteps(num_inference_steps) - timesteps, num_inference_steps = self.get_timesteps(num_inference_steps, strength) - latent_timestep = np.repeat(timesteps[:1], batch_size * num_images_per_prompt, axis=0) + timesteps, num_inference_steps = self.get_timesteps( + num_inference_steps, strength + ) + latent_timestep = np.repeat( + timesteps[:1], batch_size * num_images_per_prompt, axis=0 + ) timestep_dtype = self.unet.input_dtype.get("timestep", np.float32) latents_dtype = prompt_embeds.dtype @@ -531,12 +596,19 @@ class StableDiffusionXLPanoramaPipelineMixin(StableDiffusionXLImg2ImgPipelineMix # 5. Prepare latent variables latents = self.prepare_latents_img2img( - image, latent_timestep, batch_size, num_images_per_prompt, latents_dtype, generator + image, + latent_timestep, + batch_size, + num_images_per_prompt, + latents_dtype, + generator, ) # 6. 
Prepare extra step kwargs extra_step_kwargs = {} - accepts_eta = "eta" in set(inspect.signature(self.scheduler.step).parameters.keys()) + accepts_eta = "eta" in set( + inspect.signature(self.scheduler.step).parameters.keys() + ) if accepts_eta: extra_step_kwargs["eta"] = eta @@ -558,10 +630,16 @@ class StableDiffusionXLPanoramaPipelineMixin(StableDiffusionXLImg2ImgPipelineMix ) if do_classifier_free_guidance: - prompt_embeds = np.concatenate((negative_prompt_embeds, prompt_embeds), axis=0) - add_text_embeds = np.concatenate((negative_pooled_prompt_embeds, add_text_embeds), axis=0) + prompt_embeds = np.concatenate( + (negative_prompt_embeds, prompt_embeds), axis=0 + ) + add_text_embeds = np.concatenate( + (negative_pooled_prompt_embeds, add_text_embeds), axis=0 + ) add_time_ids = np.concatenate((add_time_ids, add_time_ids), axis=0) - add_time_ids = np.repeat(add_time_ids, batch_size * num_images_per_prompt, axis=0) + add_time_ids = np.repeat( + add_time_ids, batch_size * num_images_per_prompt, axis=0 + ) # 8. Panorama additions views = self.get_views(height, width, self.window, self.stride) @@ -579,8 +657,14 @@ class StableDiffusionXLPanoramaPipelineMixin(StableDiffusionXLImg2ImgPipelineMix latents_for_view = latents[:, :, h_start:h_end, w_start:w_end] # expand the latents if we are doing classifier free guidance - latent_model_input = np.concatenate([latents_for_view] * 2) if do_classifier_free_guidance else latents_for_view - latent_model_input = self.scheduler.scale_model_input(torch.from_numpy(latent_model_input), t) + latent_model_input = ( + np.concatenate([latents_for_view] * 2) + if do_classifier_free_guidance + else latents_for_view + ) + latent_model_input = self.scheduler.scale_model_input( + torch.from_numpy(latent_model_input), t + ) latent_model_input = latent_model_input.cpu().numpy() # predict the noise residual @@ -597,14 +681,23 @@ class StableDiffusionXLPanoramaPipelineMixin(StableDiffusionXLImg2ImgPipelineMix # perform guidance if do_classifier_free_guidance: noise_pred_uncond, noise_pred_text = np.split(noise_pred, 2) - noise_pred = noise_pred_uncond + guidance_scale * (noise_pred_text - noise_pred_uncond) + noise_pred = noise_pred_uncond + guidance_scale * ( + noise_pred_text - noise_pred_uncond + ) if guidance_rescale > 0.0: # Based on 3.4. 
in https://arxiv.org/pdf/2305.08891.pdf - noise_pred = rescale_noise_cfg(noise_pred, noise_pred_text, guidance_rescale=guidance_rescale) + noise_pred = rescale_noise_cfg( + noise_pred, + noise_pred_text, + guidance_rescale=guidance_rescale, + ) # compute the previous noisy sample x_t -> x_t-1 scheduler_output = self.scheduler.step( - torch.from_numpy(noise_pred), t, torch.from_numpy(latents_for_view), **extra_step_kwargs + torch.from_numpy(noise_pred), + t, + torch.from_numpy(latents_for_view), + **extra_step_kwargs, ) latents_view_denoised = scheduler_output.prev_sample.numpy() @@ -615,7 +708,9 @@ class StableDiffusionXLPanoramaPipelineMixin(StableDiffusionXLImg2ImgPipelineMix latents = np.where(count > 0, value / count, value) # call the callback, if provided - if i == len(timesteps) - 1 or ((i + 1) > num_warmup_steps and (i + 1) % self.scheduler.order == 0): + if i == len(timesteps) - 1 or ( + (i + 1) > num_warmup_steps and (i + 1) % self.scheduler.order == 0 + ): if callback is not None and i % callback_steps == 0: callback(i, t, latents) @@ -625,7 +720,10 @@ class StableDiffusionXLPanoramaPipelineMixin(StableDiffusionXLImg2ImgPipelineMix latents = latents / self.vae_decoder.config.get("scaling_factor", 0.18215) # it seems likes there is a strange result for using half-precision vae decoder if batchsize>1 image = np.concatenate( - [self.vae_decoder(latent_sample=latents[i : i + 1])[0] for i in range(latents.shape[0])] + [ + self.vae_decoder(latent_sample=latents[i : i + 1])[0] + for i in range(latents.shape[0]) + ] ) image = self.watermark.apply_watermark(image) @@ -640,7 +738,6 @@ class StableDiffusionXLPanoramaPipelineMixin(StableDiffusionXLImg2ImgPipelineMix return StableDiffusionXLPipelineOutput(images=image) - def __call__( self, *args, @@ -659,6 +756,8 @@ class StableDiffusionXLPanoramaPipelineMixin(StableDiffusionXLImg2ImgPipelineMix return self.text2img(*args, **kwargs) -class ORTStableDiffusionXLPanoramaPipeline(ORTStableDiffusionXLPipelineBase, StableDiffusionXLPanoramaPipelineMixin): +class ORTStableDiffusionXLPanoramaPipeline( + ORTStableDiffusionXLPipelineBase, StableDiffusionXLPanoramaPipelineMixin +): def __call__(self, *args, **kwargs): return StableDiffusionXLPanoramaPipelineMixin.__call__(self, *args, **kwargs) diff --git a/api/onnx_web/params.py b/api/onnx_web/params.py index 0ceb99e6..4b03f758 100644 --- a/api/onnx_web/params.py +++ b/api/onnx_web/params.py @@ -259,7 +259,14 @@ class ImageParams: # otherwise, check for additional allowed pipelines if group == "img2img": - if pipeline in ["controlnet", "img2img-sdxl", "lpw", "panorama", "panorama-sdxl", "pix2pix"]: + if pipeline in [ + "controlnet", + "img2img-sdxl", + "lpw", + "panorama", + "panorama-sdxl", + "pix2pix", + ]: return pipeline elif pipeline == "txt2img-sdxl": return "img2img-sdxl" From fe68670844d25226a634c8ead689b47fa520722b Mon Sep 17 00:00:00 2001 From: Sean Sube Date: Sun, 10 Sep 2023 11:52:46 -0500 Subject: [PATCH 004/240] feat(api): add conversion for SDXL models --- api/onnx_web/convert/__main__.py | 28 +++++--- .../diffusion/{diffusers.py => diffusion.py} | 0 .../convert/diffusion/diffusion_xl.py | 72 +++++++++++++++++++ 3 files changed, 92 insertions(+), 8 deletions(-) rename api/onnx_web/convert/diffusion/{diffusers.py => diffusion.py} (100%) create mode 100644 api/onnx_web/convert/diffusion/diffusion_xl.py diff --git a/api/onnx_web/convert/__main__.py b/api/onnx_web/convert/__main__.py index 36c97429..9a44fd8d 100644 --- a/api/onnx_web/convert/__main__.py +++ 
b/api/onnx_web/convert/__main__.py @@ -11,11 +11,13 @@ from jsonschema import ValidationError, validate from onnx import load_model, save_model from transformers import CLIPTokenizer +from .diffusion.diffusion_xl import convert_diffusion_diffusers_xl + from ..constants import ONNX_MODEL, ONNX_WEIGHTS from ..utils import load_config from .correction.gfpgan import convert_correction_gfpgan from .diffusion.control import convert_diffusion_control -from .diffusion.diffusers import convert_diffusion_diffusers +from .diffusion.diffusion import convert_diffusion_diffusers from .diffusion.lora import blend_loras from .diffusion.textual_inversion import blend_textual_inversions from .upscaling.bsrgan import convert_upscaling_bsrgan @@ -357,13 +359,23 @@ def convert_models(conversion: ConversionContext, args, models: Models): conversion, name, model["source"], format=model_format ) - converted, dest = convert_diffusion_diffusers( - conversion, - model, - source, - model_format, - hf=hf, - ) + pipeline = model.get("pipeline", "txt2img") + if pipeline.endswith("-sdxl"): + converted, dest = convert_diffusion_diffusers_xl( + conversion, + model, + source, + model_format, + hf=hf, + ) + else: + converted, dest = convert_diffusion_diffusers( + conversion, + model, + source, + model_format, + hf=hf, + ) # make sure blending only happens once, not every run if converted: diff --git a/api/onnx_web/convert/diffusion/diffusers.py b/api/onnx_web/convert/diffusion/diffusion.py similarity index 100% rename from api/onnx_web/convert/diffusion/diffusers.py rename to api/onnx_web/convert/diffusion/diffusion.py diff --git a/api/onnx_web/convert/diffusion/diffusion_xl.py b/api/onnx_web/convert/diffusion/diffusion_xl.py new file mode 100644 index 00000000..58d57143 --- /dev/null +++ b/api/onnx_web/convert/diffusion/diffusion_xl.py @@ -0,0 +1,72 @@ +from logging import getLogger +from os import path +from typing import Dict, Optional, Tuple + +import torch +from optimum.pipelines.diffusers.pipeline_stable_diffusion_xl import StableDiffusionXLPipeline +from optimum.exporters.onnx import main_export + +from ..utils import ConversionContext + +logger = getLogger(__name__) + + +@torch.no_grad() +def convert_diffusion_diffusers_xl( + conversion: ConversionContext, + model: Dict, + source: str, + format: Optional[str], + hf: bool = False, +) -> Tuple[bool, str]: + """ + From https://github.com/huggingface/diffusers/blob/main/scripts/convert_stable_diffusion_checkpoint_to_onnx.py + """ + name = model.get("name") + # TODO: support alternate VAE + + device = conversion.training_device + dtype = conversion.torch_dtype() + logger.debug("using Torch dtype %s for pipeline", dtype) + + dest_path = path.join(conversion.model_path, name) + model_index = path.join(dest_path, "model_index.json") + model_hash = path.join(dest_path, "hash.txt") + + # diffusers go into a directory rather than .onnx file + logger.info( + "converting Stable Diffusion XL model %s: %s -> %s/", name, source, dest_path + ) + + if "hash" in model and not path.exists(model_hash): + logger.info("ONNX model does not have hash file, adding one") + with open(model_hash, "w") as f: + f.write(model["hash"]) + + if path.exists(dest_path) and path.exists(model_index): + logger.info("ONNX model already exists, skipping conversion") + return (False, dest_path) + + # safetensors -> diffusers directory with torch models + temp_path = path.join(conversion.cache_path, f"{name}-torch") + + if format == "safetensors": + pipeline = StableDiffusionXLPipeline.from_single_file(source, 
use_safetensors=True) + else: + pipeline = StableDiffusionXLPipeline.from_pretrained(source) + + pipeline.save_pretrained(temp_path) + + # directory -> onnx using optimum exporters + main_export( + temp_path, + output=dest_path, + task="stable-diffusion-xl", + device=device, + fp16=conversion.half, + framework="pt", + ) + + # TODO: optimize UNet to fp16 + + return False, dest_path \ No newline at end of file From f2d0c2f7657d6ac5af955a1cedd5de05540c1f03 Mon Sep 17 00:00:00 2001 From: Sean Sube Date: Sun, 10 Sep 2023 11:53:36 -0500 Subject: [PATCH 005/240] apply lint --- api/onnx_web/convert/__main__.py | 3 +-- api/onnx_web/convert/diffusion/diffusion_xl.py | 10 +++++++--- 2 files changed, 8 insertions(+), 5 deletions(-) diff --git a/api/onnx_web/convert/__main__.py b/api/onnx_web/convert/__main__.py index 9a44fd8d..a969ca4c 100644 --- a/api/onnx_web/convert/__main__.py +++ b/api/onnx_web/convert/__main__.py @@ -11,13 +11,12 @@ from jsonschema import ValidationError, validate from onnx import load_model, save_model from transformers import CLIPTokenizer -from .diffusion.diffusion_xl import convert_diffusion_diffusers_xl - from ..constants import ONNX_MODEL, ONNX_WEIGHTS from ..utils import load_config from .correction.gfpgan import convert_correction_gfpgan from .diffusion.control import convert_diffusion_control from .diffusion.diffusion import convert_diffusion_diffusers +from .diffusion.diffusion_xl import convert_diffusion_diffusers_xl from .diffusion.lora import blend_loras from .diffusion.textual_inversion import blend_textual_inversions from .upscaling.bsrgan import convert_upscaling_bsrgan diff --git a/api/onnx_web/convert/diffusion/diffusion_xl.py b/api/onnx_web/convert/diffusion/diffusion_xl.py index 58d57143..a92c5856 100644 --- a/api/onnx_web/convert/diffusion/diffusion_xl.py +++ b/api/onnx_web/convert/diffusion/diffusion_xl.py @@ -3,8 +3,10 @@ from os import path from typing import Dict, Optional, Tuple import torch -from optimum.pipelines.diffusers.pipeline_stable_diffusion_xl import StableDiffusionXLPipeline from optimum.exporters.onnx import main_export +from optimum.pipelines.diffusers.pipeline_stable_diffusion_xl import ( + StableDiffusionXLPipeline, +) from ..utils import ConversionContext @@ -51,7 +53,9 @@ def convert_diffusion_diffusers_xl( temp_path = path.join(conversion.cache_path, f"{name}-torch") if format == "safetensors": - pipeline = StableDiffusionXLPipeline.from_single_file(source, use_safetensors=True) + pipeline = StableDiffusionXLPipeline.from_single_file( + source, use_safetensors=True + ) else: pipeline = StableDiffusionXLPipeline.from_pretrained(source) @@ -69,4 +73,4 @@ def convert_diffusion_diffusers_xl( # TODO: optimize UNet to fp16 - return False, dest_path \ No newline at end of file + return False, dest_path From 956a260db6b6a6c91ffe7bcdf9ba8106e3f2faf0 Mon Sep 17 00:00:00 2001 From: Sean Sube Date: Sun, 10 Sep 2023 12:15:39 -0500 Subject: [PATCH 006/240] fix import --- api/onnx_web/convert/diffusion/diffusion_xl.py | 4 +--- 1 file changed, 1 insertion(+), 3 deletions(-) diff --git a/api/onnx_web/convert/diffusion/diffusion_xl.py b/api/onnx_web/convert/diffusion/diffusion_xl.py index a92c5856..a7dcf104 100644 --- a/api/onnx_web/convert/diffusion/diffusion_xl.py +++ b/api/onnx_web/convert/diffusion/diffusion_xl.py @@ -3,10 +3,8 @@ from os import path from typing import Dict, Optional, Tuple import torch +from diffusers import StableDiffusionXLPipeline from optimum.exporters.onnx import main_export -from 
optimum.pipelines.diffusers.pipeline_stable_diffusion_xl import (
-    StableDiffusionXLPipeline,
-)
 
 from ..utils import ConversionContext
 

From 1a732d54b6168fa9949ec3d19faea10b197fb508 Mon Sep 17 00:00:00 2001
From: Sean Sube
Date: Sun, 10 Sep 2023 16:35:16 -0500
Subject: [PATCH 007/240] add endpoint for multiple image generation

---
 api/onnx_web/output.py        |   3 +-
 api/onnx_web/server/api.py    |  58 ++++++++++++-
 api/onnx_web/server/params.py | 153 +++++++++++++++++++++++++++++++++-
 3 files changed, 211 insertions(+), 3 deletions(-)

diff --git a/api/onnx_web/output.py b/api/onnx_web/output.py
index 17f29744..d64f79a0 100644
--- a/api/onnx_web/output.py
+++ b/api/onnx_web/output.py
@@ -158,6 +158,7 @@ def make_output_name(
     size: Size,
     extras: Optional[List[Optional[Param]]] = None,
     count: Optional[int] = None,
+    offset: int = 0,
 ) -> List[str]:
     count = count or params.batch
     now = int(time())
@@ -183,7 +184,7 @@ def make_output_name(
 
     return [
         f"{mode}_{params.seed}_{sha.hexdigest()}_{now}_{i}.{server.image_format}"
-        for i in range(count)
+        for i in range(offset, count + offset)
     ]
 
 
diff --git a/api/onnx_web/server/api.py b/api/onnx_web/server/api.py
index 7035f680..8e046440 100644
--- a/api/onnx_web/server/api.py
+++ b/api/onnx_web/server/api.py
@@ -51,6 +51,7 @@ from .load import (
 from .params import (
     border_from_request,
     highres_from_request,
+    pipeline_from_json,
     pipeline_from_request,
     upscale_from_request,
 )
@@ -221,7 +222,7 @@ def txt2img(server: ServerContext, pool: DevicePoolExecutor):
 
     replace_wildcards(params, get_wildcard_data())
 
-    output = make_output_name(server, "txt2img", params, size)
+    output = make_output_name(server, "txt2img", params, size, count=params.batch)
     job_name = output[0]
 
     pool.submit(
@@ -514,6 +515,61 @@ def txt2txt(server: ServerContext, pool: DevicePoolExecutor):
     return jsonify(json_params(output, params, size))
 
 
+def generate(server: ServerContext, pool: DevicePoolExecutor):
+    if not request.is_json:
+        return error_reply("generate endpoint requires JSON parameters")
+
+    # TODO: should this accept YAML as well?
+    data = request.get_json()
+    schema = load_config("./schemas/generate.yaml")
+
+    logger.debug("validating generate request: %s against %s", data, schema)
+    validate(data, schema)
+
+    jobs = []
+
+    if "txt2img" in data:
+        for job in data.get("txt2img"):
+            device, params, size = pipeline_from_json(server, job, "txt2img")
+            jobs.append((
+                f"generate-txt2img-{len(jobs)}",
+                run_txt2img_pipeline,
+                server,
+                params,
+                size,
+                make_output_name(server, "txt2img", params, size, offset=len(jobs)),
+                None,
+                None,
+                device,
+            ))
+
+    if "img2img" in data:
+        for job in data.get("img2img"):
+            device, params, size = pipeline_from_json(server, job, "img2img")
+            jobs.append((
+                f"generate-img2img-{len(jobs)}",
+                run_img2img_pipeline,
+                server,
+                params,
+                size,
+                make_output_name(server, "img2img", params, size, offset=len(jobs)),
+                None,
+                None,
+                device,
+            ))
+
+    for job in jobs:
+        pool.submit(*job)
+
+    # TODO: collect results
+    # This is the hard part: once all of the jobs are done, the last job or some dedicated
+    # job needs to collect the previous outputs and put them on a grid. Jobs write their own
+    # output to disk and do not return it, so that job may need to read the images back using
+    # the output names assigned to each job. Knowing when the jobs are done is the first problem.
+
+    # TODO: assemble grid
+
+
 def cancel(server: ServerContext, pool: DevicePoolExecutor):
     output_file = request.args.get("output", None)
     if output_file is None:
diff --git a/api/onnx_web/server/params.py b/api/onnx_web/server/params.py
index 2598e819..43c7a511 100644
--- a/api/onnx_web/server/params.py
+++ b/api/onnx_web/server/params.py
@@ -1,5 +1,5 @@
 from logging import getLogger
-from typing import Tuple
+from typing import Any, Dict, Tuple
 
 import numpy as np
 from flask import request
@@ -34,6 +34,157 @@ from .utils import get_model_path
 logger = getLogger(__name__)
 
 
+def pipeline_from_json(
+    server: ServerContext,
+    data: Dict[str, Any],
+    default_pipeline: str = "txt2img",
+) -> Tuple[DeviceParams, ImageParams, Size]:
+    device = None
+    device_name = data.get("platform")
+
+    if device_name is not None and device_name != "any":
+        for platform in get_available_platforms():
+            if platform.device == device_name:
+                device = platform
+
+    # diffusion model
+    model = get_not_empty(data, "model", get_config_value("model"))
+    model_path = get_model_path(server, model)
+
+    # pipeline stuff
+    pipeline = get_from_list(
+        data, "pipeline", get_available_pipelines(), default_pipeline
+    )
+    scheduler = get_from_list(data, "scheduler", get_pipeline_schedulers())
+
+    if scheduler is None:
+        scheduler = get_config_value("scheduler")
+
+    # prompt does not come from config
+    prompt = data.get("prompt", "")
+    negative_prompt = data.get("negativePrompt", None)
+
+    if negative_prompt is not None and negative_prompt.strip() == "":
+        negative_prompt = None
+
+    # image params
+    batch = get_and_clamp_int(
+        data,
+        "batch",
+        get_config_value("batch"),
+        get_config_value("batch", "max"),
+        get_config_value("batch", "min"),
+    )
+    cfg = get_and_clamp_float(
+        data,
+        "cfg",
+        get_config_value("cfg"),
+        get_config_value("cfg", "max"),
+        get_config_value("cfg", "min"),
+    )
+    eta = get_and_clamp_float(
+        data,
+        "eta",
+        get_config_value("eta"),
+        get_config_value("eta", "max"),
+        get_config_value("eta", "min"),
+    )
+    loopback = get_and_clamp_int(
+        data,
+        "loopback",
+        get_config_value("loopback"),
+        get_config_value("loopback", "max"),
+        get_config_value("loopback", "min"),
+    )
+    steps = get_and_clamp_int(
+        data,
+        "steps",
+        get_config_value("steps"),
+        get_config_value("steps", "max"),
+        get_config_value("steps", "min"),
+    )
+    height = get_and_clamp_int(
+        data,
+        "height",
+        get_config_value("height"),
+        get_config_value("height", "max"),
+        get_config_value("height", "min"),
+    )
+    width = get_and_clamp_int(
+        data,
+        "width",
+        get_config_value("width"),
+        get_config_value("width", "max"),
+        get_config_value("width", "min"),
+    )
+    tiled_vae = get_boolean(data, "tiledVAE", get_config_value("tiledVAE"))
+    tiles = get_and_clamp_int(
+        data,
+        "tiles",
+        get_config_value("tiles"),
+        get_config_value("tiles", "max"),
+        get_config_value("tiles", "min"),
+    )
+    overlap = get_and_clamp_float(
+        data,
+        "overlap",
+        get_config_value("overlap"),
+        get_config_value("overlap", "max"),
+        get_config_value("overlap", "min"),
+    )
+    stride = get_and_clamp_int(
+        data,
+        "stride",
+        get_config_value("stride"),
+        get_config_value("stride", "max"),
+        get_config_value("stride", "min"),
+    )
+
+    if stride > tiles:
+        logger.info("limiting stride to tile size, %s > %s", stride, tiles)
+        stride = tiles
+
+    seed = int(data.get("seed", -1))
+    if seed == -1:
+        # this one can safely use np.random because it produces a single value
+        seed = np.random.randint(np.iinfo(np.int32).max)
+
+    logger.debug(
+        "parsed parameters for %s steps of %s using %s in %s on %s, %sx%s, %s, %s - %s",
+        steps,
+        scheduler,
+        model_path,
+        pipeline,
+        device or "any device",
+        width,
+        height,
+        cfg,
+        seed,
+        prompt,
+    )
+
+    params = ImageParams(
+        model_path,
+        pipeline,
+        scheduler,
+        prompt,
+        cfg,
+        steps,
+        seed,
+        eta=eta,
+        negative_prompt=negative_prompt,
+        batch=batch,
+        # TODO: control=control,
+        loopback=loopback,
+        tiled_vae=tiled_vae,
+        tiles=tiles,
+        overlap=overlap,
+        stride=stride,
+    )
+    size = Size(width, height)
+    return (device, params, size)
+
+
 def pipeline_from_request(
     server: ServerContext,
     default_pipeline: str = "txt2img",
From 1fb965633ed339bafb3097b21a6cb485af29f41b Mon Sep 17 00:00:00 2001
From: Sean Sube
Date: Sun, 10 Sep 2023 20:59:13 -0500
Subject: [PATCH 008/240] read chain pipeline from JSON, remove new endpoint

---
 api/onnx_web/chain/__init__.py       |   2 +
 api/onnx_web/chain/blend_grid.py     |  47 +++++++++++
 api/onnx_web/chain/source_noise.py   |   8 +-
 api/onnx_web/chain/source_s3.py      |   9 ++-
 api/onnx_web/chain/source_txt2img.py |  14 ++--
 api/onnx_web/chain/source_url.py     |   6 +-
 api/onnx_web/server/api.py           |  76 +++--------------
 api/schemas/generate.yaml            | 119 +++++++++++++++++++++++++++
 8 files changed, 204 insertions(+), 77 deletions(-)
 create mode 100644 api/onnx_web/chain/blend_grid.py
 create mode 100644 api/schemas/generate.yaml

diff --git a/api/onnx_web/chain/__init__.py b/api/onnx_web/chain/__init__.py
index e0e23a30..df2ac80e 100644
--- a/api/onnx_web/chain/__init__.py
+++ b/api/onnx_web/chain/__init__.py
@@ -1,5 +1,6 @@
 from .base import ChainPipeline, PipelineStage, StageParams
 from .blend_img2img import BlendImg2ImgStage
+from .blend_grid import BlendGridStage
 from .blend_linear import BlendLinearStage
 from .blend_mask import BlendMaskStage
 from .correct_codeformer import CorrectCodeformerStage
@@ -23,6 +24,7 @@ from .upscale_swinir import UpscaleSwinIRStage
 CHAIN_STAGES = {
     "blend-img2img": BlendImg2ImgStage,
     "blend-inpaint": UpscaleOutpaintStage,
+    "blend-grid": BlendGridStage,
     "blend-linear": BlendLinearStage,
     "blend-mask": BlendMaskStage,
     "correct-codeformer": CorrectCodeformerStage,
diff --git a/api/onnx_web/chain/blend_grid.py b/api/onnx_web/chain/blend_grid.py
new file mode 100644
index 00000000..51472a42
--- /dev/null
+++ b/api/onnx_web/chain/blend_grid.py
@@ -0,0 +1,47 @@
+from logging import getLogger
+from typing import List, Optional
+
+from PIL import Image
+
+from ..params import ImageParams, StageParams
+from ..server import ServerContext
+from ..worker import ProgressCallback, WorkerContext
+from .stage import BaseStage
+
+logger = getLogger(__name__)
+
+
+class BlendGridStage(BaseStage):
+    def run(
+        self,
+        _worker: WorkerContext,
+        _server: ServerContext,
+        _stage: StageParams,
+        _params: ImageParams,
+        sources: List[Image.Image],
+        *,
+        height: int,
+        width: int,
+        rows: Optional[List[str]] = None,
+        columns: Optional[List[str]] = None,
+        title: Optional[str] = None,
+        order: Optional[List[int]] = None,
+        stage_source: Optional[Image.Image] = None,
+        _callback: Optional[ProgressCallback] = None,
+        **kwargs,
+    ) -> List[Image.Image]:
+        logger.info("combining source images using grid layout")
+
+        size = sources[0].size
+
+        output = Image.new("RGB", (size[0] * width, size[1] * height))
+
+        # TODO: labels
+        for i in order or range(len(sources)):
+            x = i % width
+            y = i // width
+
+            output.paste(sources[i], (x * size[0], y * size[1]))
+
+        return [output]
+
diff --git a/api/onnx_web/chain/source_noise.py b/api/onnx_web/chain/source_noise.py
index 1ee68f42..5e6035d8 100644
--- a/api/onnx_web/chain/source_noise.py
+++ b/api/onnx_web/chain/source_noise.py
@@ -28,11 +28,13 @@ class SourceNoiseStage(BaseStage):
         logger.info("generating image from noise source")
 
         if len(sources) > 0:
-            logger.warning(
-                "source images were passed to a noise stage and will be discarded"
+            logger.info(
+                "source images were passed to a source stage, new images will be appended"
             )
 
-        outputs = []
+        outputs = list(sources)
+
+        # TODO: looping over sources and ignoring params does not make much sense for a source stage
         for source in sources:
             output = noise_source(source, (size.width, size.height), (0, 0))
 
diff --git a/api/onnx_web/chain/source_s3.py b/api/onnx_web/chain/source_s3.py
index 900270a3..55f8f228 100644
--- a/api/onnx_web/chain/source_s3.py
+++ b/api/onnx_web/chain/source_s3.py
@@ -20,7 +20,7 @@ class SourceS3Stage(BaseStage):
         _server: ServerContext,
         _stage: StageParams,
         _params: ImageParams,
-        _sources: List[Image.Image],
+        sources: List[Image.Image],
         *,
         source_keys: List[str],
         bucket: str,
@@ -31,7 +31,12 @@ class SourceS3Stage(BaseStage):
         session = Session(profile_name=profile_name)
         s3 = session.client("s3", endpoint_url=endpoint_url)
 
-        outputs = []
+        if len(sources) > 0:
+            logger.info(
+                "source images were passed to a source stage, new images will be appended"
+            )
+
+        outputs = list(sources)
         for key in source_keys:
             try:
                 logger.info("loading image from s3://%s/%s", bucket, key)
diff --git a/api/onnx_web/chain/source_txt2img.py b/api/onnx_web/chain/source_txt2img.py
index cc642d55..82d9aebe 100644
--- a/api/onnx_web/chain/source_txt2img.py
+++ b/api/onnx_web/chain/source_txt2img.py
@@ -1,5 +1,5 @@
 from logging import getLogger
-from typing import Optional, Tuple
+from typing import List, Optional, Tuple
 
 import numpy as np
 import torch
@@ -30,7 +30,7 @@ class SourceTxt2ImgStage(BaseStage):
         server: ServerContext,
         stage: StageParams,
         params: ImageParams,
-        _source: Image.Image,
+        sources: List[Image.Image],
         *,
         dims: Tuple[int, int, int],
         size: Size,
@@ -50,9 +50,9 @@ class SourceTxt2ImgStage(BaseStage):
             "generating image using txt2img, %s steps: %s", params.steps, params.prompt
         )
 
-        if "stage_source" in kwargs:
-            logger.warning(
-                "a source image was passed to a txt2img stage, and will be discarded"
+        if len(sources):
+            logger.info(
+                "source images were passed to a source stage, new images will be appended"
             )
 
         prompt_pairs, loras, inversions, (prompt, negative_prompt) = parse_prompt(
@@ -123,4 +123,6 @@ class SourceTxt2ImgStage(BaseStage):
             callback=callback,
         )
 
-        return result.images
+        output = list(sources)
+        output.extend(result.images)
+        return output
diff --git a/api/onnx_web/chain/source_url.py b/api/onnx_web/chain/source_url.py
index 5fa54b67..54f86c54 100644
--- a/api/onnx_web/chain/source_url.py
+++ b/api/onnx_web/chain/source_url.py
@@ -29,11 +29,11 @@ class SourceURLStage(BaseStage):
         logger.info("loading image from URL source")
 
         if len(sources) > 0:
-            logger.warning(
-                "a source image was passed to a source stage, and will be discarded"
+            logger.info(
+                "source images were passed to a source stage, new images will be appended"
            )
 
-        outputs = []
+        outputs = list(sources)
         for url in source_urls:
             response = requests.get(url)
             output = Image.open(BytesIO(response.content))
diff --git a/api/onnx_web/server/api.py b/api/onnx_web/server/api.py
index 8e046440..b97ab36a 100644
--- a/api/onnx_web/server/api.py
+++ b/api/onnx_web/server/api.py
@@ -368,16 +368,21 @@ def upscale(server: ServerContext, pool: DevicePoolExecutor):
 
 
 def chain(server: ServerContext, pool: DevicePoolExecutor):
-    logger.debug(
-        "chain pipeline request: %s, %s", request.form.keys(), request.files.keys()
-    )
-    body = request.form.get("chain") or request.files.get("chain")
-    if body is None:
-        return error_reply("chain pipeline must have a body")
+    if request.is_json:
+        logger.debug("chain pipeline request with JSON body")
+        data = request.get_json()
+    else:
+        logger.debug(
+            "chain pipeline request: %s, %s", request.form.keys(), request.files.keys()
+        )
+
+        body = request.form.get("chain") or request.files.get("chain")
+        if body is None:
+            return error_reply("chain pipeline must have a body")
+
+        data = load_config_str(body)
 
-    data = load_config_str(body)
     schema = load_config("./schemas/chain.yaml")
-
     logger.debug("validating chain request: %s against %s", data, schema)
     validate(data, schema)
@@ -515,61 +520,6 @@ def txt2txt(server: ServerContext, pool: DevicePoolExecutor):
     return jsonify(json_params(output, params, size))
 
 
-def generate(server: ServerContext, pool: DevicePoolExecutor):
-    if not request.is_json:
-        return error_reply("generate endpoint requires JSON parameters")
-
-    # TODO: should this accept YAML as well?
-    data = request.get_json()
-    schema = load_config("./schemas/generate.yaml")
-
-    logger.debug("validating generate request: %s against %s", data, schema)
-    validate(data, schema)
-
-    jobs = []
-
-    if "txt2img" in data:
-        for job in data.get("txt2img"):
-            device, params, size = pipeline_from_json(server, job, "txt2img")
-            jobs.append((
-                f"generate-txt2img-{len(jobs)}",
-                run_txt2img_pipeline,
-                server,
-                params,
-                size,
-                make_output_name(server, "txt2img", params, size, offset=len(jobs)),
-                None,
-                None,
-                device,
-            ))
-
-    if "img2img" in data:
-        for job in data.get("img2img"):
-            device, params, size = pipeline_from_json(server, job, "img2img")
-            jobs.append((
-                f"generate-img2img-{len(jobs)}",
-                run_img2img_pipeline,
-                server,
-                params,
-                size,
-                make_output_name(server, "img2img", params, size, offset=len(jobs)),
-                None,
-                None,
-                device,
-            ))
-
-    for job in jobs:
-        pool.submit(*job)
-
-    # TODO: collect results
-    # This is the hard part: once all of the jobs are done, the last job or some dedicated
-    # job needs to collect the previous outputs and put them on a grid. Jobs write their own
-    # output to disk and do not return it, so that job may need to read the images back using
-    # the output names assigned to each job. Knowing when the jobs are done is the first problem.
-
-    # TODO: assemble grid
-
-
 def cancel(server: ServerContext, pool: DevicePoolExecutor):
     output_file = request.args.get("output", None)
     if output_file is None:
diff --git a/api/schemas/generate.yaml b/api/schemas/generate.yaml
new file mode 100644
index 00000000..8666468e
--- /dev/null
+++ b/api/schemas/generate.yaml
@@ -0,0 +1,119 @@
+$id: TODO
+$schema: https://json-schema.org/draft/2020-12/schema
+
+$defs:
+  grid:
+    type: object
+    additionalProperties: False
+    required: [width, height]
+    properties:
+      width:
+        type: number
+      height:
+        type: number
+      labels:
+        type: object
+        additionalProperties: False
+        properties:
+          title:
+            type: string
+          rows:
+            type: array
+            items:
+              type: string
+          columns:
+            type: array
+            items:
+              type: string
+          order:
+            type: array
+            items:
+              type: number
+
+  job_base:
+    type: object
+    additionalProperties: true
+    required: [
+      device,
+      model,
+      pipeline,
+      scheduler,
+      prompt,
+      cfg,
+      steps,
+      seed,
+    ]
+    properties:
+      batch:
+        type: number
+      device:
+        type: string
+      model:
+        type: string
+      control:
+        type: string
+      pipeline:
+        type: string
+      scheduler:
+        type: string
+      prompt:
+        type: string
+      negative_prompt:
+        type: string
+      cfg:
+        type: number
+      eta:
+        type: number
+      steps:
+        type: number
+      tiled_vae:
+        type: boolean
+      tiles:
+        type: number
+      overlap:
+        type: number
+      seed:
+        type: number
+      stride:
+        type: number
+
+  job_txt2img:
+    allOf:
+      - $ref: "#/$defs/job_base"
+      - type: object
+        additionalProperties: true
+        required: [
+          height,
+          width,
+        ]
+        properties:
+          width:
+            type: number
+          height:
+            type: number
+
+  job_img2img:
+    allOf:
+      - $ref: "#/$defs/job_base"
+      - type: object
+        additionalProperties: true
+        required: []
+        properties:
+          loopback:
+            type: number
+
+type: object
+additionalProperties: False
+properties:
+  txt2img:
+    type: array
+    items:
+      $ref: "#/$defs/job_txt2img"
+  img2img:
+    type: array
+    items:
+      $ref: "#/$defs/job_img2img"
+  grid:
+    type: array
+    items:
+      $ref: "#/$defs/grid"
From 9d4272eb09e27df1e6d806b5bb2c619e70d8979e Mon Sep 17 00:00:00 2001
From: Sean Sube
Date: Sun, 10 Sep 2023 20:59:33 -0500
Subject: [PATCH 009/240] add basic variables to txt2img tab

---
 gui/src/client/api.ts                         |  11 ++
 gui/src/client/local.ts                       |   3 +
 gui/src/client/types.ts                       |  18 +++
 gui/src/client/utils.ts                       |  42 +++++++
 gui/src/components/card/ErrorCard.tsx         |  11 +-
 .../components/control/VariableControl.tsx    | 107 ++++++++++++++++++
 gui/src/components/tab/Txt2Img.tsx            |  25 +++-
 gui/src/state.ts                              |  31 ++++-
 8 files changed, 239 insertions(+), 9 deletions(-)
 create mode 100644 gui/src/client/utils.ts
 create mode 100644 gui/src/components/control/VariableControl.tsx

diff --git a/gui/src/client/api.ts b/gui/src/client/api.ts
index 6bed1e46..1271caab 100644
--- a/gui/src/client/api.ts
+++ b/gui/src/client/api.ts
@@ -7,6 +7,7 @@ import {
   ApiClient,
   BaseImgParams,
   BlendParams,
+  ChainPipeline,
   FilterResponse,
   HighresParams,
   ImageResponse,
@@ -430,6 +431,16 @@ export function makeClient(root: string, token: Maybe<string> = undefined, f = f
       }
     };
   },
+  async chain(chain: ChainPipeline): Promise<ImageResponse> {
+    const url = makeApiUrl(root, 'chain');
+    const body = JSON.stringify(chain);
+
+    // eslint-disable-next-line no-return-await
+    return await parseRequest(url, {
+      body,
+      method: 'POST',
+    });
+  },
   async ready(key: string): Promise<ReadyResponse> {
     const path = makeApiUrl(root, 'ready');
     path.searchParams.append('output', key);
diff --git a/gui/src/client/local.ts b/gui/src/client/local.ts
index 97f785a8..273e5168 100644
--- a/gui/src/client/local.ts
+++ b/gui/src/client/local.ts
@@ -39,6 +39,9 @@ export const LOCAL_CLIENT = {
   async outpaint(model, params, upscale) {
     throw new NoServerError();
   },
+  async chain(chain) {
+    throw new NoServerError();
+  },
   async noises() {
     throw new NoServerError();
   },
diff --git a/gui/src/client/types.ts b/gui/src/client/types.ts
index b9d22495..d1912d7b 100644
--- a/gui/src/client/types.ts
+++ b/gui/src/client/types.ts
@@ -162,6 +162,22 @@ export interface HighresParams {
   highresStrength: number;
 }
 
+export interface Txt2ImgStage {
+  name: string;
+  type: 'source-txt2img';
+  params: Txt2ImgParams;
+}
+
+export interface Img2ImgStage {
+  name: string;
+  type: 'blend-img2img';
+  params: Img2ImgParams;
+}
+
+export interface ChainPipeline {
+  stages: Array<Txt2ImgStage | Img2ImgStage>;
+}
+
 /**
  * Output image data within the response.
  */
@@ -354,6 +370,8 @@ export interface ApiClient {
    */
   blend(model: ModelParams, params: BlendParams, upscale?: UpscaleParams): Promise<ImageResponse>;
 
+  chain(chain: ChainPipeline): Promise<ImageResponse>;
+
   /**
    * Check whether job has finished and its output is ready.
   */
diff --git a/gui/src/client/utils.ts b/gui/src/client/utils.ts
new file mode 100644
index 00000000..d1d69141
--- /dev/null
+++ b/gui/src/client/utils.ts
@@ -0,0 +1,42 @@
+import { ChainPipeline, HighresParams, ModelParams, Txt2ImgParams, UpscaleParams } from './types.js';
+
+export interface PipelineVariable {
+  parameter: 'prompt' | 'cfg' | 'seed' | 'steps';
+  input: string;
+  values: Array<string>;
+}
+
+export interface PipelineGrid {
+  enabled: boolean;
+  columns: PipelineVariable;
+  rows: PipelineVariable;
+}
+
+// eslint-disable-next-line max-params
+export function buildPipelineForTxt2ImgGrid(grid: PipelineGrid, model: ModelParams, params: Txt2ImgParams, upscale?: UpscaleParams, highres?: HighresParams): ChainPipeline {
+  const pipeline: ChainPipeline = {
+    stages: [],
+  };
+
+  let i = 0;
+
+  for (const column of grid.columns.values) {
+    for (const row of grid.rows.values) {
+      pipeline.stages.push({
+        name: `cell-${i}`,
+        type: 'source-txt2img',
+        params: {
+          ...params,
+          [grid.columns.parameter]: column,
+          [grid.rows.parameter]: row,
+        },
+      });
+
+      i += 1;
+    }
+  }
+
+  // TODO: add final grid stage
+
+  return pipeline;
+}
diff --git a/gui/src/components/card/ErrorCard.tsx b/gui/src/components/card/ErrorCard.tsx
index fe683e67..9bb6e455 100644
--- a/gui/src/components/card/ErrorCard.tsx
+++ b/gui/src/components/card/ErrorCard.tsx
@@ -1,4 +1,4 @@
-import { mustExist } from '@apextoaster/js-utils';
+import { Maybe, doesExist, mustExist } from '@apextoaster/js-utils';
 import { Delete, Replay } from '@mui/icons-material';
 import { Alert, Box, Card, CardContent, IconButton, Tooltip } from '@mui/material';
 import { Stack } from '@mui/system';
@@ -15,7 +15,7 @@ import { ClientContext, ConfigContext, OnnxState, StateContext } from '../../sta
 export interface ErrorCardProps {
   image: ImageResponse;
   ready: ReadyResponse;
-  retry: RetryParams;
+  retry: Maybe<RetryParams>;
 }
 
 export function ErrorCard(props: ErrorCardProps) {
@@ -30,8 +30,11 @@ export function ErrorCard(props: ErrorCardProps) {
 
   async function retryImage() {
     removeHistory(image);
-    const { image: nextImage, retry: nextRetry } = await client.retry(retryParams);
-    pushHistory(nextImage, nextRetry);
+
+    if (doesExist(retryParams)) {
+      const { image: nextImage, retry: nextRetry } = await client.retry(retryParams);
+      pushHistory(nextImage, nextRetry);
+    }
   }
 
   const retry = useMutation(retryImage);
diff --git a/gui/src/components/control/VariableControl.tsx b/gui/src/components/control/VariableControl.tsx
new file mode 100644
index 00000000..cd159954
--- /dev/null
+++ b/gui/src/components/control/VariableControl.tsx
@@ -0,0 +1,107 @@
+import { doesExist, mustExist } from '@apextoaster/js-utils';
+import { Checkbox, FormControl, InputLabel, MenuItem, Select, Stack, TextField } from '@mui/material';
+import * as React from 'react';
+import { useContext } from 'react';
+import { useStore } from 'zustand';
+
+import { PipelineGrid } from '../../client/utils.js';
+import { OnnxState, StateContext } from '../../state.js';
+
+export interface VariableControlProps {
+  selectGrid: (state: OnnxState) => PipelineGrid;
+  setGrid: (grid: Partial<PipelineGrid>) => void;
+}
+
+export type VariableKey = 'prompt' | 'steps' | 'seed';
+
+export function VariableControl(props: VariableControlProps) {
+  const store = mustExist(useContext(StateContext));
+  const grid = useStore(store, props.selectGrid);
+
+  return <Stack direction='column' spacing={2}>
+    <Stack direction='row' spacing={2}>
+      <FormControl>
+        <InputLabel id='variable-grid'>Grid Mode</InputLabel>
+        <Checkbox checked={grid.enabled} onChange={() => props.setGrid({
+          enabled: grid.enabled === false,
+        })} />
+      </FormControl>
+    </Stack>
+    <Stack direction='row' spacing={2}>
+      <FormControl>
+        <InputLabel id='variable-columns'>Columns</InputLabel>
+        <TextField value={grid.columns.input} onChange={(event) => props.setGrid({
+          columns: {
+            parameter: grid.columns.parameter,
+            input: event.target.value,
+            values: rangeSplit(grid.columns.parameter, event.target.value),
+          },
+        })} />
+      </FormControl>
+    </Stack>
+    <Stack direction='row' spacing={2}>
+      <FormControl>
+        <InputLabel id='variable-rows'>Rows</InputLabel>
+        <TextField value={grid.rows.input} onChange={(event) => props.setGrid({
+          rows: {
+            parameter: grid.rows.parameter,
+            input: event.target.value,
+            values: rangeSplit(grid.rows.parameter, event.target.value),
+          },
+        })} />
+      </FormControl>
+    </Stack>
+  </Stack>;
+}
+
+export function rangeSplit(parameter: string, value: string): Array<string> {
+  // string values
+  if (parameter === 'prompt') {
+    return value.split('\n');
+  }
+
+  return value.split(',').map((it) => it.trim()).flatMap((it) => expandRanges(it));
+}
+
+export const EXPR_STRICT_NUMBER = /^[0-9]+$/;
+export const EXPR_NUMBER_RANGE = /^([0-9]+)-([0-9]+)$/;
+
+export function expandRanges(range: string): Array<string> {
+  if (EXPR_STRICT_NUMBER.test(range)) {
+    // entirely numeric, return without parsing
+    return [range];
+  }
+
+  if (EXPR_NUMBER_RANGE.test(range)) {
+    const match = EXPR_NUMBER_RANGE.exec(range);
+    if (doesExist(match)) {
+      const [_full, startStr, endStr] = Array.from(match);
+      const start = parseInt(startStr, 10);
+      const end = parseInt(endStr, 10);
+
+      return new Array(end - start).fill(0).map((_value, idx) => (idx + start).toFixed(0));
+    }
+  }
+
+  return [];
+}
diff --git a/gui/src/components/tab/Txt2Img.tsx b/gui/src/components/tab/Txt2Img.tsx
index 76e669ce..d5347926 100644
--- a/gui/src/components/tab/Txt2Img.tsx
+++ b/gui/src/components/tab/Txt2Img.tsx
@@ -15,15 +15,27 @@ import { ModelControl } from '../control/ModelControl.js';
 import { UpscaleControl } from '../control/UpscaleControl.js';
 import { NumericField } from '../input/NumericField.js';
 import { Profiles } from '../Profiles.js';
+import { VariableControl } from '../control/VariableControl.js';
+import { PipelineGrid, buildPipelineForTxt2ImgGrid } from '../../client/utils.js';
 
 export function Txt2Img() {
   const { params } = mustExist(useContext(ConfigContext));
 
   async function generateImage() {
     const state = store.getState();
-    const { image, retry } = await client.txt2img(model, selectParams(state), selectUpscale(state), selectHighres(state));
+    const grid = selectVariable(state);
+    const params2 = selectParams(state);
+    const upscale = selectUpscale(state);
+    const highres = selectHighres(state);
 
-    pushHistory(image, retry);
+    if (grid.enabled) {
+      const chain = buildPipelineForTxt2ImgGrid(grid, model, params2, upscale, highres);
+      const image = await client.chain(chain);
+      pushHistory(image);
+    } else {
+      const { image, retry } = await client.txt2img(model, params2, upscale, highres);
+      pushHistory(image, retry);
+    }
   }
 
   const client = 
mustExist(useContext(ClientContext)); @@ -33,7 +45,7 @@ export function Txt2Img() { }); const store = mustExist(useContext(StateContext)); - const { pushHistory, setHighres, setModel, setParams, setUpscale } = useStore(store, selectActions, shallow); + const { pushHistory, setHighres, setModel, setParams, setUpscale, setVariable } = useStore(store, selectActions, shallow); const { height, width } = useStore(store, selectReactParams, shallow); const model = useStore(store, selectModel); @@ -79,6 +91,7 @@ export function Txt2Img() { +