feat(api): add parameters for noise source and blend op to inpaint

2023-01-15 09:21:09 -06:00 · 2023-01-15 09:21:09 -06:00 · e403980a44
parent 77470a610a
commit e403980a44
2 changed files with 104 additions and 15 deletions
--- a/api/onnx_web/image.py
+++ b/api/onnx_web/image.py
@ -13,9 +13,26 @@ def blend_imult(a):
    return 1.0 - blend_mult(a)
-def blend_mask_inverse_source(source: Tuple[int, int, int], mask: Tuple[int, int, int], noise: Tuple[int, int, int]) -> Tuple[int, int, int]:
+def blend_mask_source(source: Tuple[int, int, int], mask: Tuple[int, int, int], noise: Tuple[int, int, int]) -> Tuple[int, int, int]:
    '''
    Blend operation, linear interpolation from noise to source based on mask: `(s * (1 - m)) + (n * m)`
    Black = noise
    White = source
    '''
    return (
        int((source[0] * blend_mult(mask[0])) +
            (noise[0] * blend_imult(mask[0]))),
        int((source[1] * blend_mult(mask[1])) +
            (noise[1] * blend_imult(mask[1]))),
        int((source[2] * blend_mult(mask[2])) +
            (noise[2] * blend_imult(mask[2]))),
    )
 def blend_source_mask(source: Tuple[int, int, int], mask: Tuple[int, int, int], noise: Tuple[int, int, int]) -> Tuple[int, int, int]:
    '''
    Blend operation, linear interpolation from source to noise based on mask: `(s * (1 - m)) + (n * m)`
    Black = source
    White = noise
    '''
    return (
        int((source[0] * blend_imult(mask[0])) +
@ -27,20 +44,28 @@ def blend_mask_inverse_source(source: Tuple[int, int, int], mask: Tuple[int, int
    )
-def noise_source_original(source_image: Image, dims: Tuple[int, int], origin: Tuple[int, int]) -> Tuple[float, float, float]:
+def noise_source_fill(source_image: Image, dims: Tuple[int, int], origin: Tuple[int, int], fill='white') -> Tuple[float, float, float]:
    '''
    Identity transform, source image centered on white canvas.
    '''
    width, height = dims
-    noise = Image.new('RGB', (width, height), 'white')
+    noise = Image.new('RGB', (width, height), fill)
    noise.paste(source_image, origin)
    return noise
-def noise_source_gaussian(source_image: Image, dims: Tuple[int, int], origin: Tuple[int, int]) -> Tuple[float, float, float]:
+def noise_source_gaussian(source_image: Image, dims: Tuple[int, int], origin: Tuple[int, int], rounds=3) -> Tuple[float, float, float]:
    '''
    Gaussian blur, source image centered on white canvas.
    '''
    width, height = dims
    noise = Image.new('RGB', (width, height), 'white')
    noise.paste(source_image, origin)
    for i in range(rounds):
        noise.filter(ImageFilter.GaussianBlur(5))
    return noise
@ -127,7 +152,7 @@ def expand_image(
        expand_by: Tuple[int, int, int, int],
        fill='white',
        noise_source=noise_source_histogram,
-        blend_op=blend_mask_inverse_source
+        blend_op=blend_source_mask
 ):
    left, right, top, bottom = expand_by
--- a/api/onnx_web/serve.py
+++ b/api/onnx_web/serve.py
@ -29,7 +29,7 @@ from struct import pack
 from os import environ, makedirs, path, scandir
 from typing import Any, Dict, Tuple, Union
-from .image import expand_image
+from .image import expand_image, noise_source_gaussian, noise_source_histogram, noise_source_normal, noise_source_fill, noise_source_uniform, blend_source_mask, blend_imult, blend_mask_source, blend_mult
 import json
 import numpy as np
@ -72,6 +72,17 @@ pipeline_schedulers = {
    'lms-discrete': LMSDiscreteScheduler,
    'pndm': PNDMScheduler,
 }
 noise_sources = {
    'fill': noise_source_fill,
    'gaussian': noise_source_gaussian,
    'histogram': noise_source_histogram,
    'normal': noise_source_normal,
    'uniform': noise_source_uniform,
 }
 blend_modes = {
    'mask-source': blend_mask_source,
    'source-mask': blend_source_mask,
 }
 def get_and_clamp_float(args, key: str, default_value: float, max_value: float, min_value=0.0) -> float:
@ -264,7 +275,27 @@ def run_img2img_pipeline(model, provider, scheduler, prompt, negative_prompt, cf
    print('saved img2img output: %s' % (output))
-def run_inpaint_pipeline(model, provider, scheduler, prompt, negative_prompt, cfg, steps, seed, output, height, width, source_image, mask_image, left, right, top, bottom):
+def run_inpaint_pipeline(
    model: str,
    provider: str,
    scheduler: Any,
    prompt: str,
    negative_prompt: Union[str, None],
    cfg: float,
    steps: int,
    seed: int,
    output: str,
    height: int,
    width: int,
    source_image: Image,
    mask_image: Image,
    left: int,
    right: int,
    top: int,
    bottom: int,
    noise_source: Any,
    blend_op: Any
 ):
    pipe = load_pipeline(OnnxStableDiffusionInpaintPipeline,
                         model, provider, scheduler)
@ -273,7 +304,12 @@ def run_inpaint_pipeline(model, provider, scheduler, prompt, negative_prompt, cf
    if left > 0 or right > 0 or top > 0 or bottom > 0:
        print('expanding image for outpainting')
-        source_image, mask_image, _full_noise, _full_dims = expand_image(source_image, mask_image, (left, right, top, bottom))
+        source_image, mask_image, _full_noise, _full_dims = expand_image(
            source_image,
            mask_image,
            (left, right, top, bottom),
            noise_source=noise_source,
            blend_op=blend_op)
    image = pipe(
        prompt,
@ -445,10 +481,18 @@ def inpaint():
    (model, provider, scheduler, prompt, negative_prompt, cfg, steps, height,
     width, seed) = pipeline_from_request()
-    left = get_and_clamp_int(request.args, 'left', 0, config_params.get('width').get('max'), 0)
+    left = get_and_clamp_int(request.args, 'left', 0,
-    right = get_and_clamp_int(request.args, 'right', 0, config_params.get('width').get('max'), 0)
+                             config_params.get('width').get('max'), 0)
-    top = get_and_clamp_int(request.args, 'top', 0, config_params.get('height').get('max'), 0)
+    right = get_and_clamp_int(request.args, 'right',
-    bottom = get_and_clamp_int(request.args, 'bottom', 0, config_params.get('height').get('max'), 0)
+                              0, config_params.get('width').get('max'), 0)
    top = get_and_clamp_int(request.args, 'top', 0,
                            config_params.get('height').get('max'), 0)
    bottom = get_and_clamp_int(
        request.args, 'bottom', 0, config_params.get('height').get('max'), 0)
    noise_source = get_from_map(
        request.args, 'noise', noise_sources, 'histogram')
    blend_op = get_from_map(request.args, 'blend', blend_modes, 'mask-source')
    (output_file, output_full) = make_output_path(
        'inpaint', seed, (prompt, cfg, steps, height, width, seed, left, right, top, bottom))
@ -456,8 +500,28 @@ def inpaint():
    source_image.thumbnail((width, height))
    mask_image.thumbnail((width, height))
-    executor.submit_stored(output_file, run_inpaint_pipeline, model, provider, scheduler, prompt, negative_prompt,
+    executor.submit_stored(
-                           cfg, steps, seed, output_full, height, width, source_image, mask_image, left, right, top, bottom)
+        output_file,
        run_inpaint_pipeline,
        model,
        provider,
        scheduler,
        prompt,
        negative_prompt,
        cfg,
        steps,
        seed,
        output_full,
        height,
        width,
        source_image,
        mask_image,
        left,
        right,
        top,
        bottom,
        noise_source,
        blend_op)
    return jsonify({
        'output': output_file,