onnx-web/api/onnx_web/upscale.py

from basicsr.archs.rrdbnet_arch import RRDBNet
from diffusers import (
    AutoencoderKL,
    DDPMScheduler,
    StableDiffusionUpscalePipeline,
)
from gfpgan import GFPGANer
from os import path
from PIL import Image
from realesrgan import RealESRGANer
from typing import Literal, Optional

import numpy as np
import torch

from .chain import (
    ChainPipeline,
    StageParams,
)
from .onnx import (
    ONNXNet,
    OnnxStableDiffusionUpscalePipeline,
)
from .utils import (
    ImageParams,
    ServerContext,
    Size,
)


class UpscaleParams():
    '''
    Plain settings holder for the upscaling and face correction stages.

    Every constructor argument is stored on the instance under the same
    name; nothing is validated or converted here.
    '''

    def __init__(
        self,
        upscale_model: str,
        provider: str,
        correction_model: Optional[str] = None,
        denoise: float = 0.5,
        faces=True,
        face_strength: float = 0.5,
        format: Literal['onnx', 'pth'] = 'onnx',
        half=False,
        outscale: int = 1,
        scale: int = 4,
        pre_pad: int = 0,
        tile_pad: int = 10,
    ) -> None:
        # which upscaling model to load and where to run it
        self.upscale_model = upscale_model
        self.provider = provider

        # face correction model and blending controls
        self.correction_model = correction_model
        self.denoise = denoise
        self.faces = faces
        self.face_strength = face_strength

        # model file format and precision
        self.format = format
        self.half = half

        # scaling factors and tile padding
        self.outscale = outscale
        self.pre_pad = pre_pad
        self.scale = scale
        self.tile_pad = tile_pad

    def resize(self, size: Size) -> Size:
        '''
        Return a new Size with the width and height of `size` multiplied
        by `outscale`.
        '''
        factor = self.outscale
        scaled_width = size.width * factor
        scaled_height = size.height * factor
        return Size(scaled_width, scaled_height)


def load_resrgan(ctx: ServerContext, params: UpscaleParams, tile=0):
    '''
    Build a RealESRGANer upsampler for the model named in `params`.

    The model file is looked up as `<upscale_model>.<format>` inside
    `ctx.model_path`. The 'onnx' format wraps the file in an ONNXNet using
    `params.provider`; the 'pth' format builds an RRDBNet.

    Args:
        ctx: server context, read for `model_path`.
        params: upscaling settings (model name, format, scale, padding, etc).
        tile: tile size forwarded to RealESRGANer.

    Returns:
        The configured RealESRGANer instance.

    Raises:
        Exception: when the model file does not exist, or when
            `params.format` is neither 'onnx' nor 'pth'.

    TODO: cache this instance
    '''
    model_file = '%s.%s' % (params.upscale_model, params.format)
    model_path = path.join(ctx.model_path, model_file)
    if not path.isfile(model_path):
        raise Exception('Real ESRGAN model not found at %s' % model_path)

    # use ONNX acceleration, if available
    if params.format == 'onnx':
        model = ONNXNet(ctx, model_file, provider=params.provider)
    elif params.format == 'pth':
        model = RRDBNet(num_in_ch=3, num_out_ch=3, num_feat=64,
                        num_block=23, num_grow_ch=32, scale=params.scale)
    else:
        # only reached for formats that are neither ONNX nor PTH
        raise Exception('unknown platform %s' % params.format)

    dni_weight = None
    if params.upscale_model == 'realesr-general-x4v3' and params.denoise != 1:
        wdn_model_path = model_path.replace(
            'realesr-general-x4v3', 'realesr-general-wdn-x4v3')
        # NOTE(review): this path pair is not what RealESRGANer receives
        # below (it gets a freshly built .pth path), so only dni_weight is
        # forwarded - confirm whether the blend is meant to take effect
        model_path = [model_path, wdn_model_path]
        dni_weight = [params.denoise, 1 - params.denoise]

    # TODO: shouldn't need the PTH file
    upsampler = RealESRGANer(
        scale=params.scale,
        model_path=path.join(ctx.model_path, '%s.pth' % params.upscale_model),
        dni_weight=dni_weight,
        model=model,
        tile=tile,
        tile_pad=params.tile_pad,
        pre_pad=params.pre_pad,
        half=params.half)

    return upsampler


def load_stable_diffusion(ctx: ServerContext, upscale: UpscaleParams):
    '''
    Create the Stable Diffusion upscaling pipeline chosen by `upscale.format`.

    For the 'onnx' format the pipeline is loaded from `upscale.upscale_model`
    under `ctx.model_path`; any other format loads the
    'stabilityai/stable-diffusion-x4-upscaler' pipeline by name.

    TODO: cache this instance
    '''
    if upscale.format != 'onnx':
        return StableDiffusionUpscalePipeline.from_pretrained(
            'stabilityai/stable-diffusion-x4-upscaler')

    model_path = path.join(ctx.model_path, upscale.upscale_model)

    # Loading the ONNX pipeline without these two components failed with:
    #   ValueError: Pipeline <class 'onnx_web.onnx.pipeline_onnx_stable_diffusion_upscale.OnnxStableDiffusionUpscalePipeline'>
    #   expected {'vae', 'unet', 'text_encoder', 'tokenizer', 'scheduler', 'low_res_scheduler'},
    #   but only {'scheduler', 'tokenizer', 'text_encoder', 'unet'} were passed.
    # so the VAE and the low-res scheduler are loaded and passed explicitly.
    vae = AutoencoderKL.from_pretrained(model_path, subfolder='vae_encoder')
    low_res_scheduler = DDPMScheduler.from_pretrained(
        model_path, subfolder='scheduler')

    return OnnxStableDiffusionUpscalePipeline.from_pretrained(
        model_path,
        vae=vae,
        low_res_scheduler=low_res_scheduler,
    )


def upscale_resrgan(
    ctx: ServerContext,
    stage: StageParams,
    params: ImageParams,
    source_image: Image.Image,
    *,
    upscale: UpscaleParams,
) -> Image.Image:
    '''
    Upscale `source_image` with Real ESRGAN and return the result as an
    RGB PIL image.

    Args:
        ctx: server context, forwarded to load_resrgan.
        stage: stage settings; `tile_size` is used as the upsampler tile.
        params: image parameters (not read by this stage).
        source_image: the image to upscale.
        upscale: upscaling settings; `outscale` is passed to the upsampler.

    Raises:
        Exception: propagated from load_resrgan when the model cannot be
            loaded.
    '''
    print('upscaling image with Real ESRGAN', upscale.scale)

    # the upsampler is given a numpy array, not a PIL image
    output = np.array(source_image)
    upsampler = load_resrgan(ctx, upscale, tile=stage.tile_size)

    # enhance returns a pair; only the first element (the image) is kept
    output, _ = upsampler.enhance(output, outscale=upscale.outscale)

    output = Image.fromarray(output, 'RGB')
    print('final output image size', output.size)
    return output


def upscale_gfpgan(
    ctx: ServerContext,
    stage: StageParams,
    params: ImageParams,
    image: Image.Image,
    *,
    upscale: UpscaleParams,
    upsampler: Optional[RealESRGANer] = None,
) -> Image.Image:
    '''
    Run GFPGAN face correction on `image` and return a PIL image.

    When `upscale.correction_model` is None the input image is returned
    unchanged.

    Args:
        ctx: server context, read for `model_path`.
        stage: stage settings (not read by this stage).
        params: image parameters (not read by this stage).
        image: the image to correct.
        upscale: upscaling settings; `correction_model`, `outscale` and
            `face_strength` are used here.
        upsampler: optional background upsampler; when omitted one is built
            with load_resrgan.

    Raises:
        Exception: propagated from load_resrgan when no upsampler was given
            and the Real ESRGAN model cannot be loaded.
    '''
    if upscale.correction_model is None:
        print('no face model given, skipping')
        return image

    print('correcting faces with GFPGAN model: %s' % upscale.correction_model)

    if upsampler is None:
        upsampler = load_resrgan(ctx, upscale)

    face_path = path.join(ctx.model_path, '%s.pth' %
                          (upscale.correction_model))

    # TODO: doesn't have a model param, not sure how to pass ONNX model
    face_enhancer = GFPGANer(
        model_path=face_path,
        upscale=upscale.outscale,
        arch='clean',
        channel_multiplier=2,
        bg_upsampler=upsampler)

    # GFPGAN works on numpy arrays, so convert on the way in and back to a
    # PIL image on the way out, the same way upscale_resrgan does.
    # NOTE(review): GFPGAN's own examples feed cv2-loaded (BGR) arrays; the
    # PIL channel order is passed through unchanged here - confirm colors.
    pixels = np.array(image)
    _, _, output = face_enhancer.enhance(
        pixels, has_aligned=False, only_center_face=False, paste_back=True, weight=upscale.face_strength)

    return Image.fromarray(output, 'RGB')


def upscale_stable_diffusion(
    ctx: ServerContext,
    stage: StageParams,
    params: ImageParams,
    source: Image.Image,
    *,
    upscale: UpscaleParams,
) -> Image.Image:
    '''
    Upscale `source` with the Stable Diffusion upscaling pipeline.

    The pipeline call is wrapped in a single-stage ChainPipeline, which is
    invoked with `ctx`, `params` and `source`.

    Args:
        ctx: server context, forwarded to load_stable_diffusion and the chain.
        stage: stage settings paired with the upscaling stage in the chain.
        params: image parameters; `seed`, `prompt` and `steps` are used.
        source: the image to upscale.
        upscale: upscaling settings used to load the pipeline.
    '''
    print('upscaling with Stable Diffusion')

    pipeline = load_stable_diffusion(ctx, upscale)
    generator = torch.manual_seed(params.seed)
    seed = generator.initial_seed()

    def upscale_stage(_ctx: ServerContext, stage: StageParams, params: ImageParams, image: Image.Image) -> Image.Image:
        # re-seed on every call so each invocation of the stage starts from
        # the same seed
        return pipeline(
            params.prompt,
            image,
            generator=torch.manual_seed(seed),
            num_inference_steps=params.steps,
        ).images[0]

    chain = ChainPipeline(stages=[
        (upscale_stage, stage)
    ])
    return chain(ctx, params, source)


def run_upscale_correction(
    ctx: ServerContext,
    stage: StageParams,
    params: ImageParams,
    image: Image.Image,
    *,
    upscale: UpscaleParams,
) -> Image.Image:
    '''
    Apply the upscaling step and then the face correction step to `image`.

    Upscaling only runs when `upscale.scale` is greater than 1, and the
    model name picks the implementation: names containing 'esrgan' use
    Real ESRGAN, names containing 'stable-diffusion' use Stable Diffusion,
    anything else leaves the image as it is. Face correction runs
    afterwards when `upscale.faces` is truthy.
    '''
    print('running upscale pipeline')

    wants_upscale = upscale.scale > 1
    if wants_upscale and 'esrgan' in upscale.upscale_model:
        stage = StageParams(
            tile_size=stage.tile_size, outscale=upscale.outscale)
        image = upscale_resrgan(ctx, stage, params, image, upscale=upscale)
    elif wants_upscale and 'stable-diffusion' in upscale.upscale_model:
        # Stable Diffusion upscaling is run with tiles of at most 128
        stage = StageParams(
            tile_size=min(128, stage.tile_size), outscale=upscale.outscale)
        image = upscale_stable_diffusion(
            ctx, stage, params, image, upscale=upscale)

    if not upscale.faces:
        return image

    stage = StageParams(tile_size=stage.tile_size, outscale=upscale.outscale)
    return upscale_gfpgan(ctx, stage, params, image, upscale=upscale)
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00			`from basicsr.archs.rrdbnet_arch import RRDBNet`
load additional components for SD upscaling 2023-01-26 03:29:18 +00:00			`from diffusers import (`
			`AutoencoderKL,`
			`DDPMScheduler,`
attempt to run SD upscaling in smaller tiles 2023-01-27 04:44:20 +00:00			`StableDiffusionUpscalePipeline,`
load additional components for SD upscaling 2023-01-26 03:29:18 +00:00			`)`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00			`from gfpgan import GFPGANer`
			`from os import path`
			`from PIL import Image`
			`from realesrgan import RealESRGANer`
feat(api): start implementing chain pipelines 2023-01-27 23:08:36 +00:00			`from typing import Literal, Optional`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00
fix(api): convert image to numpy before upscaling 2023-01-16 00:13:28 +00:00			`import numpy as np`
use a torch rng 2023-01-27 05:15:24 +00:00			`import torch`
fix(api): convert image to numpy before upscaling 2023-01-16 00:13:28 +00:00
feat(api): start implementing chain pipelines 2023-01-27 23:08:36 +00:00			`from .chain import (`
			`ChainPipeline,`
			`StageParams,`
attempt to run SD upscaling in smaller tiles 2023-01-27 04:44:20 +00:00			`)`
feat(api): initial support for Stable Diffusion upscaling (#66) 2023-01-26 03:04:00 +00:00			`from .onnx import (`
			`ONNXNet,`
			`OnnxStableDiffusionUpscalePipeline,`
			`)`
fix(api): get ESRGAN/GFPGAN paths from server context, clean up test scripts 2023-01-16 19:02:15 +00:00			`from .utils import (`
feat(api): start implementing chain pipelines 2023-01-27 23:08:36 +00:00			`ImageParams,`
fix(api): report accurate sizes 2023-01-16 21:11:40 +00:00			`ServerContext,`
			`Size,`
fix(api): get ESRGAN/GFPGAN paths from server context, clean up test scripts 2023-01-16 19:02:15 +00:00			`)`

feat(api): add ONNX implementation of Real ESRGAN net 2023-01-16 16:55:40 +00:00
fix(api): get ESRGAN/GFPGAN paths from server context, clean up test scripts 2023-01-16 19:02:15 +00:00			`class UpscaleParams():`
feat: add outscaling option 2023-01-16 20:52:56 +00:00			`def __init__(`
			`self,`
			`upscale_model: str,`
fix(api): pass hardware platform to upscaling pipeline (#77) 2023-01-22 22:35:53 +00:00			`provider: str,`
feat(api): start implementing chain pipelines 2023-01-27 23:08:36 +00:00			`correction_model: Optional[str] = None,`
feat: add outscaling option 2023-01-16 20:52:56 +00:00			`denoise: float = 0.5,`
			`faces=True,`
fix: send missing model params, add face strength control 2023-01-17 04:54:01 +00:00			`face_strength: float = 0.5,`
fix(api): pass hardware platform to upscaling pipeline (#77) 2023-01-22 22:35:53 +00:00			`format: Literal['onnx', 'pth'] = 'onnx',`
			`half=False,`
			`outscale: int = 1,`
			`scale: int = 4,`
feat(api): start implementing chain pipelines 2023-01-27 23:08:36 +00:00			`pre_pad: int = 0,`
			`tile_pad: int = 10,`
feat: add outscaling option 2023-01-16 20:52:56 +00:00			`) -> None:`
			`self.upscale_model = upscale_model`
fix(api): pass hardware platform to upscaling pipeline (#77) 2023-01-22 22:35:53 +00:00			`self.provider = provider`
feat(api): return all types of models 2023-01-17 02:10:52 +00:00			`self.correction_model = correction_model`
feat: add outscaling option 2023-01-16 20:52:56 +00:00			`self.denoise = denoise`
fix(api): get ESRGAN/GFPGAN paths from server context, clean up test scripts 2023-01-16 19:02:15 +00:00			`self.faces = faces`
fix: send missing model params, add face strength control 2023-01-17 04:54:01 +00:00			`self.face_strength = face_strength`
fix(api): pass hardware platform to upscaling pipeline (#77) 2023-01-22 22:35:53 +00:00			`self.format = format`
feat: add outscaling option 2023-01-16 20:52:56 +00:00			`self.half = half`
fix(api): pass hardware platform to upscaling pipeline (#77) 2023-01-22 22:35:53 +00:00			`self.outscale = outscale`
feat(api): start implementing chain pipelines 2023-01-27 23:08:36 +00:00			`self.pre_pad = pre_pad`
fix(api): pass hardware platform to upscaling pipeline (#77) 2023-01-22 22:35:53 +00:00			`self.scale = scale`
feat(api): start implementing chain pipelines 2023-01-27 23:08:36 +00:00			`self.tile_pad = tile_pad`
fix(api): get ESRGAN/GFPGAN paths from server context, clean up test scripts 2023-01-16 19:02:15 +00:00
fix(api): report accurate sizes 2023-01-16 21:11:40 +00:00			`def resize(self, size: Size) -> Size:`
fix(api): report accurate image size when upscaling 2023-01-20 01:42:27 +00:00			`return Size(size.width * self.outscale, size.height * self.outscale)`
fix(api): report accurate sizes 2023-01-16 21:11:40 +00:00
fix(api): get ESRGAN/GFPGAN paths from server context, clean up test scripts 2023-01-16 19:02:15 +00:00
feat(api): start implementing chain pipelines 2023-01-27 23:08:36 +00:00			`def load_resrgan(ctx: ServerContext, params: UpscaleParams, tile=0):`
			`'''`
			`TODO: cache this instance`
			`'''`
fix(api): pass hardware platform to upscaling pipeline (#77) 2023-01-22 22:35:53 +00:00			`model_file = '%s.%s' % (params.upscale_model, params.format)`
fix(api): pass model to ONNX instances 2023-01-16 20:58:27 +00:00			`model_path = path.join(ctx.model_path, model_file)`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00			`if not path.isfile(model_path):`
feat: add outscaling option 2023-01-16 20:52:56 +00:00			`raise Exception('Real ESRGAN model not found at %s' % model_path)`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00
fix(api): get ESRGAN/GFPGAN paths from server context, clean up test scripts 2023-01-16 19:02:15 +00:00			`# use ONNX acceleration, if available`
fix(api): pass hardware platform to upscaling pipeline (#77) 2023-01-22 22:35:53 +00:00			`if params.format == 'onnx':`
			`model = ONNXNet(ctx, model_file, provider=params.provider)`
			`elif params.format == 'pth':`
fix(api): get ESRGAN/GFPGAN paths from server context, clean up test scripts 2023-01-16 19:02:15 +00:00			`model = RRDBNet(num_in_ch=3, num_out_ch=3, num_feat=64,`
			`num_block=23, num_grow_ch=32, scale=params.scale)`
fix(api): pass hardware platform to upscaling pipeline (#77) 2023-01-22 22:35:53 +00:00			`raise Exception('unknown platform %s' % params.format)`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00
			`dni_weight = None`
feat: add outscaling option 2023-01-16 20:52:56 +00:00			`if params.upscale_model == 'realesr-general-x4v3' and params.denoise != 1:`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00			`wdn_model_path = model_path.replace(`
			`'realesr-general-x4v3', 'realesr-general-wdn-x4v3')`
			`model_path = [model_path, wdn_model_path]`
fix(api): get ESRGAN/GFPGAN paths from server context, clean up test scripts 2023-01-16 19:02:15 +00:00			`dni_weight = [params.denoise, 1 - params.denoise]`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00
fix(api): report accurate sizes 2023-01-16 21:11:40 +00:00			`# TODO: shouldn't need the PTH file`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00			`upsampler = RealESRGANer(`
fix(api): get ESRGAN/GFPGAN paths from server context, clean up test scripts 2023-01-16 19:02:15 +00:00			`scale=params.scale,`
fix(api): report accurate sizes 2023-01-16 21:11:40 +00:00			`model_path=path.join(ctx.model_path, '%s.pth' % params.upscale_model),`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00			`dni_weight=dni_weight,`
			`model=model,`
			`tile=tile,`
feat(api): start implementing chain pipelines 2023-01-27 23:08:36 +00:00			`tile_pad=params.tile_pad,`
			`pre_pad=params.pre_pad,`
feat: add outscaling option 2023-01-16 20:52:56 +00:00			`half=params.half)`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00
fix(api): load upscaling model from models dir 2023-01-16 00:41:58 +00:00			`return upsampler`


feat(api): start implementing chain pipelines 2023-01-27 23:08:36 +00:00			`def load_stable_diffusion(ctx: ServerContext, upscale: UpscaleParams):`
			`'''`
			`TODO: cache this instance`
			`'''`
			`if upscale.format == 'onnx':`
			`model_path = path.join(ctx.model_path, upscale.upscale_model)`
			`# ValueError: Pipeline <class 'onnx_web.onnx.pipeline_onnx_stable_diffusion_upscale.OnnxStableDiffusionUpscalePipeline'>`
			`# expected {'vae', 'unet', 'text_encoder', 'tokenizer', 'scheduler', 'low_res_scheduler'},`
			`# but only {'scheduler', 'tokenizer', 'text_encoder', 'unet'} were passed.`
			`pipeline = OnnxStableDiffusionUpscalePipeline.from_pretrained(`
			`model_path,`
			`vae=AutoencoderKL.from_pretrained(`
			`model_path, subfolder='vae_encoder'),`
			`low_res_scheduler=DDPMScheduler.from_pretrained(`
			`model_path, subfolder='scheduler'),`
			`)`
			`else:`
			`pipeline = StableDiffusionUpscalePipeline.from_pretrained(`
			`'stabilityai/stable-diffusion-x4-upscaler')`

			`return pipeline`


			`def upscale_resrgan(`
			`ctx: ServerContext,`
			`stage: StageParams,`
			`params: ImageParams,`
			`source_image: Image.Image,`
			`*,`
			`upscale: UpscaleParams,`
			`) -> Image:`
			`print('upscaling image with Real ESRGAN', upscale.scale)`
fix(api): get upscale params from request 2023-01-16 19:12:08 +00:00
fix(api): skip upscaling if scale is 1 2023-01-17 05:01:15 +00:00			`output = np.array(source_image)`
feat(api): start implementing chain pipelines 2023-01-27 23:08:36 +00:00			`upsampler = load_resrgan(ctx, upscale, tile=stage.tile_size)`
fix(api): load upscaling model from models dir 2023-01-16 00:41:58 +00:00
feat(api): start implementing chain pipelines 2023-01-27 23:08:36 +00:00			`output, _ = upsampler.enhance(output, outscale=upscale.outscale)`
fix(api): convert back to PIL after upscaling 2023-01-16 00:25:12 +00:00
lint(api): improve logging while upscaling 2023-01-18 04:30:25 +00:00			`output = Image.fromarray(output, 'RGB')`
			`print('final output image size', output.size)`
			`return output`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00

feat(api): start implementing chain pipelines 2023-01-27 23:08:36 +00:00			`def upscale_gfpgan(`
			`ctx: ServerContext,`
			`stage: StageParams,`
			`params: ImageParams,`
			`image: Image.Image,`
			`*,`
			`upscale: UpscaleParams,`
			`upsampler: Optional[RealESRGANer] = None,`
			`) -> Image:`
			`if upscale.correction_model is None:`
feat: add outscaling option 2023-01-16 20:52:56 +00:00			`print('no face model given, skipping')`
			`return image`
fix(api): get upscale params from request 2023-01-16 19:12:08 +00:00
feat(api): start implementing chain pipelines 2023-01-27 23:08:36 +00:00			`print('correcting faces with GFPGAN model: %s' % upscale.correction_model)`

fix(api): get ESRGAN/GFPGAN paths from server context, clean up test scripts 2023-01-16 19:02:15 +00:00			`if upsampler is None:`
feat(api): start implementing chain pipelines 2023-01-27 23:08:36 +00:00			`upsampler = load_resrgan(ctx, upscale)`
fix(api): get ESRGAN/GFPGAN paths from server context, clean up test scripts 2023-01-16 19:02:15 +00:00
feat(api): start implementing chain pipelines 2023-01-27 23:08:36 +00:00			`face_path = path.join(ctx.model_path, '%s.pth' %`
			`(upscale.correction_model))`
fix(api): resolve face correction model relative to model path 2023-01-16 22:45:17 +00:00
feat(api): add support for Stable Diffusion models to conversion script 2023-01-16 23:48:50 +00:00			`# TODO: doesn't have a model param, not sure how to pass ONNX model`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00			`face_enhancer = GFPGANer(`
fix(api): resolve face correction model relative to model path 2023-01-16 22:45:17 +00:00			`model_path=face_path,`
feat(api): start implementing chain pipelines 2023-01-27 23:08:36 +00:00			`upscale=upscale.outscale,`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00			`arch='clean',`
			`channel_multiplier=2,`
			`bg_upsampler=upsampler)`

fix(api): load upscaling model from models dir 2023-01-16 00:41:58 +00:00			`_, _, output = face_enhancer.enhance(`
feat(api): start implementing chain pipelines 2023-01-27 23:08:36 +00:00			`image, has_aligned=False, only_center_face=False, paste_back=True, weight=upscale.face_strength)`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00
			`return output`
lint(api): consolidate upscale/correction logic 2023-01-26 02:31:39 +00:00

feat(api): start implementing chain pipelines 2023-01-27 23:08:36 +00:00			`def upscale_stable_diffusion(`
			`ctx: ServerContext,`
			`stage: StageParams,`
			`params: ImageParams,`
			`source: Image.Image,`
			`*,`
			`upscale: UpscaleParams,`
			`) -> Image:`
feat(api): initial support for Stable Diffusion upscaling (#66) 2023-01-26 03:04:00 +00:00			`print('upscaling with Stable Diffusion')`

feat(api): start implementing chain pipelines 2023-01-27 23:08:36 +00:00			`pipeline = load_stable_diffusion(ctx, upscale)`
			`generator = torch.manual_seed(params.seed)`
			`seed = generator.initial_seed()`
feat(api): initial support for Stable Diffusion upscaling (#66) 2023-01-26 03:04:00 +00:00
feat(api): start implementing chain pipelines 2023-01-27 23:08:36 +00:00			`def upscale_stage(_ctx: ServerContext, stage: StageParams, params: ImageParams, image: Image.Image) -> Image:`
			`return pipeline(`
			`params.prompt,`
fix parameter order for chain pipeline 2023-01-27 23:26:48 +00:00			`image,`
feat(api): start implementing chain pipelines 2023-01-27 23:08:36 +00:00			`generator=torch.manual_seed(seed),`
			`num_inference_steps=params.steps,`
			`).images[0]`

			`chain = ChainPipeline(stages=[`
			`(upscale_stage, stage)`
			`])`
			`return chain(ctx, params, source)`


			`def run_upscale_correction(`
			`ctx: ServerContext,`
			`stage: StageParams,`
			`params: ImageParams,`
			`image: Image.Image,`
			`*,`
			`upscale: UpscaleParams,`
			`) -> Image.Image:`
lint(api): consolidate upscale/correction logic 2023-01-26 02:31:39 +00:00			`print('running upscale pipeline')`

feat(api): start implementing chain pipelines 2023-01-27 23:08:36 +00:00			`if upscale.scale > 1:`
			`if 'esrgan' in upscale.upscale_model:`
			`stage = StageParams(tile_size=stage.tile_size,`
			`outscale=upscale.outscale)`
			`image = upscale_resrgan(ctx, stage, params, image, upscale=upscale)`
			`elif 'stable-diffusion' in upscale.upscale_model:`
fix parameter order for chain pipeline 2023-01-27 23:26:48 +00:00			`mini_tile = min(128, stage.tile_size)`
feat(api): start implementing chain pipelines 2023-01-27 23:08:36 +00:00			`stage = StageParams(tile_size=mini_tile, outscale=upscale.outscale)`
			`image = upscale_stable_diffusion(`
			`ctx, stage, params, image, upscale=upscale)`

			`if upscale.faces:`
			`stage = StageParams(tile_size=stage.tile_size,`
			`outscale=upscale.outscale)`
			`image = upscale_gfpgan(ctx, stage, params, image, upscale=upscale)`
lint(api): consolidate upscale/correction logic 2023-01-26 02:31:39 +00:00
feat(api): initial support for Stable Diffusion upscaling (#66) 2023-01-26 03:04:00 +00:00			`return image`