# onnx-web/api/onnx_web/upscale.py

from basicsr.archs.rrdbnet_arch import RRDBNet
from gfpgan import GFPGANer
from onnxruntime import InferenceSession
from os import path
from PIL import Image
from realesrgan import RealESRGANer
from typing import Any, Literal, Union

import numpy as np
import torch

from .utils import (
    ServerContext,
    Size,
)

# TODO: these should all be params or config
# Padding settings handed to RealESRGANer by make_resrgan as its `pre_pad`
# and `tile_pad` arguments.
pre_pad = 0
tile_pad = 10


class ONNXImage():
    '''
    Wraps a numpy array and answers the small set of tensor-style calls
    (squeeze, float, cpu, clamp_, numpy, size, indexing) with numpy operations.

    Every chainable method returns the wrapper itself, so a chain of calls keeps
    operating on the same object.
    '''

    def __init__(self, source) -> None:
        # `data` points back at the wrapper so that `image.data.<method>()`
        # resolves to the methods defined on this class.
        self.data = self
        self.source = source

    def __getitem__(self, *args):
        '''
        Index the wrapped array and return the selection as a float32 torch tensor.
        '''
        selected = self.source.__getitem__(*args)
        tensor = torch.from_numpy(selected)
        return tensor.to(torch.float32)

    def squeeze(self):
        '''
        Drop the leading axis (axis 0 only) of the wrapped array.
        '''
        self.source = np.squeeze(self.source, axis=0)
        return self

    def float(self):
        # no conversion happens here; the method exists so call chains keep working
        return self

    def cpu(self):
        # nothing to move; the method exists so call chains keep working
        return self

    def clamp_(self, min, max):
        '''
        Clip the wrapped array to the range [min, max] and keep the result.
        '''
        clipped = np.clip(self.source, min, max)
        self.source = clipped
        return self

    def numpy(self):
        '''
        Return the wrapped numpy array.
        '''
        return self.source

    def size(self):
        '''
        Return the shape of the wrapped array as reported by numpy.
        '''
        return np.shape(self.source)


class ONNXNet():
    '''
    Provides the RRDBNet interface using an ONNX session for DirectML acceleration.

    Only `__call__` does real work. The remaining methods mirror the torch
    module calls of the same name and do nothing beyond keeping call chains
    working.
    '''

    def __init__(self, ctx: 'ServerContext', model: str, provider='DmlExecutionProvider') -> None:
        '''
        Open an ONNX Runtime session for `model`, resolved against `ctx.model_path`,
        using the single execution provider named by `provider`.

        TODO: get platform provider from request params
        '''
        model_path = path.join(ctx.model_path, model)
        self.session = InferenceSession(
            model_path, providers=[provider])

    def __call__(self, image: Any) -> Any:
        '''
        Run the session on `image` and return its first output wrapped in an ONNXImage.

        `image` must support `.cpu().numpy()`; the resulting array is fed to the
        first input declared by the session.
        '''
        input_name = self.session.get_inputs()[0].name
        output_name = self.session.get_outputs()[0].name
        output = self.session.run([output_name], {
            input_name: image.cpu().numpy()
        })[0]
        return ONNXImage(output)

    def eval(self):
        # torch modules return themselves from eval(); do the same so that
        # `model.eval().to(device)` style chains do not break on None
        return self

    def half(self):
        # precision is fixed by the ONNX model, nothing to convert
        return self

    def load_state_dict(self, _net=None, _strict=True, **_kwargs) -> None:
        '''
        Ignore the given weights; the ONNX session already contains them.

        torch.nn.Module.load_state_dict names its flag `strict`, so callers
        written against a torch module may pass `strict=` (or other options) by
        keyword. Extra keywords are accepted and discarded instead of raising a
        TypeError.
        '''
        pass

    def to(self, _device):
        # device placement is decided by the session provider
        return self


class UpscaleParams():
    '''
    Plain holder for the settings read by the upscaling and face correction
    functions in this module. The constructor stores every argument unchanged
    on an attribute of the same name.
    '''

    def __init__(
        self,
        upscale_model: str,
        provider: str,
        correction_model: Union[str, None] = None,
        denoise: float = 0.5,
        faces=True,
        face_strength: float = 0.5,
        format: Literal['onnx', 'pth'] = 'onnx',
        half=False,
        outscale: int = 1,
        scale: int = 4,
    ) -> None:
        # which models to load, in which file format, on which provider
        self.upscale_model = upscale_model
        self.correction_model = correction_model
        self.format = format
        self.provider = provider

        # upscaling settings
        self.scale = scale
        self.outscale = outscale
        self.denoise = denoise
        self.half = half

        # face correction settings
        self.faces = faces
        self.face_strength = face_strength

    def resize(self, size: Size) -> Size:
        '''
        Return a new Size with the width and height of `size` multiplied by `outscale`.
        '''
        factor = self.outscale
        scaled_width = size.width * factor
        scaled_height = size.height * factor
        return Size(scaled_width, scaled_height)


def make_resrgan(ctx: ServerContext, params: UpscaleParams, tile=0):
    '''
    Build a RealESRGANer backed by either an ONNX session or a torch RRDBNet.

    ctx: provides `model_path`, the directory that model files are resolved against
    params: supplies the model name, file format, provider, scale, denoise and half settings
    tile: passed through to RealESRGANer as its `tile` argument

    Raises an Exception when the `<upscale_model>.<format>` file does not exist
    or when the format is neither 'onnx' nor 'pth'.
    '''
    model_file = '%s.%s' % (params.upscale_model, params.format)
    model_path = path.join(ctx.model_path, model_file)
    if not path.isfile(model_path):
        raise Exception('Real ESRGAN model not found at %s' % model_path)

    # use ONNX acceleration, if available
    if params.format == 'onnx':
        model = ONNXNet(ctx, model_file, provider=params.provider)
    elif params.format == 'pth':
        model = RRDBNet(num_in_ch=3, num_out_ch=3, num_feat=64,
                        num_block=23, num_grow_ch=32, scale=params.scale)
    else:
        raise Exception('unknown platform %s' % params.format)

    # Blend weights for the 'realesr-general-x4v3' model. Only the weights are
    # computed: the companion 'realesr-general-wdn-x4v3' weights path is not
    # passed on, because RealESRGANer always receives the single .pth path below.
    # NOTE(review): RealESRGANer presumably blends weights only when it is given
    # a list of model paths, so `denoise` likely has no effect yet - confirm
    # against Real-ESRGAN before wiring the second path in.
    dni_weight = None
    if params.upscale_model == 'realesr-general-x4v3' and params.denoise != 1:
        dni_weight = [params.denoise, 1 - params.denoise]

    # TODO: shouldn't need the PTH file
    pth_path = path.join(ctx.model_path, '%s.pth' % params.upscale_model)

    return RealESRGANer(
        scale=params.scale,
        model_path=pth_path,
        dni_weight=dni_weight,
        model=model,
        tile=tile,
        tile_pad=tile_pad,
        pre_pad=pre_pad,
        half=params.half)


def upscale_resrgan(ctx: ServerContext, params: UpscaleParams, source_image: Image.Image) -> Image.Image:
    '''
    Upscale `source_image` with Real ESRGAN, then optionally correct faces.

    ctx: server context used to locate the model files
    params: upscaling settings; `scale > 1` enables the upscaling stage and
        `faces` enables the face correction stage
    source_image: PIL image to process

    Returns a new PIL image built from the processed pixel array.
    '''
    print('upscaling image with Real ESRGAN', params.scale)

    output = np.array(source_image)

    # The upsampler is only used by the two optional stages below, so do not
    # load the model (or fail on a missing model file) when neither will run.
    upsampler = None
    if params.scale > 1 or params.faces:
        upsampler = make_resrgan(ctx, params, tile=512)

    if params.scale > 1:
        output, _ = upsampler.enhance(output, outscale=params.outscale)

    if params.faces:
        output = upscale_gfpgan(ctx, params, output, upsampler=upsampler)

    # NOTE(review): assumes the array is 3-channel RGB at this point - confirm
    # for source images that carry an alpha channel
    output = Image.fromarray(output, 'RGB')
    print('final output image size', output.size)
    return output


def upscale_gfpgan(ctx: ServerContext, params: UpscaleParams, image, upsampler=None) -> Image:
    '''
    Run GFPGAN face correction on `image`.

    The weights are read from `<correction_model>.pth` under `ctx.model_path`.
    `upsampler` is handed to GFPGANer as its `bg_upsampler`; when it is None, one
    is built with make_resrgan using the same params.

    Returns `image` unchanged when `params.correction_model` is None, otherwise
    the third value returned by GFPGANer.enhance.
    '''
    correction_model = params.correction_model
    print('correcting faces with GFPGAN model: %s' % correction_model)

    if correction_model is None:
        print('no face model given, skipping')
        return image

    background_upsampler = upsampler if upsampler is not None else make_resrgan(ctx, params)

    weights_file = '%s.pth' % (correction_model)
    weights_path = path.join(ctx.model_path, weights_file)

    # TODO: doesn't have a model param, not sure how to pass ONNX model
    restorer = GFPGANer(
        model_path=weights_path,
        upscale=params.outscale,
        arch='clean',
        channel_multiplier=2,
        bg_upsampler=background_upsampler)

    # only the last of the three returned values is used
    _first, _second, corrected = restorer.enhance(
        image,
        has_aligned=False,
        only_center_face=False,
        paste_back=True,
        weight=params.face_strength)

    return corrected
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00			`from basicsr.archs.rrdbnet_arch import RRDBNet`
			`from gfpgan import GFPGANer`
feat(api): add ONNX implementation of Real ESRGAN net 2023-01-16 16:55:40 +00:00			`from onnxruntime import InferenceSession`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00			`from os import path`
			`from PIL import Image`
			`from realesrgan import RealESRGANer`
fix(api): pass hardware platform to upscaling pipeline (#77) 2023-01-22 22:35:53 +00:00			`from typing import Any, Literal, Union`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00
fix(api): convert image to numpy before upscaling 2023-01-16 00:13:28 +00:00			`import numpy as np`
feat(api): add ONNX implementation of Real ESRGAN net 2023-01-16 16:55:40 +00:00			`import torch`
fix(api): convert image to numpy before upscaling 2023-01-16 00:13:28 +00:00
fix(api): get ESRGAN/GFPGAN paths from server context, clean up test scripts 2023-01-16 19:02:15 +00:00			`from .utils import (`
fix(api): report accurate sizes 2023-01-16 21:11:40 +00:00			`ServerContext,`
			`Size,`
fix(api): get ESRGAN/GFPGAN paths from server context, clean up test scripts 2023-01-16 19:02:15 +00:00			`)`

			`# TODO: these should all be params or config`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00			`pre_pad = 0`
			`tile_pad = 10`

feat(api): add ONNX implementation of Real ESRGAN net 2023-01-16 16:55:40 +00:00
wrap image output 2023-01-16 17:06:50 +00:00			`class ONNXImage():`
stub out other methods for output image 2023-01-16 17:16:06 +00:00			`def __init__(self, source) -> None:`
			`self.source = source`
			`self.data = self`

add subscript for fake image 2023-01-16 18:02:37 +00:00			`def __getitem__(self, *args):`
			`return torch.from_numpy(self.source.__getitem__(*args)).to(torch.float32)`

stub out other methods for output image 2023-01-16 17:16:06 +00:00			`def squeeze(self):`
			`self.source = np.squeeze(self.source, (0))`
			`return self`

			`def float(self):`
			`return self`

			`def cpu(self):`
			`return self`

fix(api): correct stub method name 2023-01-16 17:45:31 +00:00			`def clamp_(self, min, max):`
stub out other methods for output image 2023-01-16 17:16:06 +00:00			`self.source = np.clip(self.source, min, max)`
return fake image throughout chain 2023-01-16 17:46:06 +00:00			`return self`
stub out other methods for output image 2023-01-16 17:16:06 +00:00
			`def numpy(self):`
			`return self.source`
wrap image output 2023-01-16 17:06:50 +00:00
feat: add outscaling option 2023-01-16 20:52:56 +00:00			`def size(self):`
			`return np.shape(self.source)`

feat(api): add ONNX implementation of Real ESRGAN net 2023-01-16 16:55:40 +00:00
			`class ONNXNet():`
			`'''`
fix(api): report accurate sizes 2023-01-16 21:11:40 +00:00			`Provides the RRDBNet interface using an ONNX session for DirectML acceleration.`
feat(api): add ONNX implementation of Real ESRGAN net 2023-01-16 16:55:40 +00:00			`'''`

fix(api): pass model to ONNX instances 2023-01-16 20:58:27 +00:00			`def __init__(self, ctx: ServerContext, model: str, provider='DmlExecutionProvider') -> None:`
fix(api): get ESRGAN/GFPGAN paths from server context, clean up test scripts 2023-01-16 19:02:15 +00:00			`'''`
			`TODO: get platform provider from request params`
			`'''`
fix(api): pass model to ONNX instances 2023-01-16 20:58:27 +00:00			`model_path = path.join(ctx.model_path, model)`
feat(api): add ONNX implementation of Real ESRGAN net 2023-01-16 16:55:40 +00:00			`self.session = InferenceSession(`
fix(api): pass model to ONNX instances 2023-01-16 20:58:27 +00:00			`model_path, providers=[provider])`
feat(api): add ONNX implementation of Real ESRGAN net 2023-01-16 16:55:40 +00:00
			`def __call__(self, image: Any) -> Any:`
			`input_name = self.session.get_inputs()[0].name`
			`output_name = self.session.get_outputs()[0].name`
			`output = self.session.run([output_name], {`
			`input_name: image.cpu().numpy()`
			`})[0]`
wrap image output 2023-01-16 17:06:50 +00:00			`return ONNXImage(output)`
feat(api): add ONNX implementation of Real ESRGAN net 2023-01-16 16:55:40 +00:00
			`def eval(self) -> None:`
			`pass`

			`def half(self):`
			`return self`

lint(api): mark some unused vars 2023-01-22 16:08:26 +00:00			`def load_state_dict(self, _net, _strict=True) -> None:`
feat(api): add ONNX implementation of Real ESRGAN net 2023-01-16 16:55:40 +00:00			`pass`

lint(api): mark some unused vars 2023-01-22 16:08:26 +00:00			`def to(self, _device):`
feat(api): add ONNX implementation of Real ESRGAN net 2023-01-16 16:55:40 +00:00			`return self`
feat(api): add conversion script for models 2023-01-16 15:57:59 +00:00
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00
fix(api): get ESRGAN/GFPGAN paths from server context, clean up test scripts 2023-01-16 19:02:15 +00:00			`class UpscaleParams():`
feat: add outscaling option 2023-01-16 20:52:56 +00:00			`def __init__(`
			`self,`
			`upscale_model: str,`
fix(api): pass hardware platform to upscaling pipeline (#77) 2023-01-22 22:35:53 +00:00			`provider: str,`
feat(api): return all types of models 2023-01-17 02:10:52 +00:00			`correction_model: Union[str, None] = None,`
feat: add outscaling option 2023-01-16 20:52:56 +00:00			`denoise: float = 0.5,`
			`faces=True,`
fix: send missing model params, add face strength control 2023-01-17 04:54:01 +00:00			`face_strength: float = 0.5,`
fix(api): pass hardware platform to upscaling pipeline (#77) 2023-01-22 22:35:53 +00:00			`format: Literal['onnx', 'pth'] = 'onnx',`
			`half=False,`
			`outscale: int = 1,`
			`scale: int = 4,`
feat: add outscaling option 2023-01-16 20:52:56 +00:00			`) -> None:`
			`self.upscale_model = upscale_model`
fix(api): pass hardware platform to upscaling pipeline (#77) 2023-01-22 22:35:53 +00:00			`self.provider = provider`
feat(api): return all types of models 2023-01-17 02:10:52 +00:00			`self.correction_model = correction_model`
feat: add outscaling option 2023-01-16 20:52:56 +00:00			`self.denoise = denoise`
fix(api): get ESRGAN/GFPGAN paths from server context, clean up test scripts 2023-01-16 19:02:15 +00:00			`self.faces = faces`
fix: send missing model params, add face strength control 2023-01-17 04:54:01 +00:00			`self.face_strength = face_strength`
fix(api): pass hardware platform to upscaling pipeline (#77) 2023-01-22 22:35:53 +00:00			`self.format = format`
feat: add outscaling option 2023-01-16 20:52:56 +00:00			`self.half = half`
fix(api): pass hardware platform to upscaling pipeline (#77) 2023-01-22 22:35:53 +00:00			`self.outscale = outscale`
			`self.scale = scale`
fix(api): get ESRGAN/GFPGAN paths from server context, clean up test scripts 2023-01-16 19:02:15 +00:00
fix(api): report accurate sizes 2023-01-16 21:11:40 +00:00			`def resize(self, size: Size) -> Size:`
fix(api): report accurate image size when upscaling 2023-01-20 01:42:27 +00:00			`return Size(size.width * self.outscale, size.height * self.outscale)`
fix(api): report accurate sizes 2023-01-16 21:11:40 +00:00
fix(api): get ESRGAN/GFPGAN paths from server context, clean up test scripts 2023-01-16 19:02:15 +00:00
			`def make_resrgan(ctx: ServerContext, params: UpscaleParams, tile=0):`
fix(api): pass hardware platform to upscaling pipeline (#77) 2023-01-22 22:35:53 +00:00			`model_file = '%s.%s' % (params.upscale_model, params.format)`
fix(api): pass model to ONNX instances 2023-01-16 20:58:27 +00:00			`model_path = path.join(ctx.model_path, model_file)`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00			`if not path.isfile(model_path):`
feat: add outscaling option 2023-01-16 20:52:56 +00:00			`raise Exception('Real ESRGAN model not found at %s' % model_path)`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00
fix(api): get ESRGAN/GFPGAN paths from server context, clean up test scripts 2023-01-16 19:02:15 +00:00			`# use ONNX acceleration, if available`
fix(api): pass hardware platform to upscaling pipeline (#77) 2023-01-22 22:35:53 +00:00			`if params.format == 'onnx':`
			`model = ONNXNet(ctx, model_file, provider=params.provider)`
			`elif params.format == 'pth':`
fix(api): get ESRGAN/GFPGAN paths from server context, clean up test scripts 2023-01-16 19:02:15 +00:00			`model = RRDBNet(num_in_ch=3, num_out_ch=3, num_feat=64,`
			`num_block=23, num_grow_ch=32, scale=params.scale)`
feat: add outscaling option 2023-01-16 20:52:56 +00:00			`else:`
fix(api): pass hardware platform to upscaling pipeline (#77) 2023-01-22 22:35:53 +00:00			`raise Exception('unknown platform %s' % params.format)`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00
			`dni_weight = None`
feat: add outscaling option 2023-01-16 20:52:56 +00:00			`if params.upscale_model == 'realesr-general-x4v3' and params.denoise != 1:`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00			`wdn_model_path = model_path.replace(`
			`'realesr-general-x4v3', 'realesr-general-wdn-x4v3')`
			`model_path = [model_path, wdn_model_path]`
fix(api): get ESRGAN/GFPGAN paths from server context, clean up test scripts 2023-01-16 19:02:15 +00:00			`dni_weight = [params.denoise, 1 - params.denoise]`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00
fix(api): report accurate sizes 2023-01-16 21:11:40 +00:00			`# TODO: shouldn't need the PTH file`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00			`upsampler = RealESRGANer(`
fix(api): get ESRGAN/GFPGAN paths from server context, clean up test scripts 2023-01-16 19:02:15 +00:00			`scale=params.scale,`
fix(api): report accurate sizes 2023-01-16 21:11:40 +00:00			`model_path=path.join(ctx.model_path, '%s.pth' % params.upscale_model),`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00			`dni_weight=dni_weight,`
			`model=model,`
			`tile=tile,`
			`tile_pad=tile_pad,`
			`pre_pad=pre_pad,`
feat: add outscaling option 2023-01-16 20:52:56 +00:00			`half=params.half)`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00
fix(api): load upscaling model from models dir 2023-01-16 00:41:58 +00:00			`return upsampler`


fix(api): pass upscale params when creating RESRGAN 2023-01-16 20:17:50 +00:00			`def upscale_resrgan(ctx: ServerContext, params: UpscaleParams, source_image: Image) -> Image:`
lint(api): improve logging while upscaling 2023-01-18 04:30:25 +00:00			`print('upscaling image with Real ESRGAN', params.scale)`
fix(api): get upscale params from request 2023-01-16 19:12:08 +00:00
fix(api): skip upscaling if scale is 1 2023-01-17 05:01:15 +00:00			`output = np.array(source_image)`
mostly fix face correction 2023-01-17 04:35:34 +00:00			`upsampler = make_resrgan(ctx, params, tile=512)`
fix(api): load upscaling model from models dir 2023-01-16 00:41:58 +00:00
fix(api): skip upscaling if scale is 1 2023-01-17 05:01:15 +00:00			`if params.scale > 1:`
			`output, _ = upsampler.enhance(output, outscale=params.outscale)`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00
fix(api): get ESRGAN/GFPGAN paths from server context, clean up test scripts 2023-01-16 19:02:15 +00:00			`if params.faces:`
mostly fix face correction 2023-01-17 04:35:34 +00:00			`output = upscale_gfpgan(ctx, params, output, upsampler=upsampler)`
fix(api): convert back to PIL after upscaling 2023-01-16 00:25:12 +00:00
lint(api): improve logging while upscaling 2023-01-18 04:30:25 +00:00			`output = Image.fromarray(output, 'RGB')`
			`print('final output image size', output.size)`
			`return output`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00

fix(api): pass upscale params when creating RESRGAN 2023-01-16 20:17:50 +00:00			`def upscale_gfpgan(ctx: ServerContext, params: UpscaleParams, image, upsampler=None) -> Image:`
feat(api): return all types of models 2023-01-17 02:10:52 +00:00			`print('correcting faces with GFPGAN model: %s' % params.correction_model)`
feat: add outscaling option 2023-01-16 20:52:56 +00:00
feat(api): return all types of models 2023-01-17 02:10:52 +00:00			`if params.correction_model is None:`
feat: add outscaling option 2023-01-16 20:52:56 +00:00			`print('no face model given, skipping')`
			`return image`
fix(api): get upscale params from request 2023-01-16 19:12:08 +00:00
fix(api): get ESRGAN/GFPGAN paths from server context, clean up test scripts 2023-01-16 19:02:15 +00:00			`if upsampler is None:`
mostly fix face correction 2023-01-17 04:35:34 +00:00			`upsampler = make_resrgan(ctx, params)`
fix(api): get ESRGAN/GFPGAN paths from server context, clean up test scripts 2023-01-16 19:02:15 +00:00
feat(api): return all types of models 2023-01-17 02:10:52 +00:00			`face_path = path.join(ctx.model_path, '%s.pth' % (params.correction_model))`
fix(api): resolve face correction model relative to model path 2023-01-16 22:45:17 +00:00
feat(api): add support for Stable Diffusion models to conversion script 2023-01-16 23:48:50 +00:00			`# TODO: doesn't have a model param, not sure how to pass ONNX model`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00			`face_enhancer = GFPGANer(`
fix(api): resolve face correction model relative to model path 2023-01-16 22:45:17 +00:00			`model_path=face_path,`
feat: add outscaling option 2023-01-16 20:52:56 +00:00			`upscale=params.outscale,`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00			`arch='clean',`
			`channel_multiplier=2,`
			`bg_upsampler=upsampler)`

fix(api): load upscaling model from models dir 2023-01-16 00:41:58 +00:00			`_, _, output = face_enhancer.enhance(`
fix: send missing model params, add face strength control 2023-01-17 04:54:01 +00:00			`image, has_aligned=False, only_center_face=False, paste_back=True, weight=params.face_strength)`
feat(api): add basic upscaling 2023-01-16 00:04:10 +00:00
			`return output`