1
0
Fork 0
onnx-web/api/onnx_web/upscale.py

181 lines
5.0 KiB
Python
Raw Normal View History

2023-01-16 00:04:10 +00:00
from basicsr.archs.rrdbnet_arch import RRDBNet
from gfpgan import GFPGANer
from onnxruntime import InferenceSession
2023-01-16 00:04:10 +00:00
from os import path
from PIL import Image
from realesrgan import RealESRGANer
2023-01-16 20:52:56 +00:00
from typing import Any, Union
2023-01-16 00:04:10 +00:00
import numpy as np
import torch
from .utils import (
2023-01-16 21:11:40 +00:00
ServerContext,
Size,
)
# TODO: these should all be params or config
2023-01-16 00:04:10 +00:00
pre_pad = 0
tile_pad = 10
2023-01-16 17:06:50 +00:00
class ONNXImage():
def __init__(self, source) -> None:
self.source = source
self.data = self
2023-01-16 18:02:37 +00:00
def __getitem__(self, *args):
return torch.from_numpy(self.source.__getitem__(*args)).to(torch.float32)
def squeeze(self):
self.source = np.squeeze(self.source, (0))
return self
def float(self):
return self
def cpu(self):
return self
2023-01-16 17:45:31 +00:00
def clamp_(self, min, max):
self.source = np.clip(self.source, min, max)
2023-01-16 17:46:06 +00:00
return self
def numpy(self):
return self.source
2023-01-16 17:06:50 +00:00
2023-01-16 20:52:56 +00:00
def size(self):
return np.shape(self.source)
class ONNXNet():
'''
2023-01-16 21:11:40 +00:00
Provides the RRDBNet interface using an ONNX session for DirectML acceleration.
'''
2023-01-16 20:58:27 +00:00
def __init__(self, ctx: ServerContext, model: str, provider='DmlExecutionProvider') -> None:
'''
TODO: get platform provider from request params
'''
2023-01-16 20:58:27 +00:00
model_path = path.join(ctx.model_path, model)
self.session = InferenceSession(
2023-01-16 20:58:27 +00:00
model_path, providers=[provider])
def __call__(self, image: Any) -> Any:
input_name = self.session.get_inputs()[0].name
output_name = self.session.get_outputs()[0].name
output = self.session.run([output_name], {
input_name: image.cpu().numpy()
})[0]
2023-01-16 17:06:50 +00:00
return ONNXImage(output)
def eval(self) -> None:
pass
def half(self):
return self
def load_state_dict(self, net, strict=True) -> None:
pass
def to(self, device):
return self
2023-01-16 00:04:10 +00:00
class UpscaleParams():
2023-01-16 20:52:56 +00:00
def __init__(
self,
upscale_model: str,
scale: int = 4,
outscale: int = 1,
denoise: float = 0.5,
faces=True,
face_model: Union[str, None] = None,
platform: str = 'onnx',
half=False
) -> None:
self.upscale_model = upscale_model
self.scale = scale
2023-01-16 20:52:56 +00:00
self.outscale = outscale
self.denoise = denoise
self.faces = faces
2023-01-16 20:52:56 +00:00
self.face_model = face_model
self.platform = platform
2023-01-16 20:52:56 +00:00
self.half = half
2023-01-16 21:11:40 +00:00
def resize(self, size: Size) -> Size:
return Size(size.width * self.scale * self.outscale, size.height * self.scale * self.outscale)
def make_resrgan(ctx: ServerContext, params: UpscaleParams, tile=0):
2023-01-16 20:58:27 +00:00
model_file = '%s.%s' % (params.upscale_model, params.platform)
model_path = path.join(ctx.model_path, model_file)
2023-01-16 00:04:10 +00:00
if not path.isfile(model_path):
2023-01-16 20:52:56 +00:00
raise Exception('Real ESRGAN model not found at %s' % model_path)
2023-01-16 00:04:10 +00:00
# use ONNX acceleration, if available
if params.platform == 'onnx':
2023-01-16 20:58:27 +00:00
model = ONNXNet(ctx, model_file)
2023-01-16 20:52:56 +00:00
elif params.platform == 'pth':
model = RRDBNet(num_in_ch=3, num_out_ch=3, num_feat=64,
num_block=23, num_grow_ch=32, scale=params.scale)
2023-01-16 20:52:56 +00:00
else:
raise Exception('unknown platform %s' % params.platform)
2023-01-16 00:04:10 +00:00
dni_weight = None
2023-01-16 20:52:56 +00:00
if params.upscale_model == 'realesr-general-x4v3' and params.denoise != 1:
2023-01-16 00:04:10 +00:00
wdn_model_path = model_path.replace(
'realesr-general-x4v3', 'realesr-general-wdn-x4v3')
model_path = [model_path, wdn_model_path]
dni_weight = [params.denoise, 1 - params.denoise]
2023-01-16 00:04:10 +00:00
2023-01-16 21:11:40 +00:00
# TODO: shouldn't need the PTH file
2023-01-16 00:04:10 +00:00
upsampler = RealESRGANer(
scale=params.scale,
2023-01-16 21:11:40 +00:00
model_path=path.join(ctx.model_path, '%s.pth' % params.upscale_model),
2023-01-16 00:04:10 +00:00
dni_weight=dni_weight,
model=model,
tile=tile,
tile_pad=tile_pad,
pre_pad=pre_pad,
2023-01-16 20:52:56 +00:00
half=params.half)
2023-01-16 00:04:10 +00:00
return upsampler
def upscale_resrgan(ctx: ServerContext, params: UpscaleParams, source_image: Image) -> Image:
print('upscaling image with Real ESRGAN', params)
image = np.array(source_image)
upsampler = make_resrgan(ctx, params)
2023-01-16 20:52:56 +00:00
output, _ = upsampler.enhance(image, outscale=params.outscale)
2023-01-16 00:04:10 +00:00
if params.faces:
output = upscale_gfpgan(ctx, params, output)
return Image.fromarray(output, 'RGB')
2023-01-16 00:04:10 +00:00
def upscale_gfpgan(ctx: ServerContext, params: UpscaleParams, image, upsampler=None) -> Image:
2023-01-16 20:52:56 +00:00
print('correcting faces with GFPGAN model: %s' % params.face_model)
if params.face_model is None:
print('no face model given, skipping')
return image
if upsampler is None:
upsampler = make_resrgan(ctx, params, tile=512)
2023-01-16 00:04:10 +00:00
face_enhancer = GFPGANer(
2023-01-16 20:52:56 +00:00
model_path=params.face_model,
upscale=params.outscale,
2023-01-16 00:04:10 +00:00
arch='clean',
channel_multiplier=2,
bg_upsampler=upsampler)
_, _, output = face_enhancer.enhance(
image, has_aligned=False, only_center_face=False, paste_back=True)
2023-01-16 00:04:10 +00:00
return output