feat(api): add basic upscaling

2023-01-15 18:04:10 -06:00 · 2023-01-15 18:04:10 -06:00 · 77cb84c60e
parent 64fac4d7aa
commit 77cb84c60e
3 changed files with 78 additions and 0 deletions
--- a/README.md
+++ b/README.md
@ -52,6 +52,7 @@ Based on guides by:
    - [Note about setup paths](#note-about-setup-paths)
    - [Create a virtual environment](#create-a-virtual-environment)
    - [Install pip packages](#install-pip-packages)
      - [For upscaling and face correction](#for-upscaling-and-face-correction)
      - [For AMD on Windows: Install ONNX DirectML](#for-amd-on-windows-install-onnx-directml)
      - [For CPU on Linux: Install PyTorch CPU](#for-cpu-on-linux-install-pytorch-cpu)
      - [For CPU on Windows: Install PyTorch CPU](#for-cpu-on-windows-install-pytorch-cpu)
@ -190,6 +191,12 @@ sure you are not using `numpy>=1.24`.
 [This SO question](https://stackoverflow.com/questions/74844262/how-to-solve-error-numpy-has-no-attribute-float-in-python)
 has more details.
 #### For upscaling and face correction
 ```shell
 > pip install basicsr facexlib gfpgan realesrgan
 ```
 #### For AMD on Windows: Install ONNX DirectML
 If you are running on Windows, install the DirectML ONNX runtime as well:
--- a/api/onnx_web/serve.py
+++ b/api/onnx_web/serve.py
@ -44,6 +44,11 @@ from .image import (
    noise_source_uniform,
 )
 from .upscale import (
    upscale_gfpgan,
    upscale_resrgan,
 )
 import json
 import numpy as np
 import time
@ -268,6 +273,8 @@ def run_txt2img_pipeline(model, provider, scheduler, prompt, negative_prompt, cf
        negative_prompt=negative_prompt,
        num_inference_steps=steps,
    ).images[0]
    image = upscale_resrgan(image)
    image.save(output)
    print('saved txt2img output: %s' % (output))
--- a/api/onnx_web/upscale.py
+++ b/api/onnx_web/upscale.py
@ -0,0 +1,64 @@
 from basicsr.archs.rrdbnet_arch import RRDBNet
 from basicsr.utils.download_util import load_file_from_url
 from gfpgan import GFPGANer
 from os import path
 from PIL import Image
 from realesrgan import RealESRGANer
 denoise_strength = 0.5
 gfpgan_url = 'https://github.com/TencentARC/GFPGAN/releases/download/v1.3.0/GFPGANv1.3.pth'
 resrgan_url = [
    'https://github.com/xinntao/Real-ESRGAN/releases/download/v0.1.0/RealESRGAN_x4plus.pth']
 fp32 = True
 model_name = 'RealESRGAN_x4plus'
 netscale = 4
 outscale = 4
 pre_pad = 0
 tile = 0
 tile_pad = 10
 def upscale_resrgan(source_image: Image) -> Image:
    model_path = path.join('weights', model_name + '.pth')
    if not path.isfile(model_path):
        ROOT_DIR = os.path.dirname(path.abspath(__file__))
        for url in resrgan_url:
            model_path = load_file_from_url(
                url=url, model_dir=path.join(ROOT_DIR, 'weights'), progress=True, file_name=None)
    model = RRDBNet(num_in_ch=3, num_out_ch=3, num_feat=64,
                    num_block=23, num_grow_ch=32, scale=4)
    dni_weight = None
    if model_name == 'realesr-general-x4v3' and denoise_strength != 1:
        wdn_model_path = model_path.replace(
            'realesr-general-x4v3', 'realesr-general-wdn-x4v3')
        model_path = [model_path, wdn_model_path]
        dni_weight = [denoise_strength, 1 - denoise_strength]
    upsampler = RealESRGANer(
        scale=netscale,
        model_path=model_path,
        dni_weight=dni_weight,
        model=model,
        tile=tile,
        tile_pad=tile_pad,
        pre_pad=pre_pad,
        half=fp32)
    output, _ = upsampler.enhance(source_image, outscale=outscale)
    return upscale_gfpgan(output, upsampler)
 def upscale_gfpgan(source_image: Image, upsampler) -> Image:
    face_enhancer = GFPGANer(
        model_path=gfpgan_url,
        upscale=outscale,
        arch='clean',
        channel_multiplier=2,
        bg_upsampler=upsampler)
    _, _, output = face_enhancer.enhance(source_image, has_aligned=False, only_center_face=False, paste_back=True)
    return output