feat(api): add support for DAT upscalers
This commit is contained in:
parent
b7f2313489
commit
4a9ca4c4a8
|
@ -18,6 +18,7 @@ from .source_s3 import SourceS3Stage
|
|||
from .source_txt2img import SourceTxt2ImgStage
|
||||
from .source_url import SourceURLStage
|
||||
from .upscale_bsrgan import UpscaleBSRGANStage
|
||||
from .upscale_dat import UpscaleDATStage
|
||||
from .upscale_highres import UpscaleHighresStage
|
||||
from .upscale_outpaint import UpscaleOutpaintStage
|
||||
from .upscale_resrgan import UpscaleRealESRGANStage
|
||||
|
@ -47,6 +48,7 @@ CHAIN_STAGES = {
|
|||
"source-txt2img": SourceTxt2ImgStage,
|
||||
"source-url": SourceURLStage,
|
||||
"upscale-bsrgan": UpscaleBSRGANStage,
|
||||
"upscale-dat": UpscaleDATStage,
|
||||
"upscale-highres": UpscaleHighresStage,
|
||||
"upscale-outpaint": UpscaleOutpaintStage,
|
||||
"upscale-resrgan": UpscaleRealESRGANStage,
|
||||
|
|
|
@ -0,0 +1,116 @@
|
|||
from logging import getLogger
|
||||
from os import path
|
||||
from typing import Optional
|
||||
|
||||
import numpy as np
|
||||
from PIL import Image
|
||||
|
||||
from ..models.onnx import OnnxModel
|
||||
from ..params import (
|
||||
DeviceParams,
|
||||
ImageParams,
|
||||
Size,
|
||||
SizeChart,
|
||||
StageParams,
|
||||
UpscaleParams,
|
||||
)
|
||||
from ..server import ModelTypes, ServerContext
|
||||
from ..utils import run_gc
|
||||
from ..worker import WorkerContext
|
||||
from .base import BaseStage
|
||||
from .result import StageResult
|
||||
|
||||
logger = getLogger(__name__)
|
||||
|
||||
|
||||
class UpscaleDATStage(BaseStage):
    """Upscale images using a DAT (Dual Aggregation Transformer) ONNX model."""

    # cap the working tile at the smallest chart size; transformer attention
    # windows are memory-hungry at larger tiles
    max_tile = SizeChart.micro

    def load(
        self,
        server: ServerContext,
        _stage: StageParams,
        upscale: UpscaleParams,
        device: DeviceParams,
    ) -> OnnxModel:
        """
        Load the DAT ONNX model named by `upscale.upscale_model`, reusing a
        cached session for the same model path when one exists.
        """
        # must be within the load function for patch to take effect
        model_path = path.join(server.model_path, "%s.onnx" % (upscale.upscale_model))
        cache_key = (model_path,)
        cache_pipe = server.cache.get(ModelTypes.upscaling, cache_key)

        if cache_pipe is not None:
            logger.debug("reusing existing DAT pipeline")
            return cache_pipe

        logger.info("loading DAT model from %s", model_path)

        pipe = OnnxModel(
            server,
            model_path,
            provider=device.ort_provider(),
            sess_options=device.sess_options(),
        )

        server.cache.set(ModelTypes.upscaling, cache_key, pipe)
        run_gc([device])

        return pipe

    def run(
        self,
        worker: WorkerContext,
        server: ServerContext,
        stage: StageParams,
        _params: ImageParams,
        sources: StageResult,
        *,
        upscale: UpscaleParams,
        stage_source: Optional[Image.Image] = None,
        **kwargs,
    ) -> StageResult:
        """
        Upscale every image in `sources` with the DAT model and return the
        results as a new StageResult. Returns `sources` unchanged when no
        upscaling model is configured.
        """
        upscale = upscale.with_args(**kwargs)

        if upscale.upscale_model is None:
            logger.warning("no upscaling model given, skipping")
            return sources

        logger.info("upscaling with DAT model: %s", upscale.upscale_model)
        device = worker.get_device()
        dat = self.load(server, stage, upscale, device)

        outputs = []
        for source in sources.as_numpy():
            # HWC uint8 -> NCHW float32 in [0, 1], with the channel order
            # reversed ([2, 1, 0]) to match the model's training layout
            # (presumably RGB input from PIL -> BGR; confirm against converter)
            image = source / 255.0
            image = image[:, :, [2, 1, 0]].astype(np.float32).transpose((2, 0, 1))
            image = np.expand_dims(image, axis=0)
            logger.trace("DAT input shape: %s", image.shape)

            scale = upscale.outscale
            logger.trace(
                "DAT output shape: %s",
                (
                    image.shape[0],
                    image.shape[1],
                    image.shape[2] * scale,
                    image.shape[3] * scale,
                ),
            )

            output = dat(image)

            # NCHW float -> HWC uint8, undoing the channel swap above
            output = np.clip(np.squeeze(output, axis=0), 0, 1)
            output = output[[2, 1, 0], :, :].transpose((1, 2, 0))
            output = (output * 255.0).round().astype(np.uint8)

            logger.debug("output image shape: %s", output.shape)
            outputs.append(output)

        return StageResult(arrays=outputs)

    def steps(
        self,
        params: ImageParams,
        size: Size,
    ) -> int:
        """Estimate the number of tiles needed to upscale an image of `size`."""
        tile = min(params.unet_tile, self.max_tile)
        # tiles per row times tiles per column; the original expression
        # `size.width // tile * size.height // tile` evaluated left to right
        # as ((w // t) * h) // t, which over-counts whenever the height is
        # not a multiple of the tile size
        return (size.width // tile) * (size.height // tile)
|
|
@ -25,6 +25,7 @@ from .diffusion.diffusion_xl import convert_diffusion_diffusers_xl
|
|||
from .diffusion.lora import blend_loras
|
||||
from .diffusion.textual_inversion import blend_textual_inversions
|
||||
from .upscaling.bsrgan import convert_upscaling_bsrgan
|
||||
from .upscaling.dat import convert_upscaling_dat
|
||||
from .upscaling.resrgan import convert_upscale_resrgan
|
||||
from .upscaling.swinir import convert_upscaling_swinir
|
||||
from .utils import (
|
||||
|
@ -395,7 +396,9 @@ def convert_model_upscaling(conversion: ConversionContext, model):
|
|||
model_type = model.get("model", "resrgan")
|
||||
if model_type == "bsrgan":
|
||||
convert_upscaling_bsrgan(conversion, model, source)
|
||||
elif model_type == "resrgan":
|
||||
elif model_type == "dat":
|
||||
convert_upscaling_dat(conversion, model, source)
|
||||
elif model_type in ["esrgan", "resrgan"]:
|
||||
convert_upscale_resrgan(conversion, model, source)
|
||||
elif model_type == "swinir":
|
||||
convert_upscaling_swinir(conversion, model, source)
|
||||
|
|
|
@ -0,0 +1,70 @@
|
|||
from logging import getLogger
|
||||
from os import path
|
||||
|
||||
import torch
|
||||
from torch.onnx import export
|
||||
|
||||
from ...models.dat import DAT
|
||||
from ..utils import ConversionContext, ModelDict
|
||||
|
||||
logger = getLogger(__name__)
|
||||
|
||||
|
||||
@torch.no_grad()
def convert_upscaling_dat(
    conversion: ConversionContext,
    model: ModelDict,
    source: str,
):
    """
    Convert a DAT upscaling checkpoint to ONNX.

    Loads the Torch checkpoint from `source` (falling back to the model's own
    "source" entry), instantiates a DAT network, and exports it to ONNX with
    dynamic height/width axes. Skips conversion when the destination file
    already exists.
    """
    name = model.get("name")
    source = source or model.get("source")
    scale = model.get("scale", 1)

    dest = path.join(conversion.model_path, name + ".onnx")
    logger.info("converting DAT model: %s -> %s", name, dest)

    if path.isfile(dest):
        logger.info("ONNX model already exists, skipping")
        return

    model = DAT(
        # TODO: params — these look like RRDBNet/ESRGAN constructor arguments;
        # confirm against the DAT constructor signature
        num_in_ch=3,
        num_out_ch=3,
        num_feat=64,
        num_block=23,
        num_grow_ch=32,
        scale=scale,
    )

    torch_model = torch.load(source, map_location=conversion.map_location)
    # checkpoints may store their weights under "params_ema" or "params";
    # strict=False tolerates key mismatches but will silently skip them
    if "params_ema" in torch_model:
        model.load_state_dict(torch_model["params_ema"], strict=False)
    elif "params" in torch_model:
        model.load_state_dict(torch_model["params"], strict=False)
    else:
        model.load_state_dict(torch_model, strict=False)

    model.to(conversion.training_device).train(False)
    model.eval()

    # create the tracing input on the same device as the model; the original
    # used conversion.map_location here, which would fail the export whenever
    # the training device differs from the checkpoint map location
    rng = torch.rand(1, 3, 64, 64, device=conversion.training_device)
    input_names = ["input"]
    output_names = ["output"]
    dynamic_axes = {
        "input": {2: "h", 3: "w"},
        "output": {2: "h", 3: "w"},
    }

    logger.info("exporting ONNX model to %s", dest)
    export(
        model,
        rng,
        dest,
        input_names=input_names,
        output_names=output_names,
        dynamic_axes=dynamic_axes,
        opset_version=conversion.opset,
        export_params=True,
    )
    logger.info("DAT exported to ONNX successfully")
|
File diff suppressed because it is too large
Load Diff
|
@ -145,6 +145,8 @@ $defs:
|
|||
type: string
|
||||
enum: [
|
||||
bsrgan,
|
||||
dat,
|
||||
esrgan,
|
||||
resrgan,
|
||||
swinir
|
||||
]
|
||||
|
|
Loading…
Reference in New Issue