1
0
Fork 0
onnx-web/api/onnx_web/chain/correct_gfpgan.py

95 lines
2.7 KiB
Python

from logging import getLogger
from os import path
from typing import Optional
from PIL import Image
from ..params import (
DeviceParams,
HighresParams,
ImageParams,
StageParams,
UpscaleParams,
)
from ..server import ModelTypes, ServerContext
from ..utils import run_gc
from ..worker import WorkerContext
from .base import BaseStage
from .result import StageResult
logger = getLogger(__name__)
class CorrectGFPGANStage(BaseStage):
def load(
self,
server: ServerContext,
_stage: StageParams,
upscale: UpscaleParams,
device: DeviceParams,
):
# must be within the load function for patch to take effect
# TODO: rewrite and remove
from gfpgan import GFPGANer
face_path = path.join(server.cache_path, "%s.pth" % (upscale.correction_model))
cache_key = (face_path,)
cache_pipe = server.cache.get(ModelTypes.correction, cache_key)
if cache_pipe is not None:
logger.info("reusing existing GFPGAN pipeline")
return cache_pipe
logger.debug("loading GFPGAN model from %s", face_path)
# TODO: find a way to pass the ONNX model to underlying architectures
gfpgan = GFPGANer(
arch="clean",
bg_upsampler=None,
channel_multiplier=2,
device=device.torch_str(),
model_path=face_path,
upscale=upscale.face_outscale,
)
server.cache.set(ModelTypes.correction, cache_key, gfpgan)
run_gc([device])
return gfpgan
def run(
self,
worker: WorkerContext,
server: ServerContext,
stage: StageParams,
_params: ImageParams,
sources: StageResult,
*,
upscale: UpscaleParams,
highres: Optional[HighresParams] = None,
stage_source: Optional[Image.Image] = None,
**kwargs,
) -> StageResult:
upscale = upscale.with_args(**kwargs)
if upscale.correction_model is None:
logger.warning("no face model given, skipping")
return sources
logger.info("correcting faces with GFPGAN model: %s", upscale.correction_model)
device = worker.get_device()
gfpgan = self.load(server, stage, upscale, device)
outputs = []
for source in sources.as_arrays():
cropped, restored, result = gfpgan.enhance(
source,
has_aligned=False,
only_center_face=False,
paste_back=True,
weight=upscale.face_strength,
)
outputs.append(result)
return StageResult.from_arrays(outputs, metadata=sources.metadata)