onnx-web/api/onnx_web/convert/__main__.py

import warnings
from argparse import ArgumentParser
from json import loads
from logging import getLogger
from os import environ, makedirs, path
from sys import exit
from typing import Dict, List, Optional, Tuple
from yaml import safe_load
from jsonschema import validate, ValidationError

import torch

from .correction_gfpgan import convert_correction_gfpgan
from .diffusion_original import convert_diffusion_original
from .diffusion_stable import convert_diffusion_stable
from .upscale_resrgan import convert_upscale_resrgan
from .utils import ConversionContext, download_progress, source_format, tuple_to_correction, tuple_to_diffusion, tuple_to_upscaling

# suppress common but harmless warnings, https://github.com/ssube/onnx-web/issues/75
warnings.filterwarnings(
    "ignore", ".*The shape inference of prim::Constant type is missing.*"
)
warnings.filterwarnings("ignore", ".*Only steps=1 can be constant folded.*")
warnings.filterwarnings(
    "ignore",
    ".*Converting a tensor to a Python boolean might cause the trace to be incorrect.*",
)

Models = Dict[str, List[Tuple[str, str, Optional[int]]]]

logger = getLogger(__name__)


model_sources: Dict[str, Tuple[str, str]] = {
    "civitai://": ("Civitai", "https://civitai.com/api/download/models/%s"),
}

model_source_huggingface = "huggingface://"

# recommended models
base_models: Models = {
    "diffusion": [
        # v1.x
        (
            "stable-diffusion-onnx-v1-5",
            model_source_huggingface + "runwayml/stable-diffusion-v1-5",
        ),
        (
            "stable-diffusion-onnx-v1-inpainting",
            model_source_huggingface + "runwayml/stable-diffusion-inpainting",
        ),
        # v2.x
        (
            "stable-diffusion-onnx-v2-1",
            model_source_huggingface + "stabilityai/stable-diffusion-2-1",
        ),
        (
            "stable-diffusion-onnx-v2-inpainting",
            model_source_huggingface + "stabilityai/stable-diffusion-2-inpainting",
        ),
        # TODO: should have its own converter
        (
            "upscaling-stable-diffusion-x4",
            model_source_huggingface + "stabilityai/stable-diffusion-x4-upscaler",
            True,
        ),
    ],
    "correction": [
        (
            "correction-gfpgan-v1-3",
            "https://github.com/TencentARC/GFPGAN/releases/download/v1.3.0/GFPGANv1.3.pth",
            4,
        ),
        (
            "correction-codeformer",
            "https://github.com/sczhou/CodeFormer/releases/download/v0.1.0/codeformer.pth",
            1,
        ),
    ],
    "upscaling": [
        (
            "upscaling-real-esrgan-x2-plus",
            "https://github.com/xinntao/Real-ESRGAN/releases/download/v0.2.1/RealESRGAN_x2plus.pth",
            2,
        ),
        (
            "upscaling-real-esrgan-x4-plus",
            "https://github.com/xinntao/Real-ESRGAN/releases/download/v0.1.0/RealESRGAN_x4plus.pth",
            4,
        ),
        (
            "upscaling-real-esrgan-x4-v3",
            "https://github.com/xinntao/Real-ESRGAN/releases/download/v0.2.5.0/realesr-general-x4v3.pth",
            4,
        ),
    ],
}

model_path = environ.get("ONNX_WEB_MODEL_PATH", path.join("..", "models"))
training_device = "cuda" if torch.cuda.is_available() else "cpu"


def fetch_model(ctx: ConversionContext, name: str, source: str, format: Optional[str] = None) -> str:
    cache_name = path.join(ctx.cache_path, name)
    if format is not None:
        # add an extension if possible, some of the conversion code checks for it
        cache_name = "%s.%s" % (cache_name, format)

    for proto in model_sources:
        api_name, api_root = model_sources.get(proto)
        if source.startswith(proto):
            api_source = api_root % (source.removeprefix(proto))
            logger.info("Downloading model from %s: %s -> %s", api_name, api_source, cache_name)
            return download_progress([(api_source, cache_name)])

    if source.startswith(model_source_huggingface):
        hub_source = source.removeprefix(model_source_huggingface)
        logger.info("Downloading model from Huggingface Hub: %s", hub_source)
        # from_pretrained has a bunch of useful logic that snapshot_download by itself down not
        return hub_source
    elif source.startswith("https://"):
        logger.info("Downloading model from: %s", source)
        return download_progress([(source, cache_name)])
    elif source.startswith("http://"):
        logger.warning("Downloading model from insecure source: %s", source)
        return download_progress([(source, cache_name)])
    elif source.startswith(path.sep) or source.startswith("."):
        logger.info("Using local model: %s", source)
        return source
    else:
        logger.info("Unknown model location, using path as provided: %s", source)
        return source


def convert_models(ctx: ConversionContext, args, models: Models):
    if args.diffusion:
        for model in models.get("diffusion"):
            model = tuple_to_diffusion(model)
            name = model.get("name")

            if name in args.skip:
                logger.info("Skipping model: %s", name)
            else:
                format = source_format(model)
                source = fetch_model(ctx, name, model["source"], format=format)

                if format in ["safetensors", "ckpt"]:
                    convert_diffusion_original(
                        ctx,
                        model,
                        source,
                    )
                else:
                    convert_diffusion_stable(
                        ctx,
                        model,
                        source,
                    )

    if args.upscaling:
        for model in models.get("upscaling"):
            model = tuple_to_upscaling(model)
            name = model.get("name")

            if name in args.skip:
                logger.info("Skipping model: %s", name)
            else:
                format = source_format(model)
                source = fetch_model(ctx, name, model["source"], format=format)
                convert_upscale_resrgan(ctx, model, source)

    if args.correction:
        for model in models.get("correction"):
            model = tuple_to_correction(model)
            name = model.get("name")

            if name in args.skip:
                logger.info("Skipping model: %s", name)
            else:
                format = source_format(model)
                source = fetch_model(ctx, name, model["source"], format=format)
                convert_correction_gfpgan(ctx, model, source)


def main() -> int:
    parser = ArgumentParser(
        prog="onnx-web model converter", description="convert checkpoint models to ONNX"
    )

    # model groups
    parser.add_argument("--correction", action="store_true", default=False)
    parser.add_argument("--diffusion", action="store_true", default=False)
    parser.add_argument("--upscaling", action="store_true", default=False)

    # extra models
    parser.add_argument("--extras", nargs="*", type=str, default=[])
    parser.add_argument("--skip", nargs="*", type=str, default=[])

    # export options
    parser.add_argument(
        "--half",
        action="store_true",
        default=False,
        help="Export models for half precision, faster on some Nvidia cards.",
    )
    parser.add_argument(
        "--opset",
        default=14,
        type=int,
        help="The version of the ONNX operator set to use.",
    )
    parser.add_argument(
        "--token",
        type=str,
        help="HuggingFace token with read permissions for downloading models.",
    )

    args = parser.parse_args()
    logger.info("CLI arguments: %s", args)

    ctx = ConversionContext(model_path, training_device, half=args.half, opset=args.opset, token=args.token)
    logger.info("Converting models in %s using %s", ctx.model_path, ctx.training_device)

    if not path.exists(model_path):
        logger.info("Model path does not existing, creating: %s", model_path)
        makedirs(model_path)

    logger.info("Converting base models.")
    convert_models(ctx, args, base_models)

    for file in args.extras:
        if file is not None and file != "":
            logger.info("Loading extra models from %s", file)
            try:
                with open(file, "r") as f:
                    data = safe_load(f.read())

                with open("./schemas/extras.yaml", "r") as f:
                    schema = safe_load(f.read())

                logger.debug("validating chain request: %s against %s", data, schema)

                try:
                    validate(data, schema)
                    logger.info("Converting extra models.")
                    convert_models(ctx, args, data)
                except ValidationError as err:
                    logger.error("Invalid data in extras file: %s", err)
            except Exception as err:
                logger.error("Error converting extra models: %s", err)

    return 0


if __name__ == "__main__":
    exit(main())
feat(api): convert from SD checkpoints (#117) 2023-02-09 04:35:54 +00:00			`import warnings`
			`from argparse import ArgumentParser`
			`from json import loads`
			`from logging import getLogger`
			`from os import environ, makedirs, path`
			`from sys import exit`
			`from typing import Dict, List, Optional, Tuple`
feat(api): add a way to download models from civitai or other https sources (#117) 2023-02-11 04:41:24 +00:00			`from yaml import safe_load`
			`from jsonschema import validate, ValidationError`
feat(api): convert from SD checkpoints (#117) 2023-02-09 04:35:54 +00:00
			`import torch`

feat(api): add a way to download models from civitai or other https sources (#117) 2023-02-11 04:41:24 +00:00			`from .correction_gfpgan import convert_correction_gfpgan`
			`from .diffusion_original import convert_diffusion_original`
			`from .diffusion_stable import convert_diffusion_stable`
			`from .upscale_resrgan import convert_upscale_resrgan`
			`from .utils import ConversionContext, download_progress, source_format, tuple_to_correction, tuple_to_diffusion, tuple_to_upscaling`

feat(api): convert from SD checkpoints (#117) 2023-02-09 04:35:54 +00:00			`# suppress common but harmless warnings, https://github.com/ssube/onnx-web/issues/75`
			`warnings.filterwarnings(`
			`"ignore", ".The shape inference of prim::Constant type is missing."`
			`)`
			`warnings.filterwarnings("ignore", ".Only steps=1 can be constant folded.")`
			`warnings.filterwarnings(`
			`"ignore",`
			`".Converting a tensor to a Python boolean might cause the trace to be incorrect.",`
			`)`

			`Models = Dict[str, List[Tuple[str, str, Optional[int]]]]`

			`logger = getLogger(__name__)`


feat(api): add a way to download models from civitai or other https sources (#117) 2023-02-11 04:41:24 +00:00			`model_sources: Dict[str, Tuple[str, str]] = {`
			`"civitai://": ("Civitai", "https://civitai.com/api/download/models/%s"),`
			`}`

			`model_source_huggingface = "huggingface://"`

feat(api): convert from SD checkpoints (#117) 2023-02-09 04:35:54 +00:00			`# recommended models`
			`base_models: Models = {`
			`"diffusion": [`
			`# v1.x`
			`(`
feat(api): add a way to download models from civitai or other https sources (#117) 2023-02-11 04:41:24 +00:00			`"stable-diffusion-onnx-v1-5",`
			`model_source_huggingface + "runwayml/stable-diffusion-v1-5",`
feat(api): convert from SD checkpoints (#117) 2023-02-09 04:35:54 +00:00			`),`
fix(api): launch with included extras if user does not provide their own 2023-02-11 05:06:30 +00:00			`(`
			`"stable-diffusion-onnx-v1-inpainting",`
			`model_source_huggingface + "runwayml/stable-diffusion-inpainting",`
			`),`
feat(api): add a way to download models from civitai or other https sources (#117) 2023-02-11 04:41:24 +00:00			`# v2.x`
fix(api): launch with included extras if user does not provide their own 2023-02-11 05:06:30 +00:00			`(`
			`"stable-diffusion-onnx-v2-1",`
			`model_source_huggingface + "stabilityai/stable-diffusion-2-1",`
			`),`
			`(`
			`"stable-diffusion-onnx-v2-inpainting",`
			`model_source_huggingface + "stabilityai/stable-diffusion-2-inpainting",`
			`),`
feat(api): convert from SD checkpoints (#117) 2023-02-09 04:35:54 +00:00			`# TODO: should have its own converter`
feat(api): add a way to download models from civitai or other https sources (#117) 2023-02-11 04:41:24 +00:00			`(`
			`"upscaling-stable-diffusion-x4",`
			`model_source_huggingface + "stabilityai/stable-diffusion-x4-upscaler",`
			`True,`
			`),`
feat(api): convert from SD checkpoints (#117) 2023-02-09 04:35:54 +00:00			`],`
			`"correction": [`
			`(`
			`"correction-gfpgan-v1-3",`
			`"https://github.com/TencentARC/GFPGAN/releases/download/v1.3.0/GFPGANv1.3.pth",`
			`4,`
			`),`
			`(`
			`"correction-codeformer",`
			`"https://github.com/sczhou/CodeFormer/releases/download/v0.1.0/codeformer.pth",`
			`1,`
			`),`
			`],`
			`"upscaling": [`
			`(`
			`"upscaling-real-esrgan-x2-plus",`
			`"https://github.com/xinntao/Real-ESRGAN/releases/download/v0.2.1/RealESRGAN_x2plus.pth",`
			`2,`
			`),`
			`(`
			`"upscaling-real-esrgan-x4-plus",`
			`"https://github.com/xinntao/Real-ESRGAN/releases/download/v0.1.0/RealESRGAN_x4plus.pth",`
			`4,`
			`),`
			`(`
			`"upscaling-real-esrgan-x4-v3",`
			`"https://github.com/xinntao/Real-ESRGAN/releases/download/v0.2.5.0/realesr-general-x4v3.pth",`
			`4,`
			`),`
			`],`
			`}`

			`model_path = environ.get("ONNX_WEB_MODEL_PATH", path.join("..", "models"))`
			`training_device = "cuda" if torch.cuda.is_available() else "cpu"`


feat(api): add a way to download models from civitai or other https sources (#117) 2023-02-11 04:41:24 +00:00			`def fetch_model(ctx: ConversionContext, name: str, source: str, format: Optional[str] = None) -> str:`
			`cache_name = path.join(ctx.cache_path, name)`
			`if format is not None:`
			`# add an extension if possible, some of the conversion code checks for it`
			`cache_name = "%s.%s" % (cache_name, format)`

			`for proto in model_sources:`
			`api_name, api_root = model_sources.get(proto)`
			`if source.startswith(proto):`
			`api_source = api_root % (source.removeprefix(proto))`
			`logger.info("Downloading model from %s: %s -> %s", api_name, api_source, cache_name)`
			`return download_progress([(api_source, cache_name)])`

			`if source.startswith(model_source_huggingface):`
			`hub_source = source.removeprefix(model_source_huggingface)`
			`logger.info("Downloading model from Huggingface Hub: %s", hub_source)`
			`# from_pretrained has a bunch of useful logic that snapshot_download by itself down not`
			`return hub_source`
			`elif source.startswith("https://"):`
			`logger.info("Downloading model from: %s", source)`
			`return download_progress([(source, cache_name)])`
			`elif source.startswith("http://"):`
			`logger.warning("Downloading model from insecure source: %s", source)`
			`return download_progress([(source, cache_name)])`
			`elif source.startswith(path.sep) or source.startswith("."):`
			`logger.info("Using local model: %s", source)`
			`return source`
			`else:`
			`logger.info("Unknown model location, using path as provided: %s", source)`
			`return source`


			`def convert_models(ctx: ConversionContext, args, models: Models):`
feat(api): convert from SD checkpoints (#117) 2023-02-09 04:35:54 +00:00			`if args.diffusion:`
feat(api): add a way to download models from civitai or other https sources (#117) 2023-02-11 04:41:24 +00:00			`for model in models.get("diffusion"):`
			`model = tuple_to_diffusion(model)`
			`name = model.get("name")`

feat(api): convert from SD checkpoints (#117) 2023-02-09 04:35:54 +00:00			`if name in args.skip:`
feat(api): add a way to download models from civitai or other https sources (#117) 2023-02-11 04:41:24 +00:00			`logger.info("Skipping model: %s", name)`
feat(api): convert from SD checkpoints (#117) 2023-02-09 04:35:54 +00:00			`else:`
feat(api): add a way to download models from civitai or other https sources (#117) 2023-02-11 04:41:24 +00:00			`format = source_format(model)`
			`source = fetch_model(ctx, name, model["source"], format=format)`

			`if format in ["safetensors", "ckpt"]:`
			`convert_diffusion_original(`
			`ctx,`
			`model,`
			`source,`
			`)`
feat(api): convert from SD checkpoints (#117) 2023-02-09 04:35:54 +00:00			`else:`
			`convert_diffusion_stable(`
feat(api): add a way to download models from civitai or other https sources (#117) 2023-02-11 04:41:24 +00:00			`ctx,`
			`model,`
			`source,`
feat(api): convert from SD checkpoints (#117) 2023-02-09 04:35:54 +00:00			`)`

			`if args.upscaling:`
feat(api): add a way to download models from civitai or other https sources (#117) 2023-02-11 04:41:24 +00:00			`for model in models.get("upscaling"):`
			`model = tuple_to_upscaling(model)`
			`name = model.get("name")`

			`if name in args.skip:`
			`logger.info("Skipping model: %s", name)`
feat(api): convert from SD checkpoints (#117) 2023-02-09 04:35:54 +00:00			`else:`
feat(api): add a way to download models from civitai or other https sources (#117) 2023-02-11 04:41:24 +00:00			`format = source_format(model)`
			`source = fetch_model(ctx, name, model["source"], format=format)`
			`convert_upscale_resrgan(ctx, model, source)`
feat(api): convert from SD checkpoints (#117) 2023-02-09 04:35:54 +00:00
			`if args.correction:`
feat(api): add a way to download models from civitai or other https sources (#117) 2023-02-11 04:41:24 +00:00			`for model in models.get("correction"):`
			`model = tuple_to_correction(model)`
			`name = model.get("name")`

			`if name in args.skip:`
			`logger.info("Skipping model: %s", name)`
feat(api): convert from SD checkpoints (#117) 2023-02-09 04:35:54 +00:00			`else:`
feat(api): add a way to download models from civitai or other https sources (#117) 2023-02-11 04:41:24 +00:00			`format = source_format(model)`
			`source = fetch_model(ctx, name, model["source"], format=format)`
			`convert_correction_gfpgan(ctx, model, source)`
feat(api): convert from SD checkpoints (#117) 2023-02-09 04:35:54 +00:00

			`def main() -> int:`
			`parser = ArgumentParser(`
			`prog="onnx-web model converter", description="convert checkpoint models to ONNX"`
			`)`

			`# model groups`
			`parser.add_argument("--correction", action="store_true", default=False)`
			`parser.add_argument("--diffusion", action="store_true", default=False)`
			`parser.add_argument("--upscaling", action="store_true", default=False)`

			`# extra models`
			`parser.add_argument("--extras", nargs="*", type=str, default=[])`
			`parser.add_argument("--skip", nargs="*", type=str, default=[])`

			`# export options`
			`parser.add_argument(`
			`"--half",`
			`action="store_true",`
			`default=False,`
			`help="Export models for half precision, faster on some Nvidia cards.",`
			`)`
			`parser.add_argument(`
			`"--opset",`
			`default=14,`
			`type=int,`
			`help="The version of the ONNX operator set to use.",`
			`)`
			`parser.add_argument(`
			`"--token",`
			`type=str,`
			`help="HuggingFace token with read permissions for downloading models.",`
			`)`

			`args = parser.parse_args()`
			`logger.info("CLI arguments: %s", args)`

feat(api): add a way to download models from civitai or other https sources (#117) 2023-02-11 04:41:24 +00:00			`ctx = ConversionContext(model_path, training_device, half=args.half, opset=args.opset, token=args.token)`
feat(api): convert from SD checkpoints (#117) 2023-02-09 04:35:54 +00:00			`logger.info("Converting models in %s using %s", ctx.model_path, ctx.training_device)`

			`if not path.exists(model_path):`
			`logger.info("Model path does not existing, creating: %s", model_path)`
			`makedirs(model_path)`

			`logger.info("Converting base models.")`
feat(api): add a way to download models from civitai or other https sources (#117) 2023-02-11 04:41:24 +00:00			`convert_models(ctx, args, base_models)`
feat(api): convert from SD checkpoints (#117) 2023-02-09 04:35:54 +00:00
			`for file in args.extras:`
			`if file is not None and file != "":`
			`logger.info("Loading extra models from %s", file)`
			`try:`
			`with open(file, "r") as f:`
feat(api): add a way to download models from civitai or other https sources (#117) 2023-02-11 04:41:24 +00:00			`data = safe_load(f.read())`

			`with open("./schemas/extras.yaml", "r") as f:`
			`schema = safe_load(f.read())`

			`logger.debug("validating chain request: %s against %s", data, schema)`

			`try:`
			`validate(data, schema)`
feat(api): convert from SD checkpoints (#117) 2023-02-09 04:35:54 +00:00			`logger.info("Converting extra models.")`
feat(api): add a way to download models from civitai or other https sources (#117) 2023-02-11 04:41:24 +00:00			`convert_models(ctx, args, data)`
			`except ValidationError as err:`
			`logger.error("Invalid data in extras file: %s", err)`
feat(api): convert from SD checkpoints (#117) 2023-02-09 04:35:54 +00:00			`except Exception as err:`
			`logger.error("Error converting extra models: %s", err)`

			`return 0`


			`if __name__ == "__main__":`
			`exit(main())`