# onnx-web/api/onnx_web/server/load.py
from functools import cmp_to_key
from glob import glob
from logging import getLogger
from os import path
from typing import Any, Dict, List, Union

import torch
import yaml
from jsonschema import ValidationError, validate
from yaml import safe_load
from ..image import (  # mask filters; noise sources
    mask_filter_gaussian_multiply,
    mask_filter_gaussian_screen,
    mask_filter_none,
    noise_source_fill_edge,
    noise_source_fill_mask,
    noise_source_gaussian,
    noise_source_histogram,
    noise_source_normal,
    noise_source_uniform,
)
from ..params import DeviceParams
from ..torch_before_ort import get_available_providers
from ..utils import merge
from .context import ServerContext

logger = getLogger(__name__)

# config caching
config_params: Dict[str, Dict[str, Union[float, int, str]]] = {}

# pipeline params
platform_providers = {
    "cpu": "CPUExecutionProvider",
    "cuda": "CUDAExecutionProvider",
    "directml": "DmlExecutionProvider",
    "rocm": "ROCMExecutionProvider",
}
noise_sources = {
    "fill-edge": noise_source_fill_edge,
    "fill-mask": noise_source_fill_mask,
    "gaussian": noise_source_gaussian,
    "histogram": noise_source_histogram,
    "normal": noise_source_normal,
    "uniform": noise_source_uniform,
}
mask_filters = {
    "none": mask_filter_none,
    "gaussian-multiply": mask_filter_gaussian_multiply,
    "gaussian-screen": mask_filter_gaussian_screen,
}

# available ORT providers
available_platforms: List[DeviceParams] = []

# loaded from model_path
correction_models: List[str] = []
diffusion_models: List[str] = []
inversion_models: List[str] = []
upscaling_models: List[str] = []

# loaded from extra_models
extra_strings: Dict[str, Any] = {}


def get_config_params():
    return config_params


def get_available_platforms():
    return available_platforms


def get_correction_models():
    return correction_models


def get_diffusion_models():
    return diffusion_models


def get_inversion_models():
    return inversion_models


def get_upscaling_models():
    return upscaling_models


def get_extra_strings():
    return extra_strings


def get_mask_filters():
    return mask_filters


def get_noise_sources():
    return noise_sources


def get_config_value(key: str, subkey: str = "default", default=None):
    return config_params.get(key, {}).get(subkey, default)
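

# A minimal usage sketch for get_config_value (the key names here are
# hypothetical, not taken from this file): if config_params holds
# {"width": {"default": 512, "min": 64}}, then get_config_value("width")
# returns 512, get_config_value("width", "min") returns 64, and
# get_config_value("width", "max", 1024) falls back to the given default, 1024.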


def get_model_name(model: str) -> str:
    base = path.basename(model)
    (file, _ext) = path.splitext(base)
    return file
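

# For example, get_model_name("/models/stable-diffusion-v1-5.onnx") returns
# "stable-diffusion-v1-5"; the path and file name here are illustrative only.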


def load_extras(context: ServerContext):
    """
    Load the extras file(s) and collect the relevant parts for the server: labels and strings.
    """
    global extra_strings

    labels = {}
    strings = {}

    with open("./schemas/extras.yaml", "r") as f:
        extra_schema = safe_load(f.read())

    for file in context.extra_models:
        if file is not None and file != "":
            logger.info("loading extra models from %s", file)
            try:
                with open(file, "r") as f:
                    data = safe_load(f.read())

                logger.debug("validating extras file %s", data)
                try:
                    validate(data, extra_schema)
                except ValidationError:
                    logger.exception("invalid data in extras file")
                    continue

                if "strings" in data:
                    logger.debug("collecting strings from %s", file)
                    merge(strings, data["strings"])

                for model_type in ["diffusion", "correction", "upscaling"]:
                    if model_type in data:
                        for model in data[model_type]:
                            # look up the name once so it is always bound, even
                            # for models that have inversions but no label
                            model_name = model["name"]

                            if "label" in model:
                                logger.debug(
                                    "collecting label for model %s from %s",
                                    model_name,
                                    file,
                                )
                                labels[model_name] = model["label"]

                            if "inversions" in model:
                                for inversion in model["inversions"]:
                                    if "label" in inversion:
                                        inversion_name = inversion["name"]
                                        logger.debug(
                                            "collecting label for inversion %s from %s",
                                            inversion_name,
                                            model_name,
                                        )
                                        labels[
                                            f"inversion-{inversion_name}"
                                        ] = inversion["label"]
            except Exception:
                logger.exception("error loading extras file")

    logger.debug("adding labels to strings: %s", labels)
    merge(
        strings,
        {
            "en": {
                "translation": {
                    "model": labels,
                }
            }
        },
    )

    extra_strings = strings
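

# A sketch of the extras data shape this loader expects, reconstructed from the
# checks above (names and labels are hypothetical; schemas/extras.yaml remains
# the authoritative schema):
#
#   strings:
#     en:
#       translation:
#         example-key: Example text
#   diffusion:
#     - name: diffusion-example
#       label: Example Diffusion
#       inversions:
#         - name: example-concept
#           label: Example Concept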


def list_model_globs(context: ServerContext, globs: List[str]) -> List[str]:
    models = []
    for pattern in globs:
        pattern_path = path.join(context.model_path, pattern)
        logger.debug("loading models from %s", pattern_path)
        models.extend([get_model_name(f) for f in glob(pattern_path)])

    unique_models = list(set(models))
    unique_models.sort()
    return unique_models
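

# For instance (hypothetical files): if context.model_path contains
# upscaling-swinir.onnx and upscaling-resrgan-x4.onnx, then
# list_model_globs(context, ["upscaling-*"]) returns the sorted, deduplicated
# names ["upscaling-resrgan-x4", "upscaling-swinir"].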


def load_models(context: ServerContext) -> None:
    global correction_models
    global diffusion_models
    global inversion_models
    global upscaling_models

    diffusion_models = list_model_globs(
        context,
        [
            "diffusion-*",
            "stable-diffusion-*",
        ],
    )
    logger.debug("loaded diffusion models from disk: %s", diffusion_models)

    correction_models = list_model_globs(
        context,
        [
            "correction-*",
        ],
    )
    logger.debug("loaded correction models from disk: %s", correction_models)

    inversion_models = list_model_globs(
        context,
        [
            "inversion-*",
        ],
    )
    logger.debug("loaded inversion models from disk: %s", inversion_models)

    upscaling_models = list_model_globs(
        context,
        [
            "upscaling-*",
        ],
    )
    logger.debug("loaded upscaling models from disk: %s", upscaling_models)
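

# The glob prefixes above are the on-disk naming convention: a file named
# stable-diffusion-example.onnx (hypothetical) in model_path would be listed
# as the diffusion model "stable-diffusion-example".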


def load_params(context: ServerContext) -> None:
    global config_params

    params_file = path.join(context.params_path, "params.json")
    logger.debug("loading server parameters from file: %s", params_file)

    with open(params_file, "r") as f:
        config_params = yaml.safe_load(f)

        if "platform" in config_params and context.default_platform is not None:
            logger.info(
                "overriding default platform from environment: %s",
                context.default_platform,
            )
            config_platform = config_params.get("platform", {})
            config_platform["default"] = context.default_platform
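

# Note that params.json is parsed with yaml.safe_load, which accepts JSON input
# as well. A hypothetical file matching the Dict[str, Dict[...]] shape used by
# get_config_value:
#
#   {
#     "width": {"default": 512, "min": 64, "max": 1024},
#     "platform": {"default": "cpu"}
#   }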


def load_platforms(context: ServerContext) -> None:
    global available_platforms

    providers = list(get_available_providers())
    logger.debug("loading available platforms from providers: %s", providers)

    for potential in platform_providers:
        if (
            platform_providers[potential] in providers
            and potential not in context.block_platforms
        ):
            if potential == "cuda":
                for i in range(torch.cuda.device_count()):
                    options = {
                        "device_id": i,
                    }

                    if context.memory_limit is not None:
                        options["arena_extend_strategy"] = "kSameAsRequested"
                        options["gpu_mem_limit"] = context.memory_limit

                    available_platforms.append(
                        DeviceParams(
                            potential,
                            platform_providers[potential],
                            options,
                            context.optimizations,
                        )
                    )
            else:
                available_platforms.append(
                    DeviceParams(
                        potential,
                        platform_providers[potential],
                        None,
                        context.optimizations,
                    )
                )

    if context.any_platform:
        # the platform should be ignored when the job is scheduled, but set to CPU just in case
        available_platforms.append(
            DeviceParams(
                "any",
                platform_providers["cpu"],
                None,
                context.optimizations,
            )
        )

    # make sure any is first and CPU is last on the list; check both sides so
    # the comparator stays consistent for sorted()
    def any_first_cpu_last(a: DeviceParams, b: DeviceParams):
        if a.device == b.device:
            return 0

        # any should be first, if it's available
        if a.device == "any":
            return -1
        if b.device == "any":
            return 1

        # cpu should be last, if it's available
        if a.device == "cpu":
            return 1
        if b.device == "cpu":
            return -1

        # leave other devices in discovery order (sorted is stable)
        return 0

    available_platforms = sorted(
        available_platforms, key=cmp_to_key(any_first_cpu_last)
    )

    logger.info(
        "available acceleration platforms: %s",
        ", ".join([str(p) for p in available_platforms]),
    )
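

# A minimal sketch of how these loaders fit together at server startup (the
# ServerContext construction shown is hypothetical; see .context for the real
# entry point):
#
#   context = ServerContext()
#   load_extras(context)
#   load_models(context)
#   load_params(context)
#   load_platforms(context)
#
# After loading, the platform list sorts to something like
# ["any", "cuda", "directml", "cpu"], and the get_* accessors above serve the
# cached results to request handlers.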