onnx-web/api/onnx_web/server/model_cache.py

from enum import Enum
from logging import getLogger
from typing import Any, List, Tuple

logger = getLogger(__name__)

# module-level cache shared by every ModelCache instance
cache: List[Tuple[str, Any, Any]] = []


class ModelTypes(str, Enum):
    correction = "correction"
    diffusion = "diffusion"
    scheduler = "scheduler"
    upscaling = "upscaling"
    safety = "safety"


class ModelCache:
    # cache: List[Tuple[str, Any, Any]]
    limit: int

    def __init__(self, limit: int) -> None:
        self.limit = limit
        logger.debug("creating model cache with limit of %s models", limit)

    def drop(self, tag: str, key: Any) -> int:
        global cache

        logger.debug("dropping item from cache: %s %s", tag, key)
        removed = [model for model in cache if model[0] == tag and model[1] == key]
        for item in removed:
            cache.remove(item)

        return len(removed)

    def get(self, tag: str, key: Any) -> Any:
        global cache

        for t, k, v in cache:
            if tag == t and key == k:
                logger.debug("found cached model: %s %s", tag, key)
                return v

        logger.debug("model not found in cache: %s %s", tag, key)
        return None

    def set(self, tag: str, key: Any, value: Any) -> None:
        global cache

        if self.limit == 0:
            logger.debug("cache limit set to 0, not caching model: %s", tag)
            return

        for i in range(len(cache)):
            t, k, _v = cache[i]
            if tag == t and key != k:
                # a different model with the same tag is already cached, replace it
                logger.debug("updating model cache: %s %s", tag, key)
                cache[i] = (tag, key, value)
                return

        logger.debug("adding new model to cache: %s %s", tag, key)
        cache.append((tag, key, value))
        self.prune()

    def clear(self):
        global cache
        cache.clear()

    def prune(self):
        global cache

        total = len(cache)
        overage = total - self.limit
        if overage > 0:
            # drop the oldest entries, keeping the most recently added models
            removed = cache[:overage]
            logger.info(
                "removing %s of %s models from cache, %s",
                overage,
                total,
                [m[0] for m in removed],
            )
            cache[:] = cache[-self.limit :]
        else:
            logger.debug("model cache below limit, %s of %s", total, self.limit)

    @property
    def size(self):
        global cache
        return len(cache)
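

# A minimal usage sketch (not part of the original file): how server code might
# share one ModelCache between requests, caching a loaded pipeline under a
# (tag, key) pair. The model name and `load_diffusion_model` helper below are
# hypothetical placeholders, not part of this module.
#
#   model_cache = ModelCache(limit=2)
#   key = ("stable-diffusion-onnx-v1-5", "cpu")
#
#   pipeline = model_cache.get(ModelTypes.diffusion, key)
#   if pipeline is None:
#       pipeline = load_diffusion_model(key)  # hypothetical loader
#       model_cache.set(ModelTypes.diffusion, key, pipeline)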