onnx-web/api/onnx_web/server/model_cache.py

from enum import Enum
from logging import getLogger
from typing import Any, List, Tuple

logger = getLogger(__name__)

# module-level cache shared by every ModelCache instance
cache: List[Tuple[str, Any, Any]] = []


class ModelTypes(str, Enum):
    correction = "correction"
    diffusion = "diffusion"
    scheduler = "scheduler"
    upscaling = "upscaling"
    safety = "safety"


class ModelCache:
    # cache: List[Tuple[str, Any, Any]]
    limit: int

    def __init__(self, limit: int) -> None:
        self.limit = limit
        logger.debug("creating model cache with limit of %s models", limit)

    def drop(self, tag: str, key: Any) -> int:
        global cache

        logger.debug("dropping item from cache: %s %s", tag, key)
        removed = [model for model in cache if model[0] == tag and model[1] == key]
        for item in removed:
            cache.remove(item)

        return len(removed)

    def get(self, tag: str, key: Any) -> Any:
        global cache

        for t, k, v in cache:
            if tag == t and key == k:
                logger.debug("found cached model: %s %s", tag, key)
                return v

        logger.debug("model not found in cache: %s %s", tag, key)
        return None

    def set(self, tag: str, key: Any, value: Any) -> None:
        global cache

        if self.limit == 0:
            logger.debug("cache limit set to 0, not caching model: %s", tag)
            return

        for i in range(len(cache)):
            t, k, _v = cache[i]
            if tag == t and key != k:
                # a different model with the same tag is already cached, replace it
                logger.debug("updating model cache: %s %s", tag, key)
                cache[i] = (tag, key, value)
                return

        logger.debug("adding new model to cache: %s %s", tag, key)
        cache.append((tag, key, value))
        self.prune()

    def clear(self):
        global cache
        cache.clear()

    def prune(self):
        global cache

        total = len(cache)
        overage = total - self.limit
        if overage > 0:
            # drop the oldest entries, keeping the most recently added models
            removed = cache[:overage]
            logger.info(
                "removing %s of %s models from cache, %s",
                overage,
                total,
                [m[0] for m in removed],
            )
            cache[:] = cache[-self.limit :]
        else:
            logger.debug("model cache below limit, %s of %s", total, self.limit)

    @property
    def size(self):
        global cache
        return len(cache)
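

# A minimal usage sketch (not part of the original file): how server code might
# share one ModelCache between requests, caching a loaded pipeline under a
# (tag, key) pair. The model name and `load_diffusion_model` helper below are
# hypothetical placeholders, not part of this module.
#
#   model_cache = ModelCache(limit=2)
#   key = ("stable-diffusion-onnx-v1-5", "cpu")
#
#   pipeline = model_cache.get(ModelTypes.diffusion, key)
#   if pipeline is None:
#       pipeline = load_diffusion_model(key)  # hypothetical loader
#       model_cache.set(ModelTypes.diffusion, key, pipeline)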