Spaces:
Running
on
Zero
Running
on
Zero
import asyncio | |
import inspect | |
import json | |
import pickle | |
import threading | |
import time | |
from contextlib import asynccontextmanager | |
from copy import copy | |
from typing import Any, Optional | |
import redis | |
from inference.core import logger | |
from inference.core.cache.base import BaseCache | |
from inference.core.entities.responses.inference import InferenceResponseImage | |
from inference.core.env import MEMORY_CACHE_EXPIRE_INTERVAL | |
class RedisCache(BaseCache):
    """
    RedisCache is a cache backed by a Redis server that implements the BaseCache interface.

    Plain values and sorted-set members are stored JSON-encoded. Expiration of
    plain keys is delegated to Redis; expiration of individual sorted-set
    members is tracked locally and enforced by a background cleaner thread.

    Attributes:
        client (redis.Redis): The Redis client used for all operations.
        zexpires (dict): Maps (key, score) tuples to the absolute time (seconds since epoch)
            at which the sorted-set members with that score should be removed.
        _expire_thread (threading.Thread): A daemon thread that runs the _expire method.
    """

    def __init__(
        self,
        host: str = "localhost",
        port: int = 6379,
        db: int = 0,
        ssl: bool = False,
        timeout: float = 2.0,
    ) -> None:
        """
        Initializes a new instance of the RedisCache class.

        Connects to Redis, verifies the connection with a PING (which raises
        if the server is unreachable) and starts the cleaner thread.

        Args:
            host (str): Redis server host. Defaults to "localhost".
            port (int): Redis server port. Defaults to 6379.
            db (int): Redis database index. Defaults to 0.
            ssl (bool): Whether to connect over SSL. Defaults to False.
            timeout (float): Socket and connect timeout, in seconds. Defaults to 2.0.
        """
        self.client = redis.Redis(
            host=host,
            port=port,
            db=db,
            decode_responses=True,
            ssl=ssl,
            socket_timeout=timeout,
            socket_connect_timeout=timeout,
        )
        logger.debug("Attempting to diagnose Redis connection...")
        self.client.ping()
        logger.debug("Redis connection established.")
        self.zexpires = dict()
        self._expire_thread = threading.Thread(target=self._expire, daemon=True)
        self._expire_thread.start()

    def _expire(self):
        """
        Removes expired sorted-set members from Redis and their entries from zexpires.

        This method runs in an infinite loop and sleeps for MEMORY_CACHE_EXPIRE_INTERVAL
        seconds (minus the time spent cleaning) between each iteration.
        """
        tolerance_factor = 1e-14  # floating point accuracy
        while True:
            logger.debug("Redis cleaner thread starts cleaning...")
            now = time.time()
            # Iterate over a snapshot: zadd() may insert new entries from
            # other threads while the sweep is in progress.
            for (key, score), deadline in list(self.zexpires.items()):
                if deadline < now:
                    self.zremrangebyscore(
                        key, score - tolerance_factor, score + tolerance_factor
                    )
                    del self.zexpires[(key, score)]
            logger.debug("Redis cleaner finished task.")
            sleep_time = MEMORY_CACHE_EXPIRE_INTERVAL - (time.time() - now)
            time.sleep(max(sleep_time, 0))

    def get(self, key: str):
        """
        Gets the value associated with the given key.

        Args:
            key (str): The key to retrieve the value.

        Returns:
            Any: The JSON-decoded value, the raw stored value if it is not valid JSON,
            or None if the key does not exist or is expired.
        """
        item = self.client.get(key)
        if item is None:
            return None
        try:
            return json.loads(item)
        except (TypeError, ValueError):
            # json.JSONDecodeError subclasses ValueError: values that were not
            # stored as JSON are handed back untouched instead of raising.
            return item

    def set(self, key: str, value: str, expire: Optional[float] = None):
        """
        Sets a value for a given key with an optional expire time.

        Args:
            key (str): The key to store the value.
            value (str): The value to store. Anything that is not bytes is JSON-encoded.
            expire (float, optional): The time, in seconds, after which the key will expire. Defaults to None.
        """
        if not isinstance(value, bytes):
            value = json.dumps(value)
        if isinstance(expire, float):
            # redis-py only accepts int/timedelta for `ex`; express fractional
            # seconds as whole milliseconds via `px` instead.
            self.client.set(key, value, px=int(round(expire * 1000)))
        else:
            self.client.set(key, value, ex=expire)

    def zadd(self, key: str, value: Any, score: float, expire: Optional[float] = None):
        """
        Adds a member with the specified score to the sorted set stored at key.

        Args:
            key (str): The key of the sorted set.
            value (Any): The value to add to the sorted set; it is JSON-encoded before storing.
            score (float): The score associated with the value.
            expire (float, optional): The time, in seconds, after which the member will be removed
                by the cleaner thread. Defaults to None.
        """
        member = json.dumps(value)
        self.client.zadd(key, {member: score})
        if expire:
            # Expiry is tracked per (key, score): the cleaner thread later
            # removes every member of `key` carrying this score.
            self.zexpires[(key, score)] = expire + time.time()

    def zrangebyscore(
        self,
        key: str,
        min: Optional[float] = -1,
        max: Optional[float] = float("inf"),
        withscores: bool = False,
    ):
        """
        Retrieves a range of members from a sorted set.

        Args:
            key (str): The key of the sorted set.
            min (float, optional): The minimum score of the range. Defaults to -1.
            max (float, optional): The maximum score of the range. Defaults to float("inf").
            withscores (bool, optional): Whether to return the scores along with the values. Defaults to False.

        Returns:
            list: A list of JSON-decoded values (or value-score pairs if withscores is True)
            in the specified score range.
        """
        res = self.client.zrangebyscore(key, min, max, withscores=withscores)
        if withscores:
            return [(json.loads(member), score) for member, score in res]
        return [json.loads(member) for member in res]

    def zremrangebyscore(
        self,
        key: str,
        min: Optional[float] = -1,
        max: Optional[float] = float("inf"),
    ):
        """
        Removes all members in a sorted set within the given scores.

        Args:
            key (str): The key of the sorted set.
            min (float, optional): The minimum score of the range. Defaults to -1.
            max (float, optional): The maximum score of the range. Defaults to float("inf").

        Returns:
            int: The number of members removed from the sorted set.
        """
        return self.client.zremrangebyscore(key, min, max)

    def ensure_serializable(self, value: Any):
        """
        Converts non-serializable entries of a dictionary in place.

        Exceptions are replaced by their string form and InferenceResponseImage
        instances by the result of their dict() method. Non-dict values are
        returned unchanged.

        Args:
            value (Any): The value to sanitize.

        Returns:
            Any: The same object that was passed in.
        """
        if isinstance(value, dict):
            # Only existing keys are reassigned, so the dict size is stable
            # while iterating.
            for k, v in value.items():
                if isinstance(v, Exception):
                    value[k] = str(v)
                elif isinstance(v, InferenceResponseImage):
                    # Must test the instance: a class object never satisfies
                    # isinstance(v, InferenceResponseImage).
                    value[k] = v.dict()
        return value

    def acquire_lock(self, key: str, expire=None) -> Any:
        """
        Acquires a Redis lock for the given key, blocking until it is obtained.

        Args:
            key (str): The name of the lock.
            expire (float, optional): Used both as the lock timeout and as the maximum time to
                wait for the lock, in seconds. Defaults to None.

        Returns:
            Any: The acquired lock object returned by the Redis client.

        Raises:
            TimeoutError: If the lock could not be acquired.
        """
        lock = self.client.lock(key, blocking=True, timeout=expire)
        acquired = lock.acquire(blocking_timeout=expire)
        if not acquired:
            raise TimeoutError("Couldn't get lock")
        # refresh the lock
        # NOTE(review): redis-py documents extend() as adding time to the
        # current TTL rather than resetting it - confirm this is intended.
        if expire is not None:
            lock.extend(expire)
        return lock

    def set_numpy(self, key: str, value: Any, expire: Optional[float] = None):
        """
        Stores a pickled value under the given key.

        Args:
            key (str): The key to store the value.
            value (Any): The object to pickle and store.
            expire (float, optional): The time, in seconds, after which the key will expire. Defaults to None.
        """
        serialized_value = pickle.dumps(value)
        self.set(key, serialized_value, expire=expire)

    def get_numpy(self, key: str) -> Any:
        """
        Loads a value previously stored with set_numpy.

        Args:
            key (str): The key to retrieve the value.

        Returns:
            Any: The unpickled object, or None if the key does not exist.
        """
        # NOTE(review): the client is created with decode_responses=True, so
        # get() yields text rather than the pickled bytes - verify that this
        # round-trips for real payloads.
        serialized_value = self.get(key)
        if serialized_value is not None:
            # SECURITY: pickle.loads executes arbitrary code from the payload;
            # only use against a Redis instance whose contents are trusted.
            return pickle.loads(serialized_value)
        else:
            return None