"""Caching-related type definitions: cache backend identifiers, cacheable
call types, Redis pipeline increment operations, and cache-ping response
models."""
from enum import Enum
from typing import Any, Dict, Literal, Optional, TypedDict, Union

from pydantic import BaseModel
class LiteLLMCacheType(str, Enum):
    """Identifiers for the supported cache backends.

    Inherits from ``str`` so members compare equal to (and serialize as)
    their raw string values, e.g. ``LiteLLMCacheType.REDIS == "redis"``.
    """

    LOCAL = "local"
    REDIS = "redis"
    REDIS_SEMANTIC = "redis-semantic"
    S3 = "s3"
    DISK = "disk"
    QDRANT_SEMANTIC = "qdrant-semantic"
# Call types for which caching is supported (each sync call type plus its
# async "a"-prefixed variant).
CachingSupportedCallTypes = Literal[
    "completion",
    "acompletion",
    "embedding",
    "aembedding",
    "atranscription",
    "transcription",
    "atext_completion",
    "text_completion",
    "arerank",
    "rerank",
]
class RedisPipelineIncrementOperation(TypedDict):
    """TypedDict describing one Redis pipeline increment operation."""

    # Redis key whose value is incremented.
    key: str
    # Amount to increment the key's value by.
    increment_value: float
    # Time-to-live for the key (presumably seconds, matching Redis EXPIRE
    # semantics — confirm with caller); None means no expiry is set here.
    ttl: Optional[int]
# Functional TypedDict syntax is required here: several keys contain
# hyphens and therefore cannot be written as class attributes.
DynamicCacheControl = TypedDict(
    "DynamicCacheControl",
    {
        # Will cache the response for the user-defined amount of time (in seconds).
        "ttl": Optional[int],
        # Namespace to use for caching.
        "namespace": Optional[str],
        # Max age to use for caching; both spellings are accepted.
        "s-maxage": Optional[int],
        "s-max-age": Optional[int],
        # Will not return a cached response, but instead call the actual endpoint.
        "no-cache": Optional[bool],
        # Will not store the response in the cache.
        "no-store": Optional[bool],
    },
)
class CachePingResponse(BaseModel):
    """Response model for a cache ping (health-check) call."""

    # Outcome of the ping; exact status strings are set by the caller.
    status: str
    # Which cache backend was pinged (e.g. a LiteLLMCacheType value —
    # presumably; confirm with caller).
    cache_type: str
    # Result of the ping operation, when one was performed.
    ping_response: Optional[bool] = None
    # Result of a test set-cache operation, when one was performed.
    set_cache_response: Optional[str] = None
    # Stringified cache parameters used by the client.
    litellm_cache_params: Optional[str] = None
    # intentionally a dict, since we run masker.mask_dict() on HealthCheckCacheParams
    health_check_cache_params: Optional[dict] = None
class HealthCheckCacheParams(BaseModel):
    """Cache params returned on /cache/ping call."""

    # Cache server host, if configured.
    host: Optional[str] = None
    # Cache server port; may arrive as either a string or an int.
    port: Optional[Union[str, int]] = None
    # Extra keyword arguments passed through to the Redis client.
    redis_kwargs: Optional[Dict[str, Any]] = None
    # Key namespace/prefix used for cache entries.
    namespace: Optional[str] = None
    # Reported Redis server version; type varies by source — hence the union.
    redis_version: Optional[Union[str, int, float]] = None