import os from dataclasses import dataclass from graphgen.utils import logger, load_json, write_json from graphgen.models.storage.base_storage import BaseKVStorage @dataclass class JsonKVStorage(BaseKVStorage): _data: dict[str, str] = None def __post_init__(self): self._file_name = os.path.join(self.working_dir, f"{self.namespace}.json") self._data = load_json(self._file_name) or {} logger.info("Load KV %s with %d data", self.namespace, len(self._data)) @property def data(self): return self._data async def all_keys(self) -> list[str]: return list(self._data.keys()) async def index_done_callback(self): write_json(self._data, self._file_name) async def get_by_id(self, id): return self._data.get(id, None) async def get_by_ids(self, ids, fields=None) -> list: if fields is None: return [self._data.get(id, None) for id in ids] return [ ( {k: v for k, v in self._data[id].items() if k in fields} if self._data.get(id, None) else None ) for id in ids ] async def filter_keys(self, data: list[str]) -> set[str]: return {s for s in data if s not in self._data} async def upsert(self, data: dict): left_data = {k: v for k, v in data.items() if k not in self._data} self._data.update(left_data) return left_data async def drop(self): self._data = {}