Quent1Fvr's picture
v2.
e2e8616
raw
history blame
No virus
1.99 kB
import math
class Block:
def __init__(self, doc: str= '',title: str = '', content: str = '',
index: str = '', rank: int = 0, level: int = 0, distance: float = 99999):
self.doc = doc
self.title = title
self.content = content
self.index = index
self.rank = rank
self.level = level
self.distance = distance
@property
def distance_str(self) -> str:
return format(self.distance, '.2f')
def separate_1_block_in_n(self, max_size=4500):
"""
Separate a block in n blocks of equal size
"""
content_length = len(self.content)
n = math.ceil(content_length / max_size)
block_size = content_length // n
new_blocks = []
for i in range(n):
start = i * block_size
end = (i + 1) * block_size if i < n - 1 else None
new_blocks.append(Block(doc=self.doc,
title=self.title + f"_part{i}",
content=self.content[start:end],
index=self.index + f"_{i}",
rank=self.rank,
level=self.level))
return new_blocks
def to_dict(self) -> {}:
block_dict = {'doc': self.doc,
'title': self.title,
'content': self.content,
'index': self.index,
'rank': self.rank,
'level': self.level,
'distance': self.distance}
return block_dict
def from_dict(self, block_dict: {}):
self.doc = block_dict['doc']
self.title = block_dict['title']
self.content = block_dict['content']
self.index = block_dict['index']
self.rank = block_dict['rank']
self.level = block_dict['level']
self.distance = block_dict['distance']
return self