vilson
App
9db894e
from typing import List
def split_document(
    data: List,
    chunk_size: int = 3000,
    chunk_overlap: int = 400,
) -> List:
    """Split loaded documents into overlapping chunks.

    Args:
        data: Documents to split; passed unchanged to
            ``RecursiveCharacterTextSplitter.split_documents`` (presumably
            langchain ``Document`` objects -- confirm against the caller).
        chunk_size: Maximum size of each chunk, forwarded to the splitter.
        chunk_overlap: Amount of content shared between consecutive chunks,
            forwarded to the splitter. Defaults to 400, the value that was
            previously hard-coded, so existing calls behave the same.

    Returns:
        The list of chunks produced by the splitter.

    Note:
        The splitter is expected to reject an overlap larger than
        ``chunk_size`` (verify against the installed langchain version), so
        pass a smaller ``chunk_overlap`` when using a ``chunk_size`` below 400.
    """
    # Function-local import, as in the original: langchain is only loaded
    # when a document is actually split.
    from langchain.text_splitter import RecursiveCharacterTextSplitter

    text_splitter = RecursiveCharacterTextSplitter(
        chunk_size=chunk_size,
        chunk_overlap=chunk_overlap,
    )
    return text_splitter.split_documents(data)