from langchain_community.embeddings.sentence_transformer import ( SentenceTransformerEmbeddings, ) from langchain_community.vectorstores import Chroma # create the open-source embedding function embedding_function = SentenceTransformerEmbeddings(model_name="all-MiniLM-L6-v2") # load Chroma db = Chroma(embedding_function=embedding_function, persist_directory="./chroma_db") print("There are", db._collection.count(), " docs in the collection") docs = db._collection.peek(10) for doc in docs['documents']: print(doc)