Zaman
committed on
Commit
•
18cb72e
1
Parent(s):
3e47a11
added 100 chunk db
Browse files- .gitattributes +2 -0
- Dockerfile +2 -1
- bot.py +2 -2
- openai_db_100chunksize/chroma-collections.parquet +3 -0
- openai_db_100chunksize/chroma-embeddings.parquet +3 -0
- openai_db_100chunksize/index/id_to_uuid_f425c27f-d414-4dc6-8771-bf85c05980bd.pkl +3 -0
- openai_db_100chunksize/index/index_f425c27f-d414-4dc6-8771-bf85c05980bd.bin +3 -0
- openai_db_100chunksize/index/index_metadata_f425c27f-d414-4dc6-8771-bf85c05980bd.pkl +3 -0
- openai_db_100chunksize/index/uuid_to_id_f425c27f-d414-4dc6-8771-bf85c05980bd.pkl +3 -0
- {openai_embeddings → openai_embeddings_400chunksize}/chroma-collections.parquet +0 -0
- {openai_embeddings → openai_embeddings_400chunksize}/chroma-embeddings.parquet +0 -0
- {openai_embeddings → openai_embeddings_400chunksize}/index/id_to_uuid_8cd9a0f1-d432-45ef-acbc-f9b2f4b928f3.pkl +0 -0
- {openai_embeddings → openai_embeddings_400chunksize}/index/index_8cd9a0f1-d432-45ef-acbc-f9b2f4b928f3.bin +0 -0
- {openai_embeddings → openai_embeddings_400chunksize}/index/index_metadata_8cd9a0f1-d432-45ef-acbc-f9b2f4b928f3.pkl +0 -0
- {openai_embeddings → openai_embeddings_400chunksize}/index/uuid_to_id_8cd9a0f1-d432-45ef-acbc-f9b2f4b928f3.pkl +0 -0
.gitattributes
CHANGED
@@ -36,3 +36,5 @@ apple_amazon_intel_db/* filter=lfs diff=lfs merge=lfs -text
|
|
36 |
db_index/* filter=lfs diff=lfs merge=lfs -text
|
37 |
db_index filter=lfs diff=lfs merge=lfs -text
|
38 |
openai_embeddings/* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
36 |
db_index/* filter=lfs diff=lfs merge=lfs -text
|
37 |
db_index filter=lfs diff=lfs merge=lfs -text
|
38 |
openai_embeddings/* filter=lfs diff=lfs merge=lfs -text
|
39 |
+
openai_db_100chunksize/* filter=lfs diff=lfs merge=lfs -text
|
40 |
+
openai_embeddings_400chunksize/* filter=lfs diff=lfs merge=lfs -text
|
Dockerfile
CHANGED
@@ -17,4 +17,5 @@ WORKDIR $HOME/app
|
|
17 |
|
18 |
COPY --chown=user . $HOME/app
|
19 |
|
20 |
-
CMD ["python", "bot.py"]
|
|
|
|
17 |
|
18 |
COPY --chown=user . $HOME/app
|
19 |
|
20 |
+
CMD ["python", "bot.py"]
|
21 |
+
|
bot.py
CHANGED
@@ -10,13 +10,13 @@ from langchain.memory import ConversationBufferWindowMemory
|
|
10 |
# RetrievalQAWithSourcesChain.from_llm()
|
11 |
# ConversationalRetrievalChain()
|
12 |
|
13 |
-
persist_direcory = "
|
14 |
|
15 |
embeddings = OpenAIEmbeddings()
|
16 |
# db = FAISS.load_local(persist_directory, embeddings)
|
17 |
chroma = Chroma(embedding_function=embeddings, persist_directory=persist_direcory)
|
18 |
# retriever = chroma.as_retriever(search_type="mmr", search_kwargs={"k": 10})
|
19 |
-
retriever = chroma.as_retriever(search_kwargs={"k":
|
20 |
query = "what were the net sales of aws in the first quarter of 2023?"
|
21 |
print(retriever.get_relevant_documents(query))
|
22 |
|
|
|
10 |
# RetrievalQAWithSourcesChain.from_llm()
|
11 |
# ConversationalRetrievalChain()
|
12 |
|
13 |
+
persist_direcory = "openai_db_100chunksize"
|
14 |
|
15 |
embeddings = OpenAIEmbeddings()
|
16 |
# db = FAISS.load_local(persist_directory, embeddings)
|
17 |
chroma = Chroma(embedding_function=embeddings, persist_directory=persist_direcory)
|
18 |
# retriever = chroma.as_retriever(search_type="mmr", search_kwargs={"k": 10})
|
19 |
+
retriever = chroma.as_retriever(search_kwargs={"k": 60})
|
20 |
query = "what were the net sales of aws in the first quarter of 2023?"
|
21 |
print(retriever.get_relevant_documents(query))
|
22 |
|
openai_db_100chunksize/chroma-collections.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:446557b1b09b92e290a6beb616c34e41cf61eb3f25da7287a48bef689abc2ddf
|
3 |
+
size 557
|
openai_db_100chunksize/chroma-embeddings.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b64870796a4953432eb6aba84b88aec5e33d352cfbeec1b7ac5c3bb1cf86253c
|
3 |
+
size 106836520
|
openai_db_100chunksize/index/id_to_uuid_f425c27f-d414-4dc6-8771-bf85c05980bd.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce7892e7ce9477988bc3df98bcee987ae3040ff876427a3b2d6a6d6582c1af9e
|
3 |
+
size 282181
|
openai_db_100chunksize/index/index_f425c27f-d414-4dc6-8771-bf85c05980bd.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3170c513ddf2ff862af83e7cfbcb4d8cd5c7876cec301224d065206ebe598665
|
3 |
+
size 54670292
|
openai_db_100chunksize/index/index_metadata_f425c27f-d414-4dc6-8771-bf85c05980bd.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf680a818a4c63af6adb6db718f77ba8b78051a82890b0a50a1722eae110ed1d
|
3 |
+
size 105
|
openai_db_100chunksize/index/uuid_to_id_f425c27f-d414-4dc6-8771-bf85c05980bd.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c9fdc02b59c71f7401a73c2809afe11827132aa85aede545242517d8ca00e107
|
3 |
+
size 329966
|
{openai_embeddings → openai_embeddings_400chunksize}/chroma-collections.parquet
RENAMED
File without changes
|
{openai_embeddings → openai_embeddings_400chunksize}/chroma-embeddings.parquet
RENAMED
File without changes
|
{openai_embeddings → openai_embeddings_400chunksize}/index/id_to_uuid_8cd9a0f1-d432-45ef-acbc-f9b2f4b928f3.pkl
RENAMED
File without changes
|
{openai_embeddings → openai_embeddings_400chunksize}/index/index_8cd9a0f1-d432-45ef-acbc-f9b2f4b928f3.bin
RENAMED
File without changes
|
{openai_embeddings → openai_embeddings_400chunksize}/index/index_metadata_8cd9a0f1-d432-45ef-acbc-f9b2f4b928f3.pkl
RENAMED
File without changes
|
{openai_embeddings → openai_embeddings_400chunksize}/index/uuid_to_id_8cd9a0f1-d432-45ef-acbc-f9b2f4b928f3.pkl
RENAMED
File without changes
|