sorg20 committed on
Commit
1ffa965
•
1 Parent(s): a2f2772

vector db retrain

Browse files
app.py CHANGED
@@ -22,7 +22,7 @@ def retrieve_documents():
22
  #api_key=HF_TOKEN, model_name="local:BAAI/bge-m3")
23
  db = Chroma(persist_directory="./db",
24
  embedding_function=embeddings)
25
- retriever = db.as_retriever(search_kwargs = {"k":1})
26
  return retriever
27
 
28
  @st.cache_resource()
@@ -42,8 +42,8 @@ def create_chain(_retriever):
42
 
43
  llm = HuggingFaceEndpoint(
44
  endpoint_url = "https://api-inference.huggingface.co/models/mistralai/Mistral-7B-Instruct-v0.2",
45
- max_new_tokens=512,
46
- top_k=1,
47
  top_p=0.9,
48
  temperature=0.5,
49
  repetition_penalty=1.1,
 
22
  #api_key=HF_TOKEN, model_name="local:BAAI/bge-m3")
23
  db = Chroma(persist_directory="./db",
24
  embedding_function=embeddings)
25
+ retriever = db.as_retriever(search_kwargs = {"k":3})
26
  return retriever
27
 
28
  @st.cache_resource()
 
42
 
43
  llm = HuggingFaceEndpoint(
44
  endpoint_url = "https://api-inference.huggingface.co/models/mistralai/Mistral-7B-Instruct-v0.2",
45
+ max_new_tokens=2048,
46
+ top_k=3,
47
  top_p=0.9,
48
  temperature=0.5,
49
  repetition_penalty=1.1,
data/Sungwon_Kim_ML_DL_Intro_together.pdf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2bf23de972563f545577fc3ba526a7095ade61ac4c9ff31a3f0b0a431fe0a9c6
3
+ size 166124
db/{727833e8-2ded-474a-9aa7-68262d54e1bf → 7ff82419-a056-482d-b47b-bf20f0416667}/data_level0.bin RENAMED
File without changes
db/{727833e8-2ded-474a-9aa7-68262d54e1bf → 7ff82419-a056-482d-b47b-bf20f0416667}/header.bin RENAMED
File without changes
db/{727833e8-2ded-474a-9aa7-68262d54e1bf → 7ff82419-a056-482d-b47b-bf20f0416667}/length.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c6288e3187b841602a59f0ecf19ab89046d64462debfe6e37465c2a39a436af5
3
  size 4000
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b72fff46a00133ed25e0295587e9d32f02f68c7dc9249872d219b49934c119de
3
  size 4000
db/{727833e8-2ded-474a-9aa7-68262d54e1bf → 7ff82419-a056-482d-b47b-bf20f0416667}/link_lists.bin RENAMED
File without changes
db/chroma.sqlite3 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cc61685aeb6a95f279aac19f5b6fe590bb923ec59e754e48894f4196b92d87ed
3
- size 450560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63e5791397a6bc2efe890213198b6bd62742f7d4342c90eed8ecec781a11824f
3
+ size 270336
gen.py CHANGED
@@ -7,7 +7,6 @@ from langchain_community.embeddings import HuggingFaceInferenceAPIEmbeddings
7
  from langchain_community.vectorstores import Chroma
8
  import streamlit as st
9
 
10
-
11
  HF_TOKEN = st.secrets["HF_TOKEN"]
12
 
13
  def persist_dir(file_path):
 
7
  from langchain_community.vectorstores import Chroma
8
  import streamlit as st
9
 
 
10
  HF_TOKEN = st.secrets["HF_TOKEN"]
11
 
12
  def persist_dir(file_path):