batalovme committed on
Commit
15d7e65
1 Parent(s): 48e7c56

Data loading

Browse files
Files changed (2) hide show
  1. index.py +1 -6
  2. loader.py +4 -16
index.py CHANGED
@@ -8,12 +8,7 @@ from utils import completion_to_prompt, messages_to_prompt
8
 
9
 
10
  def build_service_context():
11
- return ServiceContext.from_defaults(llm=LlamaCPP(
12
- model_path=None,
13
- messages_to_prompt=messages_to_prompt,
14
- completion_to_prompt=completion_to_prompt,
15
- model_kwargs={"n_gpu_layers": 50},
16
- ))
17
 
18
  def build_index(documents, context):
19
  index = VectorStoreIndex.from_documents(documents, service_context=context)
 
8
 
9
 
10
  def build_service_context():
11
+ return ServiceContext.from_defaults(embed_model='local')
 
 
 
 
 
12
 
13
  def build_index(documents, context):
14
  index = VectorStoreIndex.from_documents(documents, service_context=context)
loader.py CHANGED
@@ -1,19 +1,7 @@
1
- from llama_index import download_loader
2
-
3
- BeautifulSoupWebReader = download_loader("BeautifulSoupWebReader")
4
 
5
 
6
  def load_documents():
7
- loader = BeautifulSoupWebReader()
8
- return loader.load_data(urls=[
9
- 'http://campuslife.innopolis.ru/main',
10
- 'http://campuslife.innopolis.ru/handbook2023',
11
- 'http://campuslife.innopolis.ru/clubs',
12
- 'http://campuslife.innopolis.ru/tech_clubs',
13
- 'http://campuslife.innopolis.ru/sport_clubs',
14
- 'http://campuslife.innopolis.ru/hobby_clubs',
15
- 'http://campuslife.innopolis.ru/art_clubs'
16
- 'http://campuslife.innopolis.ru/opportunities',
17
- 'http://campuslife.innopolis.ru/faq',
18
- 'http://campuslife.innopolis.ru/contacts'
19
- ])
 
1
+ from llama_index import SimpleDirectoryReader
 
 
2
 
3
 
4
  def load_documents():
5
+ docs_dir = "./raw"
6
+ documents = SimpleDirectoryReader(docs_dir).load_data()
7
+ return documents