Update app.py
Browse files
app.py
CHANGED
@@ -32,6 +32,22 @@ urlsfile.close()
|
|
32 |
# Build a web loader over `urls` (defined earlier in app.py, outside this hunk).
loader = WebBaseLoader(urls)
|
33 |
# Keep whatever the loader returns in the module-level name `docs`.
docs = loader.load()
|
34 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
35 |
def format_docs(docs):
    """Concatenate the ``page_content`` of every document in ``docs``.

    Consecutive documents are separated by one blank line (two newline
    characters). An empty ``docs`` yields an empty string.
    """
    separator = "\n\n"
    contents = [item.page_content for item in docs]
    return separator.join(contents)
|
37 |
|
|
|
32 |
# Build a web loader over `urls` (defined earlier in app.py, outside this hunk).
loader = WebBaseLoader(urls)
|
33 |
# `docs` is the module-level collection; later statements add the arXiv
# retriever results to it.
docs = loader.load()
|
34 |
|
35 |
+
# Load arXiv papers. Every non-empty line of arxiv.txt is sent to the
# retriever as one query (presumably an arXiv id or search string — confirm
# against the file's contents).
with open("arxiv.txt") as arxivfile:
    # Strip surrounding whitespace and skip blank lines so a trailing newline
    # or stray "\r" in the file never turns into an empty or malformed query.
    arxivs = [line.strip() for line in arxivfile if line.strip()]

retriever = ArxivRetriever(
    load_max_docs=2,
    # Spelling fixed: the previous keyword `get_ful_documents` does not match
    # the retriever's `get_full_documents` field, so the flag never took
    # effect as intended.
    # NOTE(review): full-document mode may require the PDF parsing dependency
    # to be installed in the deployment — confirm.
    get_full_documents=True,
)

for arxiv in arxivs:
    # invoke() returns a list of documents; extend (not append) keeps `docs`
    # a flat list so every entry exposes .page_content.
    docs.extend(retriever.invoke(arxiv))
|
49 |
+
|
50 |
+
|
51 |
def format_docs(docs):
    """Join the text of the given documents into a single string.

    Args:
        docs: Iterable whose entries expose a ``page_content`` attribute.
            An entry may also be a list or tuple of such objects (for
            example a retriever result that was appended as a whole); these
            are flattened one level instead of raising ``AttributeError``.

    Returns:
        The ``page_content`` values in order, separated by one blank line
        (two newline characters). Returns an empty string for empty input.
    """
    flat_docs = []
    for entry in docs:
        if isinstance(entry, (list, tuple)):
            # A whole batch of documents was stored as one element.
            flat_docs.extend(entry)
        else:
            flat_docs.append(entry)
    return "\n\n".join(doc.page_content for doc in flat_docs)
|
53 |
|