medelharchaoui committed on
Commit
9111075
1 Parent(s): 973762f

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +12 -5
app.py CHANGED
@@ -8,11 +8,18 @@ from langchain.embeddings import HuggingFaceEmbeddings, SentenceTransformerEmbed
8
  from langchain.vectorstores import FAISS
9
 
10
 
11
- splitter = SentenceTransformersTokenTextSplitter(model_name='dangvantuan/sentence-camembert-large',
12
- chunk_size=380,
13
- chunk_overlap=100
14
- )
15
- embeddings_fun = HuggingFaceEmbeddings(model_name='dangvantuan/sentence-camembert-large')
 
 
 
 
 
 
 
16
 
17
 
18
  def read_pdf(file):
 
8
  from langchain.vectorstores import FAISS
9
 
10
 
11
+ model_name = "dangvantuan/sentence-camembert-large"
12
+ model_kwargs = {'device': 'cpu'}
13
+ encode_kwargs = {'convert_to_tensor': True}
14
+ splitter = SentenceTransformersTokenTextSplitter(model_name=model_name,
15
+ tokens_per_chunk=380,
16
+ chunk_overlap=100)
17
+
18
+ embeddings_fun = HuggingFaceEmbeddings(
19
+ model_name=model_name,
20
+ model_kwargs=model_kwargs,
21
+ encode_kwargs=encode_kwargs
22
+ )
23
 
24
 
25
  def read_pdf(file):