ddovidovich committed on
Commit
6ecdc04
1 Parent(s): 2714936

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +11 -4
app.py CHANGED
@@ -3,7 +3,9 @@ import streamlit as st
3
  import pandas as pd
4
  import numpy as np
5
  from tqdm.auto import tqdm
6
- from sentence_transformers import SentenceTransformer
 
 
7
 
8
  dataList = [
9
  {"Answer": "", "Distance": 0},
@@ -27,9 +29,12 @@ def load_documents_from_jsonl(embeddings_model, jsonl_path, createEmbeddings=Fal
27
 
28
  return df
29
 
30
- def generate_embeddings(model, text):
 
 
 
31
  with torch.no_grad():
32
- embeddings = model.encode(text, convert_to_tensor=True)
33
  return embeddings.cpu().numpy()
34
 
35
  def save_to_faiss(df):
@@ -56,7 +61,9 @@ def main():
56
  # Заголовок приложения
57
  st.title("Demo for LLAMA-2 RAG with CPU only")
58
 
59
- model = SentenceTransformer('sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2')
 
 
60
 
61
  df_qa = load_documents_from_jsonl('ExportForAI1.jsonl', model, False)
62
  save_to_faiss(df_qa)
 
3
  import pandas as pd
4
  import numpy as np
5
  from tqdm.auto import tqdm
6
+ #from sentence_transformers import SentenceTransformer
7
+ from transformers import AutoTokenizer, AutoModel
8
+ import torch
9
 
10
  dataList = [
11
  {"Answer": "", "Distance": 0},
 
29
 
30
  return df
31
 
32
def generate_embeddings(tokenizer, model, text):
    """Encode text into sentence embeddings with a plain transformers model.

    The model's forward pass returns a model-output object holding per-token
    hidden states, not a tensor, so the token vectors are reduced to one
    vector per input by attention-mask-weighted mean pooling.

    Args:
        tokenizer: Callable tokenizer; invoked with ``padding=True``,
            ``truncation=True`` and ``return_tensors='pt'``. Its result must
            expose an ``'attention_mask'`` entry and support ``**`` unpacking.
        model: Callable model whose output exposes ``last_hidden_state``.
        text: A single string or a list of strings.

    Returns:
        A NumPy array: 1-D ``(hidden,)`` when ``text`` is a single string,
        2-D ``(batch, hidden)`` when it is a list of strings.
    """
    encoded_input = tokenizer(text, padding=True, truncation=True, return_tensors='pt')
    with torch.no_grad():
        model_output = model(**encoded_input)
        token_embeddings = model_output.last_hidden_state

        # Zero out padding positions so they do not dilute the average.
        mask = encoded_input['attention_mask'].unsqueeze(-1).to(token_embeddings.dtype)
        summed = (token_embeddings * mask).sum(dim=1)
        # Clamp guards against division by zero for an all-padding row.
        token_counts = mask.sum(dim=1).clamp(min=1e-9)
        embeddings = summed / token_counts

    # A lone string yields a single vector rather than a batch of one.
    if isinstance(text, str):
        embeddings = embeddings[0]
    return embeddings.cpu().numpy()
39
 
40
  def save_to_faiss(df):
 
61
  # Заголовок приложения
62
  st.title("Demo for LLAMA-2 RAG with CPU only")
63
 
64
+ #model = SentenceTransformer('sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2')
65
+ tokenizer = AutoTokenizer.from_pretrained('sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2')
66
+ model = AutoModel.from_pretrained('sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2')
67
 
68
  df_qa = load_documents_from_jsonl('ExportForAI1.jsonl', model, False)
69
  save_to_faiss(df_qa)