ffreemt committed on
Commit
689b5eb
1 Parent(s): fdb2623
Files changed (1) hide show
  1. app.py +3 -4
app.py CHANGED
@@ -136,11 +136,10 @@ DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
136
  # from langchain.embeddings import HuggingFaceEmbeddings
137
  # embeddings = HuggingFaceEmbeddings(model_name='paraphrase-multilingual-MiniLM-L12-v2')
138
  # https://www.sbert.net/docs/pretrained_models.html
139
- #
140
 
141
  # 'max_seq_length': 128
142
  MODEL_NAME = "paraphrase-multilingual-mpnet-base-v2" # 1.11G
143
- MODEL_NAME = "paraphrase-multilingual-MiniLM-L12-v2" # 471M
144
 
145
  # openai max 4097
146
  # retriever default k = 4, query length about CHUNK_SIZE
@@ -424,8 +423,8 @@ def process_files(
424
  _ = (
425
  f"done file(s): {dict(ns.files_info)}, split to "
426
  f"{total} chunk(s). \n\nThe following embedding takes "
427
- f" {total} step(s). (Each step lasts about 18 secs "
428
- " on a free tier instance on huggingface space.)"
429
  )
430
 
431
  return _
 
136
  # from langchain.embeddings import HuggingFaceEmbeddings
137
  # embeddings = HuggingFaceEmbeddings(model_name='paraphrase-multilingual-MiniLM-L12-v2')
138
  # https://www.sbert.net/docs/pretrained_models.html
 
139
 
140
  # 'max_seq_length': 128
141
  MODEL_NAME = "paraphrase-multilingual-mpnet-base-v2" # 1.11G
142
+ MODEL_NAME = "paraphrase-multilingual-MiniLM-L12-v2" # 471M
143
 
144
  # openai max 4097
145
  # retriever default k = 4, query length about CHUNK_SIZE
 
423
  _ = (
424
  f"done file(s): {dict(ns.files_info)}, split to "
425
  f"{total} chunk(s). \n\nThe following embedding takes "
426
+ f"{total} step(s) and approximately {total/10:.1f} minutes. (Each step lasts about ~6 secs "
427
+ "on a free tier instance on huggingface space.)"
428
  )
429
 
430
  return _