Zeitstaub committed on
Commit
40ae375
1 Parent(s): 1622219

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +8 -3
app.py CHANGED
@@ -44,9 +44,14 @@ def find_similar_texts(model_name, input_text):
44
  distances = euclidean_distances(embedding_matrix, input_embedding).flatten()
45
  text_embeddings['euclidean_distance'] = distances
46
  sorted_embeddings = text_embeddings.sort_values(by='euclidean_distance', ascending=True)
47
- top_five = sorted_embeddings.head(5)[['abstract', 'patent no', 'title']]
48
- # formatted_output = '\n\n'.join([f"Patent No: {row['patent no']}\n {row['title']}\n {row['abstract']}\n" for index, row in top_five.iterrows()])
49
- formatted_output = '\n\n'.join([f"<strong>Patent No: {row['patent no']}\n<strong>Title: {row['title']}\n<strong>Abstract: {row['abstract']}" for index, row in top_five.iterrows()])
 
 
 
 
 
50
  return formatted_output
51
  else:
52
  return "It seems there is no patent abstract close to your description."
 
44
  distances = euclidean_distances(embedding_matrix, input_embedding).flatten()
45
  text_embeddings['euclidean_distance'] = distances
46
  sorted_embeddings = text_embeddings.sort_values(by='euclidean_distance', ascending=True)
47
+ # top_five = sorted_embeddings.head(5)[['abstract', 'patent no', 'title']]
48
+ # formatted_output = '\n\n'.join([f"<Patent No: {row['patent no']}\nTitle: {row['title']}\nAbstract: {row['abstract']}" for index, row in top_five.iterrows()])
49
+ formatted_output = '\n\n'.join([
50
+ f"<strong>Patent No:</strong> {row['patent no']}<br>"
51
+ f"<strong>Title:</strong> {row['title']}<br>"
52
+ f"<strong>Abstract:</strong> {row['abstract']}"
53
+ for index, row in top_five.iterrows()
54
+ ])
55
  return formatted_output
56
  else:
57
  return "It seems there is no patent abstract close to your description."