lalithadevi commited on
Commit
e48e7d5
1 Parent(s): 61f5068

Update news_category_similar_news_prediction.py

Browse files
news_category_similar_news_prediction.py CHANGED
@@ -76,7 +76,7 @@ def predict_news_category_similar_news(old_news: pd.DataFrame, new_news: pd.Data
76
  headlines = [*final_df['title']].copy()
77
  label, prob = inference(headlines, interpreter, label_encoder, tokenizer)
78
  sent_embs = vectorizer.vectorize_(headlines, sent_model)
79
- sim_news = [find_similar_news(search_vec, collection, vectorizer, sent_model, ce_model) for search_vec in sent_embs]
80
  final_df['category'] = label
81
  final_df['pred_proba'] = prob
82
  final_df['similar_news'] = sim_news
@@ -92,7 +92,7 @@ def predict_news_category_similar_news(old_news: pd.DataFrame, new_news: pd.Data
92
  headlines = [*new_news['title']].copy()
93
  label, prob = inference(headlines, interpreter, label_encoder, tokenizer)
94
  sent_embs = vectorizer.vectorize_(headlines, sent_model)
95
- sim_news = [find_similar_news(search_vec, collection, vectorizer, sent_model, ce_model) for search_vec in sent_embs]
96
  new_news['category'] = label
97
  new_news['pred_proba'] = prob
98
  final_df['similar_news'] = sim_news
 
76
  headlines = [*final_df['title']].copy()
77
  label, prob = inference(headlines, interpreter, label_encoder, tokenizer)
78
  sent_embs = vectorizer.vectorize_(headlines, sent_model)
79
+ sim_news = [find_similar_news(text, search_vec, collection, vectorizer, sent_model, ce_model) for search_vec, text in zip(sent_embs, headlines)]
80
  final_df['category'] = label
81
  final_df['pred_proba'] = prob
82
  final_df['similar_news'] = sim_news
 
92
  headlines = [*new_news['title']].copy()
93
  label, prob = inference(headlines, interpreter, label_encoder, tokenizer)
94
  sent_embs = vectorizer.vectorize_(headlines, sent_model)
95
+ sim_news = [find_similar_news(text, search_vec, collection, vectorizer, sent_model, ce_model) for search_vec, text in zip(sent_embs, headlines)]
96
  new_news['category'] = label
97
  new_news['pred_proba'] = prob
98
  final_df['similar_news'] = sim_news