lalithadevi
commited on
Commit
•
e48e7d5
1
Parent(s):
61f5068
Update news_category_similar_news_prediction.py
Browse files
news_category_similar_news_prediction.py
CHANGED
@@ -76,7 +76,7 @@ def predict_news_category_similar_news(old_news: pd.DataFrame, new_news: pd.Data
|
|
76 |
headlines = [*final_df['title']].copy()
|
77 |
label, prob = inference(headlines, interpreter, label_encoder, tokenizer)
|
78 |
sent_embs = vectorizer.vectorize_(headlines, sent_model)
|
79 |
-
sim_news = [find_similar_news(search_vec, collection, vectorizer, sent_model, ce_model) for search_vec in sent_embs]
|
80 |
final_df['category'] = label
|
81 |
final_df['pred_proba'] = prob
|
82 |
final_df['similar_news'] = sim_news
|
@@ -92,7 +92,7 @@ def predict_news_category_similar_news(old_news: pd.DataFrame, new_news: pd.Data
|
|
92 |
headlines = [*new_news['title']].copy()
|
93 |
label, prob = inference(headlines, interpreter, label_encoder, tokenizer)
|
94 |
sent_embs = vectorizer.vectorize_(headlines, sent_model)
|
95 |
-
sim_news = [find_similar_news(search_vec, collection, vectorizer, sent_model, ce_model) for search_vec in sent_embs]
|
96 |
new_news['category'] = label
|
97 |
new_news['pred_proba'] = prob
|
98 |
final_df['similar_news'] = sim_news
|
|
|
76 |
headlines = [*final_df['title']].copy()
|
77 |
label, prob = inference(headlines, interpreter, label_encoder, tokenizer)
|
78 |
sent_embs = vectorizer.vectorize_(headlines, sent_model)
|
79 |
+
sim_news = [find_similar_news(text, search_vec, collection, vectorizer, sent_model, ce_model) for search_vec, text in zip(sent_embs, headlines)]
|
80 |
final_df['category'] = label
|
81 |
final_df['pred_proba'] = prob
|
82 |
final_df['similar_news'] = sim_news
|
|
|
92 |
headlines = [*new_news['title']].copy()
|
93 |
label, prob = inference(headlines, interpreter, label_encoder, tokenizer)
|
94 |
sent_embs = vectorizer.vectorize_(headlines, sent_model)
|
95 |
+
sim_news = [find_similar_news(text, search_vec, collection, vectorizer, sent_model, ce_model) for search_vec, text in zip(sent_embs, headlines)]
|
96 |
new_news['category'] = label
|
97 |
new_news['pred_proba'] = prob
|
98 |
final_df['similar_news'] = sim_news
|