Commit
•
59792ae
1
Parent(s):
132f624
Update news_category_similar_news_prediction.py
Browse files
news_category_similar_news_prediction.py
CHANGED
@@ -32,7 +32,7 @@ def date_time_parser(dt):
|
|
32 |
def delete_outdated_news(final_df: pd.DataFrame):
|
33 |
logger.warning("Entering delete_outdated_news()")
|
34 |
final_df = final_df.copy()
|
35 |
-
final_df["parsed_date"] = final_df["parsed_date"].map(correct_date)
|
36 |
final_df["parsed_date"] = final_df["parsed_date"].map(parser.parse)
|
37 |
final_df["elapsed_time"] = final_df["parsed_date"].apply(date_time_parser)
|
38 |
final_df = final_df.loc[final_df["elapsed_time"] <= 720, :].copy() # 1440=24 hrs and 720=12 hrs
|
@@ -94,6 +94,11 @@ def predict_news_category_similar_news(old_news: pd.DataFrame, new_news: pd.Data
|
|
94 |
new_news = delete_outdated_news(new_news)
|
95 |
logger.warning(f'{len(new_news)} new news items found after deleting outdated news')
|
96 |
logger.warning(f'new news columns: {[*new_news.columns]}')
|
|
|
|
|
|
|
|
|
|
|
97 |
|
98 |
|
99 |
if isinstance(old_news, pd.DataFrame):
|
@@ -105,9 +110,15 @@ def predict_news_category_similar_news(old_news: pd.DataFrame, new_news: pd.Data
|
|
105 |
|
106 |
old_news.drop(columns='_id', inplace=True)
|
107 |
logger.warning('Dropped _id column from old news data frame.')
|
|
|
|
|
108 |
else:
|
109 |
logger.warning('No old news is found')
|
110 |
old_news = new_news.copy()
|
|
|
|
|
|
|
|
|
111 |
|
112 |
if 'category' not in [*old_news.columns]:
|
113 |
logger.warning('No prior predictions found in old news')
|
|
|
32 |
def delete_outdated_news(final_df: pd.DataFrame):
|
33 |
logger.warning("Entering delete_outdated_news()")
|
34 |
final_df = final_df.copy()
|
35 |
+
# final_df["parsed_date"] = final_df["parsed_date"].map(correct_date)
|
36 |
final_df["parsed_date"] = final_df["parsed_date"].map(parser.parse)
|
37 |
final_df["elapsed_time"] = final_df["parsed_date"].apply(date_time_parser)
|
38 |
final_df = final_df.loc[final_df["elapsed_time"] <= 720, :].copy() # 1440=24 hrs and 720=12 hrs
|
|
|
94 |
new_news = delete_outdated_news(new_news)
|
95 |
logger.warning(f'{len(new_news)} new news items found after deleting outdated news')
|
96 |
logger.warning(f'new news columns: {[*new_news.columns]}')
|
97 |
+
if len(new_news) <= 1:
|
98 |
+
new_news = None
|
99 |
+
|
100 |
+
if not isinstance(new_news, pd.DataFrame):
|
101 |
+
raise Exception('No New News Found after deleting outdated news')
|
102 |
|
103 |
|
104 |
if isinstance(old_news, pd.DataFrame):
|
|
|
110 |
|
111 |
old_news.drop(columns='_id', inplace=True)
|
112 |
logger.warning('Dropped _id column from old news data frame.')
|
113 |
+
if len(old_news) <= 1:
|
114 |
+
old_news = None
|
115 |
else:
|
116 |
logger.warning('No old news is found')
|
117 |
old_news = new_news.copy()
|
118 |
+
|
119 |
+
if not isinstance(old_news, pd.DataFrame):
|
120 |
+
logger.warning('No old news is found after deleting outdate news')
|
121 |
+
old_news = new_news.copy()
|
122 |
|
123 |
if 'category' not in [*old_news.columns]:
|
124 |
logger.warning('No prior predictions found in old news')
|