lalithadevi committed on
Commit
59792ae
1 Parent(s): 132f624

Update news_category_similar_news_prediction.py

Browse files
news_category_similar_news_prediction.py CHANGED
@@ -32,7 +32,7 @@ def date_time_parser(dt):
32
  def delete_outdated_news(final_df: pd.DataFrame):
33
  logger.warning("Entering delete_outdated_news()")
34
  final_df = final_df.copy()
35
- final_df["parsed_date"] = final_df["parsed_date"].map(correct_date)
36
  final_df["parsed_date"] = final_df["parsed_date"].map(parser.parse)
37
  final_df["elapsed_time"] = final_df["parsed_date"].apply(date_time_parser)
38
  final_df = final_df.loc[final_df["elapsed_time"] <= 720, :].copy() # 1440=24 hrs and 720=12 hrs
@@ -94,6 +94,11 @@ def predict_news_category_similar_news(old_news: pd.DataFrame, new_news: pd.Data
94
  new_news = delete_outdated_news(new_news)
95
  logger.warning(f'{len(new_news)} new news items found after deleting outdated news')
96
  logger.warning(f'new news columns: {[*new_news.columns]}')
 
 
 
 
 
97
 
98
 
99
  if isinstance(old_news, pd.DataFrame):
@@ -105,9 +110,15 @@ def predict_news_category_similar_news(old_news: pd.DataFrame, new_news: pd.Data
105
 
106
  old_news.drop(columns='_id', inplace=True)
107
  logger.warning('Dropped _id column from old news data frame.')
 
 
108
  else:
109
  logger.warning('No old news is found')
110
  old_news = new_news.copy()
 
 
 
 
111
 
112
  if 'category' not in [*old_news.columns]:
113
  logger.warning('No prior predictions found in old news')
 
32
  def delete_outdated_news(final_df: pd.DataFrame):
33
  logger.warning("Entering delete_outdated_news()")
34
  final_df = final_df.copy()
35
+ # final_df["parsed_date"] = final_df["parsed_date"].map(correct_date)
36
  final_df["parsed_date"] = final_df["parsed_date"].map(parser.parse)
37
  final_df["elapsed_time"] = final_df["parsed_date"].apply(date_time_parser)
38
  final_df = final_df.loc[final_df["elapsed_time"] <= 720, :].copy() # 1440=24 hrs and 720=12 hrs
 
94
  new_news = delete_outdated_news(new_news)
95
  logger.warning(f'{len(new_news)} new news items found after deleting outdated news')
96
  logger.warning(f'new news columns: {[*new_news.columns]}')
97
+ if len(new_news) <= 1:
98
+ new_news = None
99
+
100
+ if not isinstance(new_news, pd.DataFrame):
101
+ raise Exception('No New News Found after deleting outdated news')
102
 
103
 
104
  if isinstance(old_news, pd.DataFrame):
 
110
 
111
  old_news.drop(columns='_id', inplace=True)
112
  logger.warning('Dropped _id column from old news data frame.')
113
+ if len(old_news) <= 1:
114
+ old_news = None
115
  else:
116
  logger.warning('No old news is found')
117
  old_news = new_news.copy()
118
+
119
+ if not isinstance(old_news, pd.DataFrame):
120
+ logger.warning('No old news is found after deleting outdate news')
121
+ old_news = new_news.copy()
122
 
123
  if 'category' not in [*old_news.columns]:
124
  logger.warning('No prior predictions found in old news')