Commit
•
f740095
1
Parent(s):
71ba7d7
Update news_extractor/news_extractor.py
Browse files
news_extractor/news_extractor.py
CHANGED
@@ -137,7 +137,7 @@ def get_news_rss(url):
|
|
137 |
final_df = news_agg(url)
|
138 |
final_df.reset_index(drop=True, inplace=True)
|
139 |
|
140 |
-
|
141 |
|
142 |
final_df.sort_values(by="elapsed_time", inplace=True)
|
143 |
# final_df['src_time'] = final_df['src'] + (" " * 5) + final_df["elapsed_time_str"]
|
@@ -168,6 +168,7 @@ def get_news_multi_process(urls):
|
|
168 |
final_df = pd.concat([final_df, f.get(timeout=120)], axis=0) # getting output of each parallel job
|
169 |
|
170 |
final_df.reset_index(drop=True, inplace=True)
|
|
|
171 |
pool.close()
|
172 |
pool.join()
|
173 |
return final_df
|
|
|
137 |
final_df = news_agg(url)
|
138 |
final_df.reset_index(drop=True, inplace=True)
|
139 |
|
140 |
+
|
141 |
|
142 |
final_df.sort_values(by="elapsed_time", inplace=True)
|
143 |
# final_df['src_time'] = final_df['src'] + (" " * 5) + final_df["elapsed_time_str"]
|
|
|
168 |
final_df = pd.concat([final_df, f.get(timeout=120)], axis=0) # getting output of each parallel job
|
169 |
|
170 |
final_df.reset_index(drop=True, inplace=True)
|
171 |
+
logging.warning(final_df['src'].unique())
|
172 |
pool.close()
|
173 |
pool.join()
|
174 |
return final_df
|