File size: 1,957 Bytes
7329d3b
 
 
24bd232
7329d3b
90c8eef
 
7329d3b
90c8eef
 
214c1ff
 
fa2ba95
214c1ff
01e7208
 
 
 
 
6ba11bc
 
90c8eef
 
 
d90457d
90c8eef
e94fb2d
58ada3c
90c8eef
 
 
 
d531874
 
90c8eef
214c1ff
 
90c8eef
 
214c1ff
 
1f1a45a
aff870b
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
import os


# --- Production store -------------------------------------------------------
# Connection URL is read from the environment; it is None when the
# PRODUCTION_DB_URL variable is not set.
PRODUCTION_URL = os.environ.get("PRODUCTION_DB_URL")
PRODUCTION_DATABASE = "rss_news_db_cat_pred_sim_news"
PRODUCTION_COLLECTION = "rss_news_cat_pred_sim_news"

# --- Prediction store -------------------------------------------------------
# Connection URL is read from the environment; it is None when the
# PREDICTION_DB_URL variable is not set.
PREDICTION_URL = os.environ.get("PREDICTION_DB_URL")
PREDICTION_DATABASE = "indian_news_predictions_db"
PREDICTION_COLLECTION = "indian_news_predictions_coll"

# Integer flag (1 here); presumably enables writing prediction data to the
# prediction store -- confirm against the code that reads it.
COLLECT_PREDICTION_DATA = 1

# Timeout used by the news extractor when fetching URLs.
# NOTE(review): unit is presumably seconds -- confirm against the caller.
NEWS_EXTRACTOR_URL_TIMEOUT = 5

# RSS feed URLs to extract news from. The order of entries is preserved as
# originally written; entries that are commented out are currently disabled.
RSS_FEEDS_TO_EXTRACT = [
    "https://www.economictimes.indiatimes.com/rssfeedstopstories.cms",
    "https://www.thehindu.com/news/feeder/default.rss",
    "https://www.thehindu.com/sport/feeder/default.rss",
    "https://www.thehindu.com/sci-tech/science/feeder/default.rss",
    "https://www.thehindu.com/news/international/feeder/default.rss",
    "https://www.indiatoday.in/rss/1206577",
    "https://www.indiatoday.in/rss/1206550",
    "https://www.gadgets360.com/rss/feeds",
    "https://health.economictimes.indiatimes.com/rss/recentstories",
    # "https://telanganatoday.com/feed",
    "https://www.businesstoday.in/rssfeeds/?id=225346",
    "https://feeds.feedburner.com/ndtvnews-latest",
    "https://feeds.feedburner.com/ndtvsports-latest",
    "https://www.hindustantimes.com/feeds/rss/world-news/rssfeed.xml",
    "https://www.hindustantimes.com/feeds/rss/lifestyle/health/rssfeed.xml",
    "https://www.hindustantimes.com/feeds/rss/astrology/rssfeed.xml",
    "https://www.indiatoday.in/rss/1206578",
    # "https://www.moneycontrol.com/rss/latestnews.xml",
    "https://www.indiatvnews.com/rssnews/topstory.xml",
    "https://www.livemint.com/rss/news",
    "https://www.livemint.com/rss/technology",
    "https://www.livemint.com/rss/education",
    "https://www.zeebiz.com/latest.xml/feed",
    "https://www.timesofindia.indiatimes.com/rssfeedmostrecent.cms",
]



# --- Category classifier ----------------------------------------------------
# Number of output classes of the news category classifier.
NEWS_CATEGORY_CLASSIFIER_N_CLASSES = 8
# Token count used with the DistilBERT tokenizer.
# NOTE(review): presumably the max/padded sequence length -- confirm at the
# tokenizer call site.
DISTILBERT_TOKENIZER_N_TOKENS = 80
# Threshold applied to classifier output.
# NOTE(review): presumably a probability cut-off -- confirm how it is compared.
CLASSIFIER_THRESHOLD = 0.5

# --- Retention --------------------------------------------------------------
# News retention period in seconds (5 minutes).
NEWS_RETENTION_SECONDS = 5 * 60