obsei committed on
Commit
ecbe950
1 Parent(s): 0d3f6e5

Updating imports

Browse files
Files changed (1) hide show
  1. config.yaml +49 -49
config.yaml CHANGED
@@ -16,9 +16,9 @@ source:
16
  - '`app_url` is application url on app store.
17
  - For example for Xcode - https://apps.apple.com/us/app/xcode/id497799835'
18
  source:
19
- _target_: obsei.source.AppStoreScrapperSource
20
  config:
21
- _target_: obsei.source.AppStoreScrapperConfig
22
  app_url: "https://apps.apple.com/us/app/gmail-email-by-google/id422689480"
23
  lookup_period: "1h"
24
  max_count: 5
@@ -42,9 +42,9 @@ source:
42
  - 'For `queries` enter google maps urls or place ids, for example'
43
  - "https://www.google.co.in/maps/place/Taj+Mahal/@27.1751496,78.0399535,17z/data=!4m5!3m4!1s0x39747121d702ff6d:0xdd2ae4803f767dde!8m2!3d27.1751448!4d78.0421422"
44
  source:
45
- _target_: obsei.source.OSGoogleMapsReviewsSource
46
  config:
47
- _target_: obsei.source.OSGoogleMapsReviewsConfig
48
  api_key: ''
49
  queries:
50
  - "https://www.google.co.in/maps/place/Taj+Mahal/@27.1751496,78.0399535,17z/data=!4m5!3m4!1s0x39747121d702ff6d:0xdd2ae4803f767dde!8m2!3d27.1751448!4d78.0421422"
@@ -55,9 +55,9 @@ source:
55
  - 'Reddit subreddit, search etc rss url. For proper url refer following link -'
56
  - 'https://www.reddit.com/r/pathogendavid/comments/tv8m9/pathogendavids_guide_to_rss_and_reddit/'
57
  source:
58
- _target_: obsei.source.RedditScrapperSource
59
  config:
60
- _target_: obsei.source.RedditScrapperConfig
61
  url: 'https://www.reddit.com/r/wallstreetbets/comments/.rss?sort=new'
62
  lookup_period: "1h"
63
  Twitter:
@@ -67,14 +67,14 @@ source:
67
  - ''
68
  - 'Need twitter `consumer key` and `secret`, get it from https://developer.twitter.com/en/apply-for-access'
69
  source:
70
- _target_: obsei.source.TwitterSource
71
  config:
72
- _target_: obsei.source.TwitterSourceConfig
73
  query: "@Twitter"
74
  lookup_period: "1h"
75
  max_tweets: 10
76
  cred_info:
77
- _target_: obsei.source.TwitterCredentials
78
  consumer_key: ''
79
  consumer_secret: ''
80
  Facebook:
@@ -84,13 +84,13 @@ source:
84
  - ''
85
  - 'Need facebook app_id, app_secret and long_term_token. Get it from https://developers.facebook.com/apps/'
86
  source:
87
- _target_: obsei.source.FacebookSource
88
  config:
89
- _target_: obsei.source.FacebookSourceConfig
90
  page_id: "110844591144719"
91
  lookup_period: "1h"
92
  cred_info:
93
- _target_: obsei.source.FacebookCredentials
94
  app_id: ''
95
  app_secret: ''
96
  long_term_token: ''
@@ -103,12 +103,12 @@ source:
103
  - 'https://myaccount.google.com/lesssecureapps?pli=1'
104
  - 'Also enable IMAP access - https://mail.google.com/mail/u/0/#settings/fwdandpop'
105
  source:
106
- _target_: obsei.source.EmailSource
107
  config:
108
- _target_: obsei.source.EmailConfig
109
  imap_server: 'imap.gmail.com'
110
  cred_info:
111
- _target_: obsei.source.EmailCredInfo
112
  username: ''
113
  password: ''
114
  lookup_period: "1h"
@@ -118,13 +118,13 @@ source:
118
  - 'Reddit account `username` and `password` require'
119
  - 'Enter list of `subreddits`'
120
  source:
121
- _target_: obsei.source.RedditSource
122
  config:
123
- _target_: obsei.source.RedditConfig
124
  subreddits:
125
  - 'wallstreetbets'
126
  cred_info:
127
- _target_: obsei.source.RedditCredInfo
128
  username: ''
129
  password: ''
130
  lookup_period: "1h"
@@ -133,9 +133,9 @@ source:
133
  _help_:
134
  - '`fetch_article` use crawler to fetch full article'
135
  source:
136
- _target_: obsei.source.GoogleNewsSource
137
  config:
138
- _target_: obsei.source.GoogleNewsConfig
139
  query: "bitcoin"
140
  max_results: 3
141
  lookup_period: "1d"
@@ -148,9 +148,9 @@ source:
148
  - 'For example - https://play.google.com/store/apps/details?id=com.google.android.gm&hl=en&gl=US'
149
  - '`com.google.android.gm` is the `package name` for Gmail and `us` is `country`.'
150
  source:
151
- _target_: obsei.source.TrafilaturaCrawlerSource
152
  config:
153
- _target_: obsei.source.TrafilaturaCrawlerConfig
154
  urls:
155
  - 'https://obsei.github.io/obsei/'
156
  sink:
@@ -165,9 +165,9 @@ sink:
165
  _icon_: "https://raw.githubusercontent.com/obsei/obsei-resources/master/logos/logger.png"
166
  _help_: null
167
  sink:
168
- _target_: obsei.sink.LoggerSink
169
  config:
170
- _target_: obsei.sink.LoggerSinkConfig
171
  Jira:
172
  _icon_: "https://raw.githubusercontent.com/obsei/obsei-resources/master/logos/jira.png"
173
  _help_:
@@ -182,9 +182,9 @@ sink:
182
  - '`project` in which issue to be created, for more information refer -'
183
  - 'https://support.atlassian.com/jira-software-cloud/docs/what-is-a-jira-software-project/'
184
  sink:
185
- _target_: obsei.sink.JiraSink
186
  config:
187
- _target_: obsei.sink.JiraSinkConfig
188
  url: 'http://localhost:2990/jira'
189
  username: ''
190
  password: ''
@@ -202,13 +202,13 @@ sink:
202
  - ''
203
  - 'Provide zendesk account `email` and `password`'
204
  sink:
205
- _target_: obsei.sink.ZendeskSink
206
  config:
207
- _target_: obsei.sink.ZendeskSinkConfig
208
  domain: "zendesk.com"
209
  subdomain: null
210
  cred_info:
211
- _target_: obsei.sink.ZendeskCredInfo
212
  email: ''
213
  password: ''
214
  Slack:
@@ -220,9 +220,9 @@ sink:
220
  - 'To get `channel id` refer -'
221
  - 'https://stackoverflow.com/questions/40940327/what-is-the-simplest-way-to-find-a-slack-team-id-and-a-channel-id'
222
  sink:
223
- _target_: obsei.sink.SlackSink
224
  config:
225
- _target_: obsei.sink.SlackSinkConfig
226
  slack_token: ''
227
  channel_id: ''
228
  jinja_template: |
@@ -245,9 +245,9 @@ sink:
245
  - ''
246
  - ' Provide server `hostname`, `port` along with `index` to be used'
247
  sink:
248
- _target_: obsei.sink.ElasticSearchSink
249
  config:
250
- _target_: obsei.sink.ElasticSearchSinkConfig
251
  host: "localhost"
252
  port: 9200
253
  index_name: "test"
@@ -259,9 +259,9 @@ sink:
259
  - ''
260
  - 'Provide http server `url` and `headers`'
261
  sink:
262
- _target_: obsei.sink.HttpSink
263
  config:
264
- _target_: obsei.sink.HttpSinkConfig
265
  url: 'https://localhost:8080/api/path'
266
  headers:
267
  Content-type: "application/json"
@@ -274,20 +274,20 @@ analyzer:
274
  - ''
275
  - 'Possible device values are `auto` (cuda:0 if available otherwise cpu), `cpu` and `cuda:{id}` (cuda device id)'
276
  config:
277
- _target_: obsei.analyzer.TransformersSentimentAnalyzerConfig
278
  labels:
279
  - "positive"
280
  - "negative"
281
  multi_class_classification: false
282
  analyzer:
283
- _target_: obsei.analyzer.TransformersSentimentAnalyzer
284
  model_name_or_path: "typeform/mobilebert-uncased-mnli"
285
  device: "auto"
286
  Vader:
287
  _help_:
288
  - 'Vader is less resource hungry dictionary based Vader Sentiment detector'
289
  analyzer:
290
- _target_: obsei.analyzer.VaderSentimentAnalyzer
291
  Classification:
292
  _icon_: "https://raw.githubusercontent.com/obsei/obsei-resources/master/logos/classification.png"
293
  Transformer:
@@ -298,14 +298,14 @@ analyzer:
298
  - ''
299
  - 'Possible device values are `auto` (cuda:0 if available otherwise cpu), `cpu` and `cuda:{id}` (cuda device id)'
300
  config:
301
- _target_: obsei.analyzer.ClassificationAnalyzerConfig
302
  labels:
303
  - "service"
304
  - "content"
305
  - "interface"
306
  multi_class_classification: true
307
  analyzer:
308
- _target_: obsei.analyzer.ZeroShotClassificationAnalyzer
309
  model_name_or_path: "typeform/mobilebert-uncased-mnli"
310
  device: "auto"
311
  Named Entity Recognition:
@@ -316,14 +316,14 @@ analyzer:
316
  - ''
317
  - 'Possible device values are `auto` (cuda:0 if available otherwise cpu), `cpu` and `cuda:{id}` (cuda device id)'
318
  analyzer:
319
- _target_: obsei.analyzer.TransformersNERAnalyzer
320
  model_name_or_path: "elastic/distilbert-base-cased-finetuned-conll03-english"
321
  device: "auto"
322
  Spacy:
323
  _help_:
324
  - 'For supported models refer https://spacy.io/models'
325
  analyzer:
326
- _target_: obsei.analyzer.SpacyNERAnalyzer
327
  model_name_or_path: "en_core_web_sm"
328
  Translation:
329
  _icon_: "https://raw.githubusercontent.com/obsei/obsei-resources/master/logos/translator.png"
@@ -333,7 +333,7 @@ analyzer:
333
  - ''
334
  - 'Possible device values are `auto` (cuda:0 if available otherwise cpu), `cpu` and `cuda:{id}` (cuda device id)'
335
  analyzer:
336
- _target_: obsei.analyzer.TranslationAnalyzer
337
  model_name_or_path: "Helsinki-NLP/opus-mt-en-hi"
338
  device: "auto"
339
  PII Anonymizer:
@@ -349,16 +349,16 @@ analyzer:
349
  - ''
350
  - 'Provide `model_name` and `lang_code` of the model'
351
  config:
352
- _target_: obsei.analyzer.PresidioPIIAnalyzerConfig
353
  analyze_only: false
354
  return_decision_process: false
355
  analyzer:
356
- _target_: obsei.analyzer.PresidioPIIAnalyzer
357
  engine_config:
358
- _target_: obsei.analyzer.PresidioEngineConfig
359
  nlp_engine_name: "spacy"
360
  models:
361
- - _target_: obsei.analyzer.PresidioModelConfig
362
  model_name: "en_core_web_md"
363
  lang_code: "en"
364
  Dummy:
@@ -367,6 +367,6 @@ analyzer:
367
  _help_:
368
  - 'Dummy Analyzer, do nothing it simply used for transforming input to output'
369
  config:
370
- _target_: obsei.analyzer.DummyAnalyzerConfig
371
  analyzer:
372
- _target_: obsei.analyzer.DummyAnalyzer
 
16
  - '`app_url` is application url on app store.
17
  - For example for Xcode - https://apps.apple.com/us/app/xcode/id497799835'
18
  source:
19
+ _target_: obsei.source.appstore_scrapper.AppStoreScrapperSource
20
  config:
21
+ _target_: obsei.source.appstore_scrapper.AppStoreScrapperConfig
22
  app_url: "https://apps.apple.com/us/app/gmail-email-by-google/id422689480"
23
  lookup_period: "1h"
24
  max_count: 5
 
42
  - 'For `queries` enter google maps urls or place ids, for example'
43
  - "https://www.google.co.in/maps/place/Taj+Mahal/@27.1751496,78.0399535,17z/data=!4m5!3m4!1s0x39747121d702ff6d:0xdd2ae4803f767dde!8m2!3d27.1751448!4d78.0421422"
44
  source:
45
+ _target_: obsei.source.google_maps_reviews.OSGoogleMapsReviewsSource
46
  config:
47
+ _target_: obsei.source.google_maps_reviews.OSGoogleMapsReviewsConfig
48
  api_key: ''
49
  queries:
50
  - "https://www.google.co.in/maps/place/Taj+Mahal/@27.1751496,78.0399535,17z/data=!4m5!3m4!1s0x39747121d702ff6d:0xdd2ae4803f767dde!8m2!3d27.1751448!4d78.0421422"
 
55
  - 'Reddit subreddit, search etc rss url. For proper url refer following link -'
56
  - 'https://www.reddit.com/r/pathogendavid/comments/tv8m9/pathogendavids_guide_to_rss_and_reddit/'
57
  source:
58
+ _target_: obsei.source.reddit_scrapper.RedditScrapperSource
59
  config:
60
+ _target_: obsei.source.reddit_scrapper.RedditScrapperConfig
61
  url: 'https://www.reddit.com/r/wallstreetbets/comments/.rss?sort=new'
62
  lookup_period: "1h"
63
  Twitter:
 
67
  - ''
68
  - 'Need twitter `consumer key` and `secret`, get it from https://developer.twitter.com/en/apply-for-access'
69
  source:
70
+ _target_: obsei.source.twitter_source.TwitterSource
71
  config:
72
+ _target_: obsei.source.twitter_source.TwitterSourceConfig
73
  query: "@Twitter"
74
  lookup_period: "1h"
75
  max_tweets: 10
76
  cred_info:
77
+ _target_: obsei.source.twitter_source.TwitterCredentials
78
  consumer_key: ''
79
  consumer_secret: ''
80
  Facebook:
 
84
  - ''
85
  - 'Need facebook app_id, app_secret and long_term_token. Get it from https://developers.facebook.com/apps/'
86
  source:
87
+ _target_: obsei.source.facebook_source.FacebookSource
88
  config:
89
+ _target_: obsei.source.facebook_source.FacebookSourceConfig
90
  page_id: "110844591144719"
91
  lookup_period: "1h"
92
  cred_info:
93
+ _target_: obsei.source.facebook_source.FacebookCredentials
94
  app_id: ''
95
  app_secret: ''
96
  long_term_token: ''
 
103
  - 'https://myaccount.google.com/lesssecureapps?pli=1'
104
  - 'Also enable IMAP access - https://mail.google.com/mail/u/0/#settings/fwdandpop'
105
  source:
106
+ _target_: obsei.source.email_source.EmailSource
107
  config:
108
+ _target_: obsei.source.email_source.EmailConfig
109
  imap_server: 'imap.gmail.com'
110
  cred_info:
111
+ _target_: obsei.source.email_source.EmailCredInfo
112
  username: ''
113
  password: ''
114
  lookup_period: "1h"
 
118
  - 'Reddit account `username` and `password` require'
119
  - 'Enter list of `subreddits`'
120
  source:
121
+ _target_: obsei.source.reddit_source.RedditSource
122
  config:
123
+ _target_: obsei.source.reddit_source.RedditConfig
124
  subreddits:
125
  - 'wallstreetbets'
126
  cred_info:
127
+ _target_: obsei.source.reddit_source.RedditCredInfo
128
  username: ''
129
  password: ''
130
  lookup_period: "1h"
 
133
  _help_:
134
  - '`fetch_article` use crawler to fetch full article'
135
  source:
136
+ _target_: obsei.source.google_news_source.GoogleNewsSource
137
  config:
138
+ _target_: obsei.source.google_news_source.GoogleNewsConfig
139
  query: "bitcoin"
140
  max_results: 3
141
  lookup_period: "1d"
 
148
  - 'For example - https://play.google.com/store/apps/details?id=com.google.android.gm&hl=en&gl=US'
149
  - '`com.google.android.gm` is the `package name` for Gmail and `us` is `country`.'
150
  source:
151
+ _target_: obsei.source.website_crawler_source.TrafilaturaCrawlerSource
152
  config:
153
+ _target_: obsei.source.website_crawler_source.TrafilaturaCrawlerConfig
154
  urls:
155
  - 'https://obsei.github.io/obsei/'
156
  sink:
 
165
  _icon_: "https://raw.githubusercontent.com/obsei/obsei-resources/master/logos/logger.png"
166
  _help_: null
167
  sink:
168
+ _target_: obsei.sink.logger_sink.LoggerSink
169
  config:
170
+ _target_: obsei.sink.logger_sink.LoggerSinkConfig
171
  Jira:
172
  _icon_: "https://raw.githubusercontent.com/obsei/obsei-resources/master/logos/jira.png"
173
  _help_:
 
182
  - '`project` in which issue to be created, for more information refer -'
183
  - 'https://support.atlassian.com/jira-software-cloud/docs/what-is-a-jira-software-project/'
184
  sink:
185
+ _target_: obsei.sink.jira_sink.JiraSink
186
  config:
187
+ _target_: obsei.sink.jira_sink.JiraSinkConfig
188
  url: 'http://localhost:2990/jira'
189
  username: ''
190
  password: ''
 
202
  - ''
203
  - 'Provide zendesk account `email` and `password`'
204
  sink:
205
+ _target_: obsei.sink.zendesk_sink.ZendeskSink
206
  config:
207
+ _target_: obsei.sink.zendesk_sink.ZendeskSinkConfig
208
  domain: "zendesk.com"
209
  subdomain: null
210
  cred_info:
211
+ _target_: obsei.sink.zendesk_sink.ZendeskCredInfo
212
  email: ''
213
  password: ''
214
  Slack:
 
220
  - 'To get `channel id` refer -'
221
  - 'https://stackoverflow.com/questions/40940327/what-is-the-simplest-way-to-find-a-slack-team-id-and-a-channel-id'
222
  sink:
223
+ _target_: obsei.sink.slack_sink.SlackSink
224
  config:
225
+ _target_: obsei.sink.slack_sink.SlackSinkConfig
226
  slack_token: ''
227
  channel_id: ''
228
  jinja_template: |
 
245
  - ''
246
  - ' Provide server `hostname`, `port` along with `index` to be used'
247
  sink:
248
+ _target_: obsei.sink.elasticsearch_sink.ElasticSearchSink
249
  config:
250
+ _target_: obsei.sink.elasticsearch_sink.ElasticSearchSinkConfig
251
  host: "localhost"
252
  port: 9200
253
  index_name: "test"
 
259
  - ''
260
  - 'Provide http server `url` and `headers`'
261
  sink:
262
+ _target_: obsei.sink.http_sink.HttpSink
263
  config:
264
+ _target_: obsei.sink.http_sink.HttpSinkConfig
265
  url: 'https://localhost:8080/api/path'
266
  headers:
267
  Content-type: "application/json"
 
274
  - ''
275
  - 'Possible device values are `auto` (cuda:0 if available otherwise cpu), `cpu` and `cuda:{id}` (cuda device id)'
276
  config:
277
+ _target_: obsei.analyzer.sentiment_analyzer.TransformersSentimentAnalyzerConfig
278
  labels:
279
  - "positive"
280
  - "negative"
281
  multi_class_classification: false
282
  analyzer:
283
+ _target_: obsei.analyzer.sentiment_analyzer.TransformersSentimentAnalyzer
284
  model_name_or_path: "typeform/mobilebert-uncased-mnli"
285
  device: "auto"
286
  Vader:
287
  _help_:
288
  - 'Vader is less resource hungry dictionary based Vader Sentiment detector'
289
  analyzer:
290
+ _target_: obsei.analyzer.sentiment_analyzer.VaderSentimentAnalyzer
291
  Classification:
292
  _icon_: "https://raw.githubusercontent.com/obsei/obsei-resources/master/logos/classification.png"
293
  Transformer:
 
298
  - ''
299
  - 'Possible device values are `auto` (cuda:0 if available otherwise cpu), `cpu` and `cuda:{id}` (cuda device id)'
300
  config:
301
+ _target_: obsei.analyzer.classification_analyzer.ClassificationAnalyzerConfig
302
  labels:
303
  - "service"
304
  - "content"
305
  - "interface"
306
  multi_class_classification: true
307
  analyzer:
308
+ _target_: obsei.analyzer.classification_analyzer.ZeroShotClassificationAnalyzer
309
  model_name_or_path: "typeform/mobilebert-uncased-mnli"
310
  device: "auto"
311
  Named Entity Recognition:
 
316
  - ''
317
  - 'Possible device values are `auto` (cuda:0 if available otherwise cpu), `cpu` and `cuda:{id}` (cuda device id)'
318
  analyzer:
319
+ _target_: obsei.analyzer.ner_analyzer.TransformersNERAnalyzer
320
  model_name_or_path: "elastic/distilbert-base-cased-finetuned-conll03-english"
321
  device: "auto"
322
  Spacy:
323
  _help_:
324
  - 'For supported models refer https://spacy.io/models'
325
  analyzer:
326
+ _target_: obsei.analyzer.ner_analyzer.SpacyNERAnalyzer
327
  model_name_or_path: "en_core_web_sm"
328
  Translation:
329
  _icon_: "https://raw.githubusercontent.com/obsei/obsei-resources/master/logos/translator.png"
 
333
  - ''
334
  - 'Possible device values are `auto` (cuda:0 if available otherwise cpu), `cpu` and `cuda:{id}` (cuda device id)'
335
  analyzer:
336
+ _target_: obsei.analyzer.translation_analyzer.TranslationAnalyzer
337
  model_name_or_path: "Helsinki-NLP/opus-mt-en-hi"
338
  device: "auto"
339
  PII Anonymizer:
 
349
  - ''
350
  - 'Provide `model_name` and `lang_code` of the model'
351
  config:
352
+ _target_: obsei.analyzer.pii_analyzer.PresidioPIIAnalyzerConfig
353
  analyze_only: false
354
  return_decision_process: false
355
  analyzer:
356
+ _target_: obsei.analyzer.pii_analyzer.PresidioPIIAnalyzer
357
  engine_config:
358
+ _target_: obsei.analyzer.pii_analyzer.PresidioEngineConfig
359
  nlp_engine_name: "spacy"
360
  models:
361
+ - _target_: obsei.analyzer.pii_analyzer.PresidioModelConfig
362
  model_name: "en_core_web_md"
363
  lang_code: "en"
364
  Dummy:
 
367
  _help_:
368
  - 'Dummy Analyzer, do nothing it simply used for transforming input to output'
369
  config:
370
+ _target_: obsei.analyzer.dummy_analyzer.DummyAnalyzerConfig
371
  analyzer:
372
+ _target_: obsei.analyzer.dummy_analyzer.DummyAnalyzer