wizardofchance committed on
Commit
25f9d37
1 Parent(s): 3bc457f

Add BERTopic model

Browse files
Files changed (6) hide show
  1. README.md +71 -0
  2. config.json +16 -0
  3. ctfidf.safetensors +3 -0
  4. ctfidf_config.json +876 -0
  5. topic_embeddings.safetensors +3 -0
  6. topics.json +139 -0
README.md ADDED
@@ -0,0 +1,71 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ ---
3
+ tags:
4
+ - bertopic
5
+ library_name: bertopic
6
+ pipeline_tag: text-classification
7
+ ---
8
+
9
+ # NER_conllpp
10
+
11
+ This is a [BERTopic](https://github.com/MaartenGr/BERTopic) model.
12
+ BERTopic is a flexible and modular topic modeling framework that allows for the generation of easily interpretable topics from large datasets.
13
+
14
+ ## Usage
15
+
16
+ To use this model, please install BERTopic:
17
+
18
+ ```
19
+ pip install -U bertopic
20
+ ```
21
+
22
+ You can use the model as follows:
23
+
24
+ ```python
25
+ from bertopic import BERTopic
26
+ topic_model = BERTopic.load("wizardofchance/NER_conllpp")
27
+
28
+ topic_model.get_topic_info()
29
+ ```
30
+
31
+ ## Topic overview
32
+
33
+ * Number of topics: 2
34
+ * Number of training documents: 26
35
+
36
+ <details>
37
+ <summary>Click here for an overview of all topics.</summary>
38
+
39
+ | Topic ID | Topic Keywords | Topic Frequency | Label |
40
+ |----------|----------------|-----------------|-------|
41
+ | 0 | peacekeeping - gandhi - terrorism - peace - terrorists | 19 | 0_peacekeeping_gandhi_terrorism_peace |
42
+ | 1 | nations - organization - united - peace - council | 7 | 1_nations_organization_united_peace |
43
+
44
+ </details>
45
+
46
+ ## Training hyperparameters
47
+
48
+ * calculate_probabilities: False
49
+ * language: None
50
+ * low_memory: False
51
+ * min_topic_size: 10
52
+ * n_gram_range: (1, 1)
53
+ * nr_topics: None
54
+ * seed_topic_list: None
55
+ * top_n_words: 10
56
+ * verbose: False
57
+ * zeroshot_min_similarity: 0.7
58
+ * zeroshot_topic_list: None
59
+
60
+ ## Framework versions
61
+
62
+ * Numpy: 1.25.2
63
+ * HDBSCAN: 0.8.33
64
+ * UMAP: 0.5.6
65
+ * Pandas: 2.0.3
66
+ * Scikit-Learn: 1.2.2
67
+ * Sentence-transformers: 2.7.0
68
+ * Transformers: 4.40.1
69
+ * Numba: 0.58.1
70
+ * Plotly: 5.15.0
71
+ * Python: 3.10.12
config.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "calculate_probabilities": false,
3
+ "language": null,
4
+ "low_memory": false,
5
+ "min_topic_size": 10,
6
+ "n_gram_range": [
7
+ 1,
8
+ 1
9
+ ],
10
+ "nr_topics": null,
11
+ "seed_topic_list": null,
12
+ "top_n_words": 10,
13
+ "verbose": false,
14
+ "zeroshot_min_similarity": 0.7,
15
+ "zeroshot_topic_list": null
16
+ }
ctfidf.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46c3297589ce0b7afa88069274abe2047067470c7df7804b2f1a92f8a3c01d76
3
+ size 18480
ctfidf_config.json ADDED
@@ -0,0 +1,876 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "ctfidf_model": {
3
+ "bm25_weighting": false,
4
+ "reduce_frequent_words": false
5
+ },
6
+ "vectorizer_model": {
7
+ "params": {
8
+ "analyzer": "word",
9
+ "binary": false,
10
+ "decode_error": "strict",
11
+ "encoding": "utf-8",
12
+ "input": "content",
13
+ "lowercase": true,
14
+ "max_df": 1.0,
15
+ "max_features": null,
16
+ "min_df": 1,
17
+ "ngram_range": [
18
+ 1,
19
+ 1
20
+ ],
21
+ "stop_words": "english",
22
+ "strip_accents": null,
23
+ "token_pattern": "(?u)\\b\\w\\w+\\b",
24
+ "vocabulary": null
25
+ },
26
+ "vocab": {
27
+ "united": 805,
28
+ "nations": 506,
29
+ "marking": 468,
30
+ "seventieth": 704,
31
+ "anniversary": 62,
32
+ "year": 840,
33
+ "making": 461,
34
+ "session": 702,
35
+ "general": 336,
36
+ "assembly": 81,
37
+ "historic": 363,
38
+ "hope": 370,
39
+ "terms": 759,
40
+ "outcomes": 541,
41
+ "like": 441,
42
+ "assure": 85,
43
+ "president": 594,
44
+ "receive": 641,
45
+ "india": 393,
46
+ "support": 746,
47
+ "efforts": 265,
48
+ "seventy": 705,
49
+ "years": 841,
50
+ "ago": 51,
51
+ "foundations": 327,
52
+ "laid": 424,
53
+ "san": 696,
54
+ "francisco": 329,
55
+ "conference": 159,
56
+ "city": 136,
57
+ "west": 830,
58
+ "coast": 142,
59
+ "country": 193,
60
+ "signatory": 710,
61
+ "countries": 192,
62
+ "charter": 131,
63
+ "time": 770,
64
+ "independent": 392,
65
+ "obtained": 527,
66
+ "independence": 391,
67
+ "later": 427,
68
+ "established": 292,
69
+ "diminutive": 236,
70
+ "looking": 451,
71
+ "man": 463,
72
+ "powerful": 586,
73
+ "weapon": 828,
74
+ "non": 521,
75
+ "violence": 818,
76
+ "writing": 839,
77
+ "final": 314,
78
+ "act": 36,
79
+ "struggle": 739,
80
+ "symbol": 750,
81
+ "colonized": 145,
82
+ "oppressed": 537,
83
+ "grateful": 345,
84
+ "proclaimed": 607,
85
+ "birthday": 104,
86
+ "extraordinary": 304,
87
+ "international": 404,
88
+ "day": 208,
89
+ "pleasing": 577,
90
+ "coincidence": 143,
91
+ "tomorrow": 774,
92
+ "october": 531,
93
+ "and42": 61,
94
+ "55": 27,
95
+ "15": 4,
96
+ "29658": 21,
97
+ "01": 1,
98
+ "10": 2,
99
+ "2015": 12,
100
+ "70": 30,
101
+ "pv": 626,
102
+ "22that": 19,
103
+ "celebrating": 124,
104
+ "mahatma": 456,
105
+ "gandhi": 334,
106
+ "said": 694,
107
+ "difference": 233,
108
+ "capable": 118,
109
+ "doing": 249,
110
+ "suffice": 744,
111
+ "solve": 724,
112
+ "world": 838,
113
+ "problems": 604,
114
+ "message": 482,
115
+ "fitting": 320,
116
+ "context": 174,
117
+ "today": 772,
118
+ "ravaged": 634,
119
+ "war": 825,
120
+ "continents": 175,
121
+ "security": 698,
122
+ "council": 189,
123
+ "powerless": 587,
124
+ "unwilling": 807,
125
+ "stem": 736,
126
+ "low": 454,
127
+ "blood": 105,
128
+ "traditional": 779,
129
+ "solutions": 723,
130
+ "rely": 661,
131
+ "force": 323,
132
+ "exacerbated": 295,
133
+ "ask": 78,
134
+ "political": 584,
135
+ "craft": 198,
136
+ "alternatives": 55,
137
+ "conflict": 160,
138
+ "pursue": 625,
139
+ "commitment": 148,
140
+ "single": 714,
141
+ "minded": 490,
142
+ "dedication": 215,
143
+ "goal": 341,
144
+ "important": 384,
145
+ "peacekeeping": 565,
146
+ "blue": 106,
147
+ "flag": 321,
148
+ "men": 480,
149
+ "women": 836,
150
+ "constantly": 167,
151
+ "working": 837,
152
+ "prevent": 596,
153
+ "protect": 617,
154
+ "civilians": 137,
155
+ "sustain": 747,
156
+ "peace": 562,
157
+ "processes": 606,
158
+ "180": 6,
159
+ "000": 0,
160
+ "peacekeepers": 564,
161
+ "deployed": 226,
162
+ "far": 310,
163
+ "largest": 426,
164
+ "contributor": 182,
165
+ "provided": 620,
166
+ "indian": 394,
167
+ "military": 487,
168
+ "police": 581,
169
+ "personnel": 570,
170
+ "participating": 554,
171
+ "missions": 495,
172
+ "operating": 534,
173
+ "highly": 362,
174
+ "challenging": 129,
175
+ "environments": 284,
176
+ "remains": 663,
177
+ "committed": 150,
178
+ "continuing": 178,
179
+ "operations": 535,
180
+ "enhancing": 279,
181
+ "contributions": 181,
182
+ "announced": 63,
183
+ "prime": 600,
184
+ "minister": 491,
185
+ "leaders": 429,
186
+ "summit": 745,
187
+ "new": 518,
188
+ "cover": 197,
189
+ "aspects": 80,
190
+ "enablers": 274,
191
+ "training": 783,
192
+ "dilution": 235,
193
+ "cardinal": 121,
194
+ "principles": 602,
195
+ "occur": 530,
196
+ "fact": 308,
197
+ "troop": 791,
198
+ "contributing": 180,
199
+ "role": 687,
200
+ "formulation": 325,
201
+ "mandates": 465,
202
+ "amended": 57,
203
+ "consultation": 170,
204
+ "matter": 470,
205
+ "concern": 156,
206
+ "clear": 139,
207
+ "violation": 817,
208
+ "article": 75,
209
+ "44": 24,
210
+ "believe": 101,
211
+ "substitute": 741,
212
+ "high": 361,
213
+ "level": 437,
214
+ "panel": 550,
215
+ "underscored": 800,
216
+ "mark": 467,
217
+ "opportunity": 536,
218
+ "pay": 561,
219
+ "tribute": 790,
220
+ "300": 22,
221
+ "including": 389,
222
+ "161": 5,
223
+ "ultimate": 796,
224
+ "sacrifice": 691,
225
+ "stand": 730,
226
+ "ready": 638,
227
+ "contribute": 179,
228
+ "memorial": 479,
229
+ "wall": 822,
230
+ "approved": 69,
231
+ "ninth": 520,
232
+ "safety": 693,
233
+ "future": 333,
234
+ "community": 152,
235
+ "depend": 225,
236
+ "respond": 672,
237
+ "greatest": 346,
238
+ "threat": 767,
239
+ "face": 307,
240
+ "terrorism": 761,
241
+ "lived": 446,
242
+ "quarter": 628,
243
+ "century": 126,
244
+ "tragically": 782,
245
+ "brought": 112,
246
+ "home": 368,
247
+ "autumn": 89,
248
+ "2001": 10,
249
+ "adequately": 41,
250
+ "countered": 191,
251
+ "proliferation": 610,
252
+ "terrorist": 762,
253
+ "acts": 38,
254
+ "rise": 685,
255
+ "extremist": 306,
256
+ "ideologies": 380,
257
+ "impunity": 386,
258
+ "states": 735,
259
+ "organized": 539,
260
+ "action": 37,
261
+ "defeat": 217,
262
+ "demonstrate": 224,
263
+ "zero": 846,
264
+ "tolerance": 773,
265
+ "terrorists": 763,
266
+ "kill": 419,
267
+ "maim": 457,
268
+ "innocent": 399,
269
+ "base": 97,
270
+ "principle": 601,
271
+ "prosecute": 614,
272
+ "extradite": 303,
273
+ "make": 460,
274
+ "provide": 619,
275
+ "financing": 317,
276
+ "safe": 692,
277
+ "havens": 355,
278
+ "arming": 73,
279
+ "heavy": 357,
280
+ "price": 599,
281
+ "equally": 288,
282
+ "establishment": 293,
283
+ "legal": 432,
284
+ "regime": 655,
285
+ "comprehensive": 154,
286
+ "convention": 184,
287
+ "longer": 449,
288
+ "held": 358,
289
+ "nineteen": 519,
290
+ "1996": 9,
291
+ "proposed": 613,
292
+ "member": 477,
293
+ "unable": 797,
294
+ "adopt": 42,
295
+ "mired": 494,
296
+ "issue": 411,
297
+ "definition": 218,
298
+ "understand": 801,
299
+ "distinction": 247,
300
+ "exists": 298,
301
+ "good": 343,
302
+ "bad": 94,
303
+ "linked15": 444,
304
+ "43": 23,
305
+ "22": 17,
306
+ "2015to": 14,
307
+ "religion": 660,
308
+ "commits": 149,
309
+ "crimes": 202,
310
+ "humanity": 376,
311
+ "appeal": 66,
312
+ "come": 147,
313
+ "pledge": 578,
314
+ "unanimously": 799,
315
+ "subject": 740,
316
+ "share": 707,
317
+ "challenges": 128,
318
+ "ties": 769,
319
+ "pakistan": 548,
320
+ "accept": 32,
321
+ "legitimate": 434,
322
+ "instrument": 403,
323
+ "statecraft": 733,
324
+ "shared": 708,
325
+ "outrage": 543,
326
+ "2008": 11,
327
+ "mumbai": 502,
328
+ "terror": 760,
329
+ "attacks": 87,
330
+ "citizens": 135,
331
+ "helplessly": 360,
332
+ "butchered": 116,
333
+ "mastermind": 469,
334
+ "attack": 86,
335
+ "walking": 821,
336
+ "free": 330,
337
+ "affront": 47,
338
+ "entire": 282,
339
+ "past": 559,
340
+ "assurances": 84,
341
+ "regard": 653,
342
+ "honoured": 369,
343
+ "cross": 206,
344
+ "border": 109,
345
+ "taken": 753,
346
+ "place": 571,
347
+ "recently": 643,
348
+ "captured": 120,
349
+ "alive": 54,
350
+ "know": 420,
351
+ "meant": 473,
352
+ "destabilize": 228,
353
+ "legitimize": 435,
354
+ "illegal": 381,
355
+ "occupation": 529,
356
+ "parts": 558,
357
+ "state": 732,
358
+ "jammu": 413,
359
+ "kashmir": 417,
360
+ "claim": 138,
361
+ "rest": 677,
362
+ "let": 436,
363
+ "use": 810,
364
+ "occasion": 528,
365
+ "spell": 727,
366
+ "approach": 68,
367
+ "clearly": 140,
368
+ "open": 533,
369
+ "dialogue": 232,
370
+ "finds": 318,
371
+ "talks": 756,
372
+ "incompatible": 390,
373
+ "yesterday": 843,
374
+ "termed": 758,
375
+ "point": 579,
376
+ "initiative": 398,
377
+ "need": 510,
378
+ "points": 580,
379
+ "just": 416,
380
+ "sit": 715,
381
+ "talk": 755,
382
+ "precisely": 589,
383
+ "discussed": 242,
384
+ "decided": 212,
385
+ "ministers": 493,
386
+ "ufa": 795,
387
+ "july": 415,
388
+ "hold": 366,
389
+ "national": 504,
390
+ "advisers": 44,
391
+ "issues": 412,
392
+ "connected": 164,
393
+ "arrange": 74,
394
+ "early": 253,
395
+ "meeting": 476,
396
+ "directors": 237,
397
+ "address": 40,
398
+ "situation": 716,
399
+ "response": 673,
400
+ "credible": 201,
401
+ "prepared": 592,
402
+ "outstanding": 544,
403
+ "bilateral": 102,
404
+ "counter": 190,
405
+ "menace": 481,
406
+ "acknowledge": 35,
407
+ "real": 639,
408
+ "social": 720,
409
+ "economic": 259,
410
+ "progress": 609,
411
+ "critical": 205,
412
+ "elimination": 267,
413
+ "basic": 99,
414
+ "human": 374,
415
+ "want": 823,
416
+ "leads": 431,
417
+ "invariably": 405,
418
+ "peaceful": 563,
419
+ "societies": 721,
420
+ "evidenced": 294,
421
+ "map": 466,
422
+ "conflicts": 161,
423
+ "engulf": 278,
424
+ "days": 209,
425
+ "adopted": 43,
426
+ "2030": 16,
427
+ "agenda": 50,
428
+ "sustainable": 748,
429
+ "development": 231,
430
+ "resolution": 669,
431
+ "goals": 342,
432
+ "core": 187,
433
+ "constitute": 168,
434
+ "blueprint": 107,
435
+ "holistic": 367,
436
+ "millennium": 488,
437
+ "successful": 743,
438
+ "implementation": 383,
439
+ "require": 668,
440
+ "resolve": 670,
441
+ "inclination": 387,
442
+ "toshare": 777,
443
+ "technology": 757,
444
+ "financial": 316,
445
+ "resources": 671,
446
+ "simultaneously": 713,
447
+ "improving": 385,
448
+ "delivery": 221,
449
+ "mechanisms": 474,
450
+ "woman": 835,
451
+ "elected": 266,
452
+ "parliament": 553,
453
+ "firm": 319,
454
+ "conviction": 185,
455
+ "shortcut": 709,
456
+ "change": 130,
457
+ "empowering": 272,
458
+ "girl": 338,
459
+ "child": 132,
460
+ "government": 344,
461
+ "policy": 582,
462
+ "programme": 608,
463
+ "educate": 262,
464
+ "empower": 271,
465
+ "conceived": 155,
466
+ "vision": 819,
467
+ "rests": 679,
468
+ "building": 113,
469
+ "planet": 573,
470
+ "children": 133,
471
+ "prepare": 591,
472
+ "meet": 475,
473
+ "months": 499,
474
+ "paris": 552,
475
+ "expects": 301,
476
+ "deliver": 219,
477
+ "ambitious": 56,
478
+ "agreement": 52,
479
+ "climate": 141,
480
+ "duty": 252,
481
+ "common": 151,
482
+ "mind": 489,
483
+ "larger": 425,
484
+ "historical": 364,
485
+ "differentiated": 234,
486
+ "responsibilities": 674,
487
+ "used": 811,
488
+ "needs": 512,
489
+ "greed": 347,
490
+ "adapting": 39,
491
+ "lifestyle": 440,
492
+ "choices": 134,
493
+ "reducing": 647,
494
+ "extravagant": 305,
495
+ "consumption": 171,
496
+ "help": 359,
497
+ "correct": 188,
498
+ "course": 195,
499
+ "reason": 640,
500
+ "equitable": 290,
501
+ "delivering": 220,
502
+ "concrete": 157,
503
+ "developing": 230,
504
+ "enabled": 273,
505
+ "developed": 229,
506
+ "areas": 72,
507
+ "finance": 315,
508
+ "transfer": 784,
509
+ "capacity": 119,
510
+ "willing": 831,
511
+ "partner": 555,
512
+ "global": 340,
513
+ "play": 575,
514
+ "reaching": 637,
515
+ "meaningful": 472,
516
+ "effective": 263,
517
+ "reverence": 681,
518
+ "environment": 283,
519
+ "based": 98,
520
+ "traditions": 780,
521
+ "nature": 508,
522
+ "sacred": 690,
523
+ "health": 356,
524
+ "tied": 768,
525
+ "guided": 350,
526
+ "yoga": 844,
527
+ "celebrated": 123,
528
+ "fervour": 313,
529
+ "192": 7,
530
+ "hallowed": 353,
531
+ "institution": 401,
532
+ "thank": 765,
533
+ "enthusiasm": 280,
534
+ "seed": 699,
535
+ "planted": 574,
536
+ "grow": 348,
537
+ "magnificent": 455,
538
+ "tree": 789,
539
+ "congratulate": 163,
540
+ "prompt": 612,
541
+ "tackling": 752,
542
+ "epidemics": 286,
543
+ "linking": 445,
544
+ "managed": 464,
545
+ "eradicate": 291,
546
+ "smallpox": 719,
547
+ "nearly": 509,
548
+ "polio": 583,
549
+ "hiv": 365,
550
+ "aids": 53,
551
+ "controlled": 183,
552
+ "ebola": 258,
553
+ "outbreak": 540,
554
+ "contained": 172,
555
+ "unacceptably": 798,
556
+ "lives": 447,
557
+ "paid": 547,
558
+ "epidemic": 285,
559
+ "example": 296,
560
+ "crisis": 204,
561
+ "proud": 618,
562
+ "that44": 766,
563
+ "22india": 18,
564
+ "played": 576,
565
+ "inspired": 400,
566
+ "successes": 742,
567
+ "redouble": 645,
568
+ "diseases": 245,
569
+ "tuberculosis": 794,
570
+ "malaria": 462,
571
+ "natural": 507,
572
+ "disasters": 240,
573
+ "deserve": 227,
574
+ "coordinated": 186,
575
+ "recent": 642,
576
+ "wanting": 824,
577
+ "refugee": 652,
578
+ "caused": 122,
579
+ "situations": 717,
580
+ "syria": 751,
581
+ "iraq": 408,
582
+ "libya": 438,
583
+ "needed": 511,
584
+ "swift": 749,
585
+ "backed": 93,
586
+ "humanitarian": 375,
587
+ "crises": 203,
588
+ "neighbourhood": 515,
589
+ "quick": 631,
590
+ "responsive": 676,
591
+ "nepal": 516,
592
+ "yemen": 842,
593
+ "emerged": 269,
594
+ "net": 517,
595
+ "provider": 621,
596
+ "assisting": 82,
597
+ "nationals": 505,
598
+ "sought": 725,
599
+ "hosting": 372,
600
+ "asian": 77,
601
+ "ministerial": 492,
602
+ "disaster": 239,
603
+ "risk": 686,
604
+ "reduction": 648,
605
+ "november": 525,
606
+ "2016": 15,
607
+ "topic": 776,
608
+ "sendai": 701,
609
+ "framework": 328,
610
+ "walked": 820,
611
+ "long": 448,
612
+ "way": 826,
613
+ "25": 20,
614
+ "billion": 103,
615
+ "countrymen": 194,
616
+ "attest": 88,
617
+ "happy": 354,
618
+ "knowledge": 421,
619
+ "democratic": 223,
620
+ "deeply": 216,
621
+ "embedded": 268,
622
+ "nonetheless": 522,
623
+ "transformative": 786,
624
+ "reinvigorate": 657,
625
+ "nation": 503,
626
+ "redeem": 644,
627
+ "spirit": 728,
628
+ "modi": 497,
629
+ "took": 775,
630
+ "office": 532,
631
+ "half": 351,
632
+ "renewal": 665,
633
+ "rightful": 683,
634
+ "affairs": 45,
635
+ "fastest": 311,
636
+ "growing": 349,
637
+ "major": 459,
638
+ "economy": 261,
639
+ "driving": 251,
640
+ "premised": 590,
641
+ "motto": 500,
642
+ "sabka": 689,
643
+ "saath": 688,
644
+ "vikas": 816,
645
+ "places": 572,
646
+ "emphasis": 270,
647
+ "welfare": 829,
648
+ "people": 566,
649
+ "africa": 48,
650
+ "region": 656,
651
+ "bonds": 108,
652
+ "solidarity": 722,
653
+ "born": 110,
654
+ "colonialism": 144,
655
+ "belief": 100,
656
+ "prosperity": 615,
657
+ "month": 498,
658
+ "host": 371,
659
+ "forum": 326,
660
+ "54": 26,
661
+ "african": 49,
662
+ "invited": 407,
663
+ "nuclear": 526,
664
+ "aware": 91,
665
+ "responsibility": 675,
666
+ "discriminatory": 241,
667
+ "verifiable": 813,
668
+ "disarmament": 238,
669
+ "undiminished": 802,
670
+ "life": 439,
671
+ "milestone": 486,
672
+ "look": 450,
673
+ "reflect": 649,
674
+ "achieved": 34,
675
+ "lost": 453,
676
+ "similarly": 712,
677
+ "associated": 83,
678
+ "provides": 622,
679
+ "analyse": 59,
680
+ "fulfilled": 331,
681
+ "purpose": 624,
682
+ "set": 703,
683
+ "question": 629,
684
+ "affirmative": 46,
685
+ "answer": 64,
686
+ "questions": 630,
687
+ "negative": 513,
688
+ "preventing": 597,
689
+ "decolonization": 214,
690
+ "dismantling": 246,
691
+ "apartheid": 65,
692
+ "combating": 146,
693
+ "hunger": 378,
694
+ "promoting": 611,
695
+ "democracy": 222,
696
+ "rights": 684,
697
+ "able": 31,
698
+ "taking": 754,
699
+ "various": 812,
700
+ "permanent": 568,
701
+ "path": 560,
702
+ "treading": 788,
703
+ "according": 33,
704
+ "parameters": 551,
705
+ "appears": 67,
706
+ "ineffective": 395,
707
+ "maintaining": 458,
708
+ "failed": 309,
709
+ "effectively": 264,
710
+ "area": 71,
711
+ "started": 731,
712
+ "reach": 635,
713
+ "enthusiastically": 281,
714
+ "partners": 556,
715
+ "focused": 322,
716
+ "foremost": 324,
717
+ "immediate": 382,
718
+ "results": 680,
719
+ "truly": 792,
720
+ "transformational": 785,
721
+ "reached": 636,
722
+ "extended": 302,
723
+ "renewing": 666,
724
+ "ancient": 60,
725
+ "linkages": 443,
726
+ "constructing": 169,
727
+ "modern": 496,
728
+ "partnerships": 557,
729
+ "14": 3,
730
+ "pacific": 546,
731
+ "island": 410,
732
+ "east": 256,
733
+ "replaced": 667,
734
+ "previous": 598,
735
+ "vigorous": 815,
736
+ "proactive": 603,
737
+ "engagement": 277,
738
+ "economically": 260,
739
+ "vibrant": 814,
740
+ "complements": 153,
741
+ "link": 442,
742
+ "remain": 662,
743
+ "middle": 484,
744
+ "process": 605,
745
+ "key": 418,
746
+ "radicalization": 632,
747
+ "continue": 176,
748
+ "asolution": 79,
749
+ "palestinian": 549,
750
+ "qualitatively": 627,
751
+ "upgraded": 808,
752
+ "relations": 658,
753
+ "powers": 588,
754
+ "institutions": 402,
755
+ "periodic": 567,
756
+ "organization": 538,
757
+ "meaning": 471,
758
+ "continues": 177,
759
+ "dominated": 250,
760
+ "wealthy": 827,
761
+ "influential": 397,
762
+ "notion": 524,
763
+ "sovereign": 726,
764
+ "equality": 287,
765
+ "permitted": 569,
766
+ "unfair": 803,
767
+ "norms": 523,
768
+ "fundamental": 332,
769
+ "challenge": 127,
770
+ "inequity": 396,
771
+ "built": 114,
772
+ "preserve": 593,
773
+ "centrality": 125,
774
+ "legitimacy": 433,
775
+ "custodian": 207,
776
+ "urgent": 809,
777
+ "pressing": 595,
778
+ "reform": 651,
779
+ "hour": 373,
780
+ "reflects": 650,
781
+ "geopolitical": 337,
782
+ "architecture": 70,
783
+ "1945": 8,
784
+ "does": 248,
785
+ "latin": 428,
786
+ "america": 58,
787
+ "seats": 697,
788
+ "members": 478,
789
+ "include": 388,
790
+ "decision": 213,
791
+ "structures": 738,
792
+ "business": 115,
793
+ "away": 92,
794
+ "outdated": 542,
795
+ "transparent": 787,
796
+ "methods": 483,
797
+ "giving": 339,
798
+ "balance": 95,
799
+ "restore": 678,
800
+ "credibility": 200,
801
+ "equip": 289,
802
+ "confront": 162,
803
+ "times": 771,
804
+ "leadership": 430,
805
+ "excellences": 297,
806
+ "mr": 501,
807
+ "sam": 695,
808
+ "kutesa": 422,
809
+ "courtenay": 196,
810
+ "rattray": 633,
811
+ "decades": 211,
812
+ "discussions": 244,
813
+ "text": 764,
814
+ "negotiations": 514,
815
+ "69": 29,
816
+ "560": 28,
817
+ "step": 737,
818
+ "springboard": 729,
819
+ "unique": 804,
820
+ "significance": 711,
821
+ "revitalization": 682,
822
+ "invite": 406,
823
+ "hall": 352,
824
+ "contemplate": 173,
825
+ "idea": 379,
826
+ "as15": 76,
827
+ "45": 25,
828
+ "2015a": 13,
829
+ "banyan": 96,
830
+ "eastern": 257,
831
+ "tradition": 778,
832
+ "connotes": 165,
833
+ "wisdom": 832,
834
+ "judgemental": 414,
835
+ "encompassing": 275,
836
+ "trunk": 793,
837
+ "outwards": 545,
838
+ "sky": 718,
839
+ "earth": 254,
840
+ "expansive": 300,
841
+ "branches": 111,
842
+ "shade": 706,
843
+ "relief": 659,
844
+ "discussion": 243,
845
+ "debate": 210,
846
+ "unlike": 806,
847
+ "young": 845,
848
+ "constant": 166,
849
+ "regeneration": 654,
850
+ "expansion": 299,
851
+ "withers": 834,
852
+ "fate": 312,
853
+ "awaits": 90,
854
+ "renew": 664,
855
+ "condemn": 158,
856
+ "irrelevance": 409,
857
+ "tragic": 781,
858
+ "withering": 833,
859
+ "easily": 255,
860
+ "lose": 452,
861
+ "labyrinth": 423,
862
+ "creation": 199,
863
+ "seize": 700,
864
+ "potential": 585,
865
+ "reduce": 646,
866
+ "gap": 335,
867
+ "mighty": 485,
868
+ "providing": 623,
869
+ "canopy": 117,
870
+ "prosperous": 616,
871
+ "humankind": 377,
872
+ "end": 276,
873
+ "statement": 734
874
+ }
875
+ }
876
+ }
topic_embeddings.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6977f5c694fe1a67c6310281eaace43556b2d8c88980d9fe778e06851f7e9a03
3
+ size 3160
topics.json ADDED
@@ -0,0 +1,139 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "topic_representations": {
3
+ "0": [
4
+ [
5
+ "peacekeeping",
6
+ 0.472503125667572
7
+ ],
8
+ [
9
+ "gandhi",
10
+ 0.4510841369628906
11
+ ],
12
+ [
13
+ "terrorism",
14
+ 0.4001331925392151
15
+ ],
16
+ [
17
+ "peace",
18
+ 0.3992835581302643
19
+ ],
20
+ [
21
+ "terrorists",
22
+ 0.3799479007720947
23
+ ],
24
+ [
25
+ "peacekeepers",
26
+ 0.3790397644042969
27
+ ],
28
+ [
29
+ "nations",
30
+ 0.36890077590942383
31
+ ],
32
+ [
33
+ "terrorist",
34
+ 0.368724524974823
35
+ ],
36
+ [
37
+ "india",
38
+ 0.34991031885147095
39
+ ],
40
+ [
41
+ "agreement",
42
+ 0.29255202412605286
43
+ ]
44
+ ],
45
+ "1": [
46
+ [
47
+ "nations",
48
+ 0.4652634561061859
49
+ ],
50
+ [
51
+ "organization",
52
+ 0.32233119010925293
53
+ ],
54
+ [
55
+ "united",
56
+ 0.3044189512729645
57
+ ],
58
+ [
59
+ "peace",
60
+ 0.3019982576370239
61
+ ],
62
+ [
63
+ "council",
64
+ 0.2955605089664459
65
+ ],
66
+ [
67
+ "banyan",
68
+ 0.28722596168518066
69
+ ],
70
+ [
71
+ "leadership",
72
+ 0.26841428875923157
73
+ ],
74
+ [
75
+ "legitimacy",
76
+ 0.2673830986022949
77
+ ],
78
+ [
79
+ "goals",
80
+ 0.25846096873283386
81
+ ],
82
+ [
83
+ "conflicts",
84
+ 0.2502977252006531
85
+ ]
86
+ ]
87
+ },
88
+ "topics": [
89
+ 0,
90
+ 0,
91
+ 1,
92
+ 1,
93
+ 0,
94
+ 0,
95
+ 0,
96
+ 0,
97
+ 0,
98
+ 0,
99
+ 0,
100
+ 0,
101
+ 0,
102
+ 0,
103
+ 0,
104
+ 0,
105
+ 0,
106
+ 0,
107
+ 1,
108
+ 1,
109
+ 0,
110
+ 0,
111
+ 1,
112
+ 1,
113
+ 1,
114
+ 0
115
+ ],
116
+ "topic_sizes": {
117
+ "0": 19,
118
+ "1": 7
119
+ },
120
+ "topic_mapper": [
121
+ [
122
+ 0,
123
+ 0,
124
+ 0
125
+ ],
126
+ [
127
+ 1,
128
+ 1,
129
+ 1
130
+ ]
131
+ ],
132
+ "topic_labels": {
133
+ "0": "0_peacekeeping_gandhi_terrorism_peace",
134
+ "1": "1_nations_organization_united_peace"
135
+ },
136
+ "custom_labels": null,
137
+ "_outliers": 0,
138
+ "topic_aspects": {}
139
+ }