LysandreJik committed on
Commit
67a0dec
1 Parent(s): 5d5fa0b

Initial commit

Browse files
.gitattributes CHANGED
@@ -14,3 +14,8 @@
14
  *.pb filter=lfs diff=lfs merge=lfs -text
15
  *.pt filter=lfs diff=lfs merge=lfs -text
16
  *.pth filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
14
  *.pb filter=lfs diff=lfs merge=lfs -text
15
  *.pt filter=lfs diff=lfs merge=lfs -text
16
  *.pth filter=lfs diff=lfs merge=lfs -text
17
+ elmo_token_embeddings.hdf5 filter=lfs diff=lfs merge=lfs -text
18
+ lm_embeddings_0.hdf5 filter=lfs diff=lfs merge=lfs -text
19
+ lm_embeddings_1.hdf5 filter=lfs diff=lfs merge=lfs -text
20
+ lm_embeddings_2.hdf5 filter=lfs diff=lfs merge=lfs -text
21
+ lm_weights.hdf5 filter=lfs diff=lfs merge=lfs -text
config/characters_token_embedder.json ADDED
@@ -0,0 +1,52 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_reader": {
3
+ "type": "conll2003",
4
+ "tag_label": "ner",
5
+ "token_indexers": {
6
+ "tokens": {
7
+ "type": "single_id",
8
+ "lowercase_tokens": true
9
+ },
10
+ "elmo": {
11
+ "type": "elmo_characters"
12
+ }
13
+ }
14
+ },
15
+ "train_data_path": "test_fixtures/data/conll2003.txt",
16
+ "validation_data_path": "test_fixtures/data/conll2003.txt",
17
+ "model": {
18
+ "type": "simple_tagger",
19
+ "text_field_embedder": {
20
+ "token_embedders": {
21
+ "tokens": {
22
+ "type": "embedding",
23
+ "embedding_dim": 50
24
+ },
25
+ "elmo": {
26
+ "type": "elmo_token_embedder",
27
+ "options_file": "test_fixtures/elmo/options.json",
28
+ "weight_file": "test_fixtures/elmo/lm_weights.hdf5"
29
+ }
30
+ }
31
+ },
32
+ "encoder": {
33
+ "type": "gru",
34
+ "input_size": 82,
35
+ "hidden_size": 25,
36
+ "num_layers": 2,
37
+ "dropout": 0.5,
38
+ "bidirectional": true
39
+ },
40
+ "regularizer": {
41
+ "regexes": [
42
+ ["transitions$", {"type": "l2", "alpha": 0.01}]
43
+ ]
44
+ }
45
+ },
46
+ "data_loader": {"batch_size": 32},
47
+ "trainer": {
48
+ "optimizer": "adam",
49
+ "num_epochs": 5,
50
+ "cuda_device": -1
51
+ }
52
+ }
elmo_token_embeddings.hdf5 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39cd3c881b66b74a7b7d0ba231dbed57cfac89a6a248f4d34e5ec94589e0bd68
3
+ size 31456
lm_embeddings_0.hdf5 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebeee87fe246cacc2dd4b6b109537cd03bf45c8f5402d3570be7c57ddcb6ea21
3
+ size 44000
lm_embeddings_1.hdf5 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c1547698ac31d92e2965a555656f0f4680b83ab4ab0a54958646bcbb0f00da0
3
+ size 34016
lm_embeddings_2.hdf5 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b10dabcc36b9461cb49a4ea20b01f395c779df340963fa66cf053b8c99f8f676
3
+ size 35936
lm_weights.hdf5 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dfdfd3001b5965b4b6ef857ac772b6624984f8248eaae08fb9be6d1b51ad8755
3
+ size 450896
options.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "lstm": {
3
+ "cell_clip": 3,
4
+ "use_skip_connections": true,
5
+ "n_layers": 2,
6
+ "proj_clip": 3,
7
+ "projection_dim": 16,
8
+ "dim": 64
9
+ },
10
+ "char_cnn": {
11
+ "embedding": {
12
+ "dim": 4
13
+ },
14
+ "filters": [
15
+ [1, 4],
16
+ [2, 8],
17
+ [3, 16],
18
+ [4, 32],
19
+ [5, 64]
20
+ ],
21
+ "n_highway": 2,
22
+ "n_characters": 262,
23
+ "max_characters_per_token": 50,
24
+ "activation": "relu"
25
+ }
26
+ }
sentences.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ [
3
+ "The U.S. Centers for Disease Control and Prevention initially advised school systems to close if outbreaks occurred , then reversed itself , saying the apparent mildness of the virus meant most schools and day care centers should stay open , even if they had confirmed cases of swine flu .",
4
+ "When Ms. Winfrey invited Suzanne Somers to share her controversial views about bio-identical hormone treatment on her syndicated show in 2009 , it won Ms. Winfrey a rare dollop of unflattering press , including a Newsweek cover story titled \" Crazy Talk : Oprah , Wacky Cures & You . \"",
5
+ "Elk calling -- a skill that hunters perfected long ago to lure game with the promise of a little romance -- is now its own sport .",
6
+ "Don 't !",
7
+ "Fish , ranked 98th in the world , fired 22 aces en route to a 6-3 , 6-7 ( 5 \/ 7 ) , 7-6 ( 7 \/ 4 ) win over seventh-seeded Argentinian David Nalbandian .",
8
+ "Why does everything have to become such a big issue ?",
9
+ "AMMAN ( Reuters ) - King Abdullah of Jordan will meet U.S. President Barack Obama in Washington on April 21 to lobby on behalf of Arab states for a stronger U.S. role in Middle East peacemaking , palace officials said on Sunday .",
10
+ "To help keep traffic flowing the Congestion Charge will remain in operation through-out the strike and TfL will be suspending road works on major London roads wherever possible .",
11
+ "If no candidate wins an absolute majority , there will be a runoff between the top two contenders , most likely in mid-October .",
12
+ "Authorities previously served search warrants at Murray 's Las Vegas home and his businesses in Las Vegas and Houston ."
13
+ ],
14
+ [
15
+ "Brent North Sea crude for November delivery rose 84 cents to 68.88 dollars a barrel .",
16
+ "That seems to have been their model up til now .",
17
+ "Gordon will join Luol Deng on the GB team ; their respective NBA teams , the Detroit Pistons and the Chicago Bulls , play tonight .",
18
+ "Nikam maintains the attacks were masterminded by the Muslim militant group Lashkar-e-Taiba .",
19
+ "Last year , Williams was unseeded , ranked 81st and coming off one of her worst losses on tour -- in a Tier 4 event at Hobart -- yet she beat six seeded players en route to the title at Melbourne Park .",
20
+ "It said that two officers involved in the case had been disciplined .",
21
+ "\" There is more intelligence now being gathered , \" the official said , adding that such efforts would continue for some time .",
22
+ "The majority will be of the standard 6X6 configuration for carrying personnel .",
23
+ "\" Consequently , necessary actions may not be taken to reduce the risks to children of sexual exploitation and drug or alcohol misuse , \" the report said . \u2022 Almost two-thirds of inspected schools were good or outstanding , but the number of underperforming secondaries remained \" stubborn and persistent . \"",
24
+ "What a World Cup ."
25
+ ],
26
+ [
27
+ "But , there have also been many cases of individuals and small groups of people protesting , as in the case of Rongye Adak , a nomad who called for the return of the Dalai Lama and for the freedom of Tibet during the Lithang Horse Racing Festival , in eastern Tibet .",
28
+ "James Duncan , head of transportation at Bournemouth Borough Council , said : \" Our legal team is reviewing the entitlement of taxis to drop and pick up passengers at bus stops , only for as long as is absolutely necessary to fulfil that function and for no other reason .",
29
+ "To Mo concerning the food log you kept -- Dr. Buchholz recommends the same thing .",
30
+ "The CBO estimates that only 23 percent of that would be spent in 2009 and 2010 .",
31
+ "Even so , Democrats slammed Bush as out of touch .",
32
+ "An information campaign will be launched later to raise awareness of employment rights and how to enforce them .",
33
+ "At the gallery the concept is less vague , as Ms. Piper cites specific instances of racial violence , political assassinations and the devastation of Hurricane Katrina .",
34
+ "There have been some exceptions -- such as Medicare in 1965 .",
35
+ "The government guidance will be reviewed early next year after a period of public comment .",
36
+ "It wasn 't the most seaworthy of prizes ."
37
+ ]
38
+ ]
vocab_test.txt ADDED
@@ -0,0 +1,458 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ good
2
+ Why
3
+ employment
4
+ government
5
+ Don
6
+ care
7
+ ;
8
+ case
9
+ North
10
+ Bush
11
+ assassinations
12
+ you
13
+ disciplined
14
+ press
15
+ romance
16
+ major
17
+ Muslim
18
+ sport
19
+ flu
20
+ entitlement
21
+ <S>
22
+ nomad
23
+ now
24
+ fulfil
25
+ Oprah
26
+ reviewing
27
+ enforce
28
+ number
29
+ log
30
+ rights
31
+ suspending
32
+ warrants
33
+ coming
34
+ stubborn
35
+ Hurricane
36
+ Duncan
37
+ East
38
+ role
39
+ Katrina
40
+ it
41
+ businesses
42
+ a
43
+ At
44
+ been
45
+ Disease
46
+ necessary
47
+ Racing
48
+ later
49
+ 's
50
+ specific
51
+ would
52
+ groups
53
+ next
54
+ masterminded
55
+ misuse
56
+ London
57
+ kept
58
+ become
59
+ November
60
+ centers
61
+ 22
62
+ To
63
+ day
64
+ title
65
+ outbreaks
66
+ AMMAN
67
+ his
68
+ 21
69
+ concept
70
+ early
71
+ dollars
72
+ is
73
+ people
74
+ game
75
+ confirmed
76
+ palace
77
+ syndicated
78
+ issue
79
+ school
80
+ called
81
+ It
82
+ had
83
+ rare
84
+ remain
85
+ Elk
86
+ some
87
+ world
88
+ unseeded
89
+ (
90
+ What
91
+ inspected
92
+ Jordan
93
+ touch
94
+ Newsweek
95
+ Argentinian
96
+ after
97
+ seems
98
+ contenders
99
+ runoff
100
+ tonight
101
+ -
102
+ Charge
103
+ Authorities
104
+ stops
105
+ When
106
+ top
107
+ public
108
+ respective
109
+ Lithang
110
+ 68.88
111
+ Nalbandian
112
+ sexual
113
+ vague
114
+ cents
115
+ political
116
+ Festival
117
+ Bulls
118
+ <UNK>
119
+ wasn
120
+ freedom
121
+ Suzanne
122
+ !
123
+ calling
124
+ thing
125
+ officers
126
+ return
127
+ ,
128
+ route
129
+ Abdullah
130
+ David
131
+ everything
132
+ GB
133
+ year
134
+ players
135
+ Middle
136
+ works
137
+ views
138
+ April
139
+ wins
140
+ through-out
141
+ Brent
142
+ •
143
+ close
144
+ treatment
145
+ But
146
+ World
147
+ There
148
+ and
149
+ eastern
150
+ in
151
+ not
152
+ personnel
153
+ carrying
154
+ between
155
+ Lashkar-e-Taiba
156
+ may
157
+ fired
158
+ home
159
+ Murray
160
+ 98th
161
+ they
162
+ 81st
163
+ outstanding
164
+ have
165
+ Winfrey
166
+ hunters
167
+ advised
168
+ reduce
169
+ Somers
170
+ were
171
+ 2010
172
+ NBA
173
+ King
174
+ gallery
175
+ traffic
176
+ Vegas
177
+ also
178
+ racial
179
+ if
180
+ being
181
+ risks
182
+ percent
183
+ no
184
+ maintains
185
+ guidance
186
+ more
187
+ worst
188
+ Buchholz
189
+ devastation
190
+ off
191
+ Chicago
192
+ barrel
193
+ Washington
194
+ Last
195
+ titled
196
+ show
197
+ Centers
198
+ during
199
+ gathered
200
+ Gordon
201
+ operation
202
+ remained
203
+ even
204
+ Deng
205
+ 't
206
+ Mo
207
+ taken
208
+ militant
209
+ play
210
+ 6-3
211
+ Melbourne
212
+ Luol
213
+ the
214
+ absolute
215
+ she
216
+ one
217
+ secondaries
218
+ /
219
+ behalf
220
+ food
221
+ concerning
222
+ spent
223
+ should
224
+ cover
225
+ </S>
226
+ standard
227
+ stay
228
+ Arab
229
+ her
230
+ same
231
+ 6-7
232
+ mildness
233
+ individuals
234
+ that
235
+ team
236
+ seeded
237
+ win
238
+ many
239
+ U.S.
240
+ Consequently
241
+ Horse
242
+ wherever
243
+ served
244
+ initially
245
+ event
246
+ awareness
247
+ peacemaking
248
+ Sunday
249
+ so
250
+ Piper
251
+ 5
252
+ teams
253
+ six
254
+ swine
255
+ Almost
256
+ join
257
+ --
258
+ attacks
259
+ 7
260
+ mid-October
261
+ promise
262
+ Pistons
263
+ 84
264
+ time
265
+ to
266
+ flowing
267
+ involved
268
+ Democrats
269
+ lobby
270
+ TfL
271
+ tour
272
+ meet
273
+ majority
274
+ recommends
275
+ Dr.
276
+ stronger
277
+ seventh-seeded
278
+ campaign
279
+ head
280
+ group
281
+ seaworthy
282
+ saying
283
+ Las
284
+ cites
285
+ Lama
286
+ states
287
+ Detroit
288
+ Borough
289
+ Williams
290
+ children
291
+ including
292
+ configuration
293
+ Park
294
+ Tier
295
+ pick
296
+ out
297
+ Reuters
298
+ such
299
+ "
300
+ ?
301
+ Tibet
302
+ Cup
303
+ dollop
304
+ own
305
+ of
306
+ other
307
+ how
308
+ transportation
309
+ CBO
310
+ rose
311
+ legal
312
+ open
313
+ little
314
+ exploitation
315
+ alcohol
316
+ said
317
+ official
318
+ roads
319
+ Adak
320
+ period
321
+ as
322
+ instances
323
+ absolutely
324
+ Fish
325
+ Houston
326
+ was
327
+ long
328
+ protesting
329
+ raise
330
+ occurred
331
+ That
332
+ beat
333
+ Crazy
334
+ apparent
335
+ unflattering
336
+ their
337
+ two-thirds
338
+ information
339
+ itself
340
+ controversial
341
+ reversed
342
+ prizes
343
+ underperforming
344
+ search
345
+ at
346
+ passengers
347
+ 7-6
348
+ yet
349
+ Council
350
+ slammed
351
+ .
352
+ small
353
+ model
354
+ Talk
355
+ meant
356
+ aces
357
+ drop
358
+ keep
359
+ Cures
360
+ strike
361
+ An
362
+ Bournemouth
363
+ officials
364
+ invited
365
+ road
366
+ Wacky
367
+ schools
368
+ by
369
+ Nikam
370
+ systems
371
+ 4
372
+ previously
373
+ who
374
+ launched
375
+ possible
376
+ them
377
+ violence
378
+ two
379
+ estimates
380
+ hormone
381
+ taxis
382
+ ago
383
+ less
384
+ 1965
385
+ over
386
+ Prevention
387
+ actions
388
+ be
389
+ most
390
+ does
391
+ Control
392
+ Barack
393
+ continue
394
+ perfected
395
+ reason
396
+ 2009
397
+ delivery
398
+ up
399
+ crude
400
+ Rongye
401
+ losses
402
+ drug
403
+ Ms.
404
+ Congestion
405
+ about
406
+ skill
407
+ til
408
+ bus
409
+ for
410
+ Our
411
+ Dalai
412
+ virus
413
+ James
414
+ Even
415
+ story
416
+ The
417
+ lure
418
+ Obama
419
+ then
420
+ report
421
+ or
422
+ )
423
+ with
424
+ help
425
+ persistent
426
+ on
427
+ Hobart
428
+ President
429
+ 23
430
+ share
431
+ ranked
432
+ Medicare
433
+ there
434
+ won
435
+ bio-identical
436
+ candidate
437
+ :
438
+ en
439
+ only
440
+ likely
441
+ efforts
442
+ You
443
+ adding
444
+ will
445
+ cases
446
+ exceptions
447
+ intelligence
448
+ comment
449
+ but
450
+ reviewed
451
+ If
452
+ its
453
+ 6X6
454
+ &
455
+ Sea
456
+ big
457
+ an
458
+ function