AmitMY committed on
Commit
3a45c3b
1 Parent(s): 4525eff

Upload folder using huggingface_hub

Browse files
Files changed (5) hide show
  1. args.yaml +5 -5
  2. config +96 -102
  3. metrics +0 -0
  4. params.best +2 -2
  5. vocab.src.0.json +0 -0
args.yaml CHANGED
@@ -51,7 +51,7 @@ local_rank: null
51
  loglevel: INFO
52
  loglevel_secondary_workers: INFO
53
  max_checkpoints: null
54
- max_num_checkpoint_not_improved: 50
55
  max_num_epochs: null
56
  max_samples: null
57
  max_seconds: null
@@ -59,7 +59,7 @@ max_seq_len:
59
  - 512
60
  - 512
61
  max_updates: null
62
- min_num_epochs: null
63
  min_samples: null
64
  min_updates: null
65
  momentum: 0.0
@@ -83,11 +83,11 @@ optimizer_betas:
83
  - 0.9
84
  - 0.999
85
  optimizer_eps: 1.0e-08
86
- output: /shares/volk.cl.uzh/amoryo/checkpoints/signwriting-translation/spoken-to-signed/target-factors-tuned/model
87
  overwrite_output: false
88
  pad_vocab_to_multiple_of: 8
89
- params: /shares/volk.cl.uzh/amoryo/checkpoints/signwriting-translation/spoken-to-signed/target-factors-v4/model/params.best
90
- prepared_data: /shares/volk.cl.uzh/amoryo/checkpoints/signwriting-translation/spoken-to-signed/target-factors-tuned/train_data
91
  quiet: false
92
  quiet_secondary_workers: false
93
  seed: 1
 
51
  loglevel: INFO
52
  loglevel_secondary_workers: INFO
53
  max_checkpoints: null
54
+ max_num_checkpoint_not_improved: 100
55
  max_num_epochs: null
56
  max_samples: null
57
  max_seconds: null
 
59
  - 512
60
  - 512
61
  max_updates: null
62
+ min_num_epochs: 10
63
  min_samples: null
64
  min_updates: null
65
  momentum: 0.0
 
83
  - 0.9
84
  - 0.999
85
  optimizer_eps: 1.0e-08
86
+ output: /shares/iict-sp2.ebling.cl.uzh/amoryo/checkpoints/signwriting-translation/spoken-to-signed/target-factors-gpt-tuned/model
87
  overwrite_output: false
88
  pad_vocab_to_multiple_of: 8
89
+ params: /shares/iict-sp2.ebling.cl.uzh/amoryo/checkpoints/signwriting-translation/spoken-to-signed/target-factors-gpt/model/params.best
90
+ prepared_data: /shares/iict-sp2.ebling.cl.uzh/amoryo/checkpoints/signwriting-translation/spoken-to-signed/target-factors-gpt-tuned/train_data
91
  quiet: false
92
  quiet_secondary_workers: false
93
  seed: 1
config CHANGED
@@ -2,30 +2,30 @@
2
  config_data: !DataConfig
3
  data_statistics: !DataStatistics
4
  average_len_target_per_bucket:
5
- - 6.01988730121871
6
- - 10.49707202236441
7
- - 18.536005711954232
8
- - 25.91453940066591
9
- - 33.44474802671516
10
- - 41.29017292281736
11
- - 50.38165137614682
12
- - 59.57928802588991
13
- - 67.86491420226359
14
- - 75.76032388663967
15
- - 82.68249075215772
16
- - 12.0
17
- - 23.333333333333332
18
- - 24.88888888888889
19
- - 15.857142857142856
20
- - 8.6
21
- - 8.0
22
- - 6.5
23
- - 4.5
24
- - null
25
- - 6.25
26
  - 6.0
27
- - 8.0
28
- - 10.0
 
 
 
 
 
 
 
29
  - null
30
  - null
31
  - null
@@ -263,80 +263,73 @@ config_data: !DataConfig
263
  - !!python/tuple
264
  - 513
265
  - 513
266
- length_ratio_mean: 1.4422861755889766
267
  length_ratio_stats_per_bucket:
268
  - !!python/tuple
269
- - 1.1255982284370691
270
- - 0.3093025169709561
271
- - !!python/tuple
272
- - 1.6064942041128283
273
- - 0.6417946634210556
274
- - !!python/tuple
275
- - 2.359196679910085
276
- - 0.9575904838242857
277
  - !!python/tuple
278
- - 2.9607196399710274
279
- - 1.5584344652106463
280
  - !!python/tuple
281
- - 2.9543389770526325
282
- - 2.297144978089179
283
  - !!python/tuple
284
- - 3.002340450312629
285
- - 2.18681603522054
286
  - !!python/tuple
287
- - 3.081058473996043
288
- - 2.5011199006515183
289
  - !!python/tuple
290
- - 2.9163894753348045
291
- - 2.2789742432670086
292
  - !!python/tuple
293
- - 2.9722600022754504
294
- - 2.230352263818367
295
  - !!python/tuple
296
- - 3.138369081443168
297
- - 2.4620594208603235
298
  - !!python/tuple
299
- - 2.854253034817575
300
- - 1.6376340581023332
301
  - !!python/tuple
302
- - 0.12974460739238317
303
- - 0.160679251677897
304
  - !!python/tuple
305
- - 0.23436597326420017
306
- - 0.24015947073924906
307
  - !!python/tuple
308
- - 0.23457181630569815
309
- - 0.2675720247460546
310
  - !!python/tuple
311
- - 0.1366625632624212
312
- - 0.16557849394412172
313
  - !!python/tuple
314
- - 0.06941451000342352
315
- - 0.02389100863634256
316
  - !!python/tuple
317
- - 0.05970149253731343
318
  - 0.0
319
  - !!python/tuple
320
- - 0.04609929078014184
321
- - 0.017730496453900707
322
  - !!python/tuple
323
- - 0.03063680118474639
324
- - 0.0036097741577193615
325
- - &id001 !!python/tuple
326
- - null
327
- - null
328
  - !!python/tuple
329
- - 0.038657633805228714
330
- - 0.010237907973024957
331
  - !!python/tuple
332
- - 0.03469146238377008
333
- - 0.004700847851307781
334
- - !!python/tuple
335
- - 0.0446927374301676
336
  - 0.0
337
  - !!python/tuple
338
- - 0.05405405405405406
339
  - 0.0
 
 
 
 
 
340
  - *id001
341
  - *id001
342
  - *id001
@@ -378,36 +371,37 @@ config_data: !DataConfig
378
  - *id001
379
  - *id001
380
  - *id001
381
- length_ratio_std: 0.8479651722336846
382
- max_observed_len_source: 185
 
383
  max_observed_len_target: 87
384
  num_discarded: 0
385
- num_sents: 425392
386
  num_sents_per_bucket:
387
- - 245433
388
- - 135930
389
- - 19608
390
- - 7208
391
- - 3294
392
- - 2371
393
- - 2180
394
- - 2472
395
- - 2739
396
- - 2470
397
- - 1622
398
- - 20
399
- - 9
400
- - 9
401
- - 7
402
- - 5
403
- - 1
404
- - 2
405
  - 2
406
- - 0
407
  - 4
408
- - 3
409
- - 1
410
  - 2
 
 
 
 
 
411
  - 0
412
  - 0
413
  - 0
@@ -449,11 +443,11 @@ config_data: !DataConfig
449
  - 0
450
  - 0
451
  - 0
452
- num_tokens_source: 3056735
453
- num_tokens_target: 4427820
454
  num_unks_source: 0
455
  num_unks_target: 0
456
- size_vocab_source: 8016
457
  size_vocab_target: 656
458
  eop_id: -1
459
  max_seq_len_source: 513
@@ -485,7 +479,7 @@ config_embed_source: !EmbeddingConfig
485
  factor_configs: null
486
  num_embed: 512
487
  num_factors: 1
488
- vocab_size: 8016
489
  config_embed_target: !EmbeddingConfig
490
  allow_sparse_grad: false
491
  dropout: 0.5
@@ -537,6 +531,6 @@ dtype: float32
537
  lhuc: false
538
  neural_vocab_selection: null
539
  neural_vocab_selection_block_loss: false
540
- vocab_source_size: 8016
541
  vocab_target_size: 656
542
  weight_tying_type: trg_softmax
 
2
  config_data: !DataConfig
3
  data_statistics: !DataStatistics
4
  average_len_target_per_bucket:
5
+ - 6.011277314861252
6
+ - 10.39671010650862
7
+ - 18.504618481112797
8
+ - 26.041977712863865
9
+ - 32.48293857888395
10
+ - 41.60258525852575
11
+ - 51.3669121514993
12
+ - 59.76513060097686
13
+ - 68.25156398104271
14
+ - 75.67976141505562
15
+ - 83.09476309226905
16
+ - 21.1875
17
+ - 7.749999999999999
18
+ - 5.833333333333333
 
 
 
 
 
 
 
19
  - 6.0
20
+ - 7.0
21
+ - 7.25
22
+ - 6.333333333333333
23
+ - 7.0
24
+ - 5.0
25
+ - null
26
+ - null
27
+ - null
28
+ - null
29
  - null
30
  - null
31
  - null
 
263
  - !!python/tuple
264
  - 513
265
  - 513
266
+ length_ratio_mean: 1.4462363190719616
267
  length_ratio_stats_per_bucket:
268
  - !!python/tuple
269
+ - 1.13785261776882
270
+ - 0.30617192612461125
 
 
 
 
 
 
271
  - !!python/tuple
272
+ - 1.6532001104346803
273
+ - 0.6379238313847178
274
  - !!python/tuple
275
+ - 2.471066932954014
276
+ - 0.9542933578872858
277
  - !!python/tuple
278
+ - 2.9657919123449297
279
+ - 1.5793440289847793
280
  - !!python/tuple
281
+ - 3.096168086847911
282
+ - 2.441325976657657
283
  - !!python/tuple
284
+ - 3.268248874962792
285
+ - 2.2403195790511785
286
  - !!python/tuple
287
+ - 3.453956732311208
288
+ - 2.518686961607376
289
  - !!python/tuple
290
+ - 3.2456624469723585
291
+ - 2.2619507905455962
292
  - !!python/tuple
293
+ - 3.322785538319874
294
+ - 2.1624153548695157
295
  - !!python/tuple
296
+ - 3.489342008082259
297
+ - 2.469578333618206
298
  - !!python/tuple
299
+ - 3.278259980416589
300
+ - 1.6906831932492183
301
  - !!python/tuple
302
+ - 0.23045117210041233
303
+ - 0.26501940303452104
304
  - !!python/tuple
305
+ - 0.07818400556098729
306
+ - 0.027479091254378488
307
  - !!python/tuple
308
+ - 0.05445908159715249
309
+ - 0.013332869808672716
310
  - !!python/tuple
311
+ - 0.05042016806722689
312
  - 0.0
313
  - !!python/tuple
314
+ - 0.05658536585365853
315
+ - 0.016585365853658534
316
  - !!python/tuple
317
+ - 0.05537665840439907
318
+ - 0.021182928316626336
 
 
 
319
  - !!python/tuple
320
+ - 0.04568795432892477
321
+ - 0.009015856562239487
322
  - !!python/tuple
323
+ - 0.047619047619047616
 
 
 
324
  - 0.0
325
  - !!python/tuple
326
+ - 0.032679738562091505
327
  - 0.0
328
+ - &id001 !!python/tuple
329
+ - null
330
+ - null
331
+ - *id001
332
+ - *id001
333
  - *id001
334
  - *id001
335
  - *id001
 
371
  - *id001
372
  - *id001
373
  - *id001
374
+ - *id001
375
+ length_ratio_std: 0.8476478699398606
376
+ max_observed_len_source: 153
377
  max_observed_len_target: 87
378
  num_discarded: 0
379
+ num_sents: 779247
380
  num_sents_per_bucket:
381
+ - 478128
382
+ - 233503
383
+ - 27823
384
+ - 9243
385
+ - 4982
386
+ - 3636
387
+ - 3802
388
+ - 4709
389
+ - 5275
390
+ - 4862
391
+ - 3208
392
+ - 32
393
+ - 8
394
+ - 12
 
 
 
 
395
  - 2
 
396
  - 4
397
+ - 8
398
+ - 6
399
  - 2
400
+ - 2
401
+ - 0
402
+ - 0
403
+ - 0
404
+ - 0
405
  - 0
406
  - 0
407
  - 0
 
443
  - 0
444
  - 0
445
  - 0
446
+ num_tokens_source: 5305413
447
+ num_tokens_target: 7842731
448
  num_unks_source: 0
449
  num_unks_target: 0
450
+ size_vocab_source: 45864
451
  size_vocab_target: 656
452
  eop_id: -1
453
  max_seq_len_source: 513
 
479
  factor_configs: null
480
  num_embed: 512
481
  num_factors: 1
482
+ vocab_size: 45864
483
  config_embed_target: !EmbeddingConfig
484
  allow_sparse_grad: false
485
  dropout: 0.5
 
531
  lhuc: false
532
  neural_vocab_selection: null
533
  neural_vocab_selection_block_loss: false
534
+ vocab_source_size: 45864
535
  vocab_target_size: 656
536
  weight_tying_type: trg_softmax
metrics CHANGED
The diff for this file is too large to render. See raw diff
 
params.best CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fbc40d947ce0a1c03679cc4c62a4a94c11b179a485637727fc1b491a063042c4
3
- size 201248510
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3cbabac4d28a48fbef952e0155e471556d607dda6700a919f08b44b49299597
3
+ size 278761214
vocab.src.0.json CHANGED
The diff for this file is too large to render. See raw diff