pere committed on
Commit
44cf2aa
1 Parent(s): 59ee58e

Commit from model create scripts

Browse files
config.gin CHANGED
@@ -31,7 +31,7 @@ MODEL_DIR = 'gs://nb-t5x-us-central2/finetuned/scandi3_3stammer_v2_base'
31
  OPTIMIZER = @adafactor.Adafactor()
32
  RANDOM_SEED = 0
33
  TASK_FEATURE_LENGTHS = {'inputs': 512, 'targets': 512}
34
- TRAIN_STEPS = 3100000
35
  USE_CACHED_TASKS = False
36
  USE_HARDWARE_RNG = False
37
  VOCABULARY = @seqio.SentencePieceVocabulary()
31
  OPTIMIZER = @adafactor.Adafactor()
32
  RANDOM_SEED = 0
33
  TASK_FEATURE_LENGTHS = {'inputs': 512, 'targets': 512}
34
+ TRAIN_STEPS = 3300000
35
  USE_CACHED_TASKS = False
36
  USE_HARDWARE_RNG = False
37
  VOCABULARY = @seqio.SentencePieceVocabulary()
config.json CHANGED
@@ -26,14 +26,5 @@
26
  "torch_dtype": "float32",
27
  "transformers_version": "4.19.2",
28
  "use_cache": true,
29
- "max_length": 512,
30
- "task_specific_params": {
31
- "text-generation": {
32
- "max_length": 512
33
- },
34
- "translation": {
35
- "max_length": 512
36
- }
37
- },
38
  "vocab_size": 250112
39
  }
26
  "torch_dtype": "float32",
27
  "transformers_version": "4.19.2",
28
  "use_cache": true,
 
 
 
 
 
 
 
 
 
29
  "vocab_size": 250112
30
  }
flax_model.msgpack CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:af86406264accac6a46ee82ca7bd94c774e2257a990e0ab18b5a8b2ce1bc3968
3
  size 2329617315
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9bffa8608e66655a7e99017923cd7c5194d5002fe2851c5ed46c09eb31eb09f1
3
  size 2329617315
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae81423872018be47b5f66faa04cb72da4972552ade35e91a11f8da7080442e3
3
  size 2329696333
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1fa4ebc7ed41aa462491be7f9d1be37cb6df0357fad80920ca1fe96a3f5fa2d6
3
  size 2329696333
train/events.out.tfevents.1667313658.t1v-n-101cf975-w-0.21692.0.v2 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f88916972825e1375a0743c0e5888723f8fd0b5e0c10a50a8e82be10cd6935a
3
- size 147027
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0b28aa102d956b57eb1d8d33576ab6f5a7c345274519c99f0675753b2e144cc
3
+ size 225507
train/events.out.tfevents.1667421797.t1v-n-101cf975-w-0.623115.0.v2 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:badfa6b6804f1bf63e05f6da6f517b42e6dc42edbe738420cded1265546f7be7
3
+ size 99067
training_eval/translate/events.out.tfevents.1667313658.t1v-n-101cf975-w-0.21692.1.v2 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:81177c88a19dfc1a5ea055f428e1b42a2a6c4ef1b2ccb3d89ac9a4c57ca5a4d6
3
- size 114047
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:911b26e6b66e2d9022d23202393e05045dbaf6a7d39832a0cea662a479358d78
3
+ size 178127
training_eval/translate/events.out.tfevents.1667421797.t1v-n-101cf975-w-0.623115.1.v2 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25de68e105f8ae5604ccab397aca319b01ff641123cf0adb79195f84796b0241
3
+ size 74887