marinone94 commited on
Commit
a050237
β€’
1 Parent(s): ef8c3fa
checkpoint-20/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fc9a37bf342d6b4931c7270220724a92600d8294837cdbcd124a0ec5e19ec080
3
  size 2490337361
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f436b11b0e72d1e94060965296a9e9e846ca0f9771daa24e1a9345c5f9a7d16
3
  size 2490337361
checkpoint-20/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3628cb625fb06fb9b5feb8070ed125a0961b552a86df1fcdcbb45d1703f7757f
3
  size 1262063089
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d76176b1de3e024882e5dc97f4c62f8c353ad6bd2bb044b8780d02f878d5a8b
3
  size 1262063089
checkpoint-20/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:73e968b5fb75f3d028c5b87fc29d361b46586d839eb1fc406be3e77c69542778
3
  size 14567
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59257a32aba32d8c5fcf991ca9a70b329ffb647f6a2161088a777522fce19900
3
  size 14567
checkpoint-20/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a8d1040cd70f91f849688103143e8c9d631ff10c4acee0b2f4d6ff9e27727776
3
  size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de50320fd62b63ba68a5d5884bc2615e3b1236c94802e7d58610a99abb679720
3
  size 559
checkpoint-20/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dd820f300afb9f82707d847f7f02b33e058c7d1676a355fccacc0f7f2f251fcd
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dff68c58af865abbc7152291f4ccc6e0dc5bda2584ed11e74751073d18e44ac9
3
  size 623
checkpoint-20/trainer_state.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.26490066225165565,
5
  "global_step": 20,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
@@ -9,29 +9,29 @@
9
  "log_history": [
10
  {
11
  "epoch": 0.13,
12
- "learning_rate": 0.00045,
13
- "loss": 10.7126,
14
  "step": 10
15
  },
16
  {
17
  "epoch": 0.26,
18
- "learning_rate": 0.0007469387755102041,
19
- "loss": 5.3922,
20
  "step": 20
21
  },
22
  {
23
  "epoch": 0.26,
24
- "eval_loss": 3.5064597129821777,
25
- "eval_runtime": 4.8648,
26
- "eval_samples_per_second": 20.145,
27
- "eval_steps_per_second": 0.822,
28
  "eval_wer": 1.0,
29
  "step": 20
30
  }
31
  ],
32
- "max_steps": 750,
33
  "num_train_epochs": 10,
34
- "total_flos": 4.155165485184e+17,
35
  "trial_name": null,
36
  "trial_params": null
37
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.25559105431309903,
5
  "global_step": 20,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
 
9
  "log_history": [
10
  {
11
  "epoch": 0.13,
12
+ "learning_rate": 1.8749999999999998e-06,
13
+ "loss": 13.2907,
14
  "step": 10
15
  },
16
  {
17
  "epoch": 0.26,
18
+ "learning_rate": 3.7499999999999997e-06,
19
+ "loss": 17.4007,
20
  "step": 20
21
  },
22
  {
23
  "epoch": 0.26,
24
+ "eval_loss": 21.748823165893555,
25
+ "eval_runtime": 3.3192,
26
+ "eval_samples_per_second": 30.127,
27
+ "eval_steps_per_second": 1.205,
28
  "eval_wer": 1.0,
29
  "step": 20
30
  }
31
  ],
32
+ "max_steps": 780,
33
  "num_train_epochs": 10,
34
+ "total_flos": 3.123017532990259e+17,
35
  "trial_name": null,
36
  "trial_params": null
37
  }
checkpoint-20/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ad06bcea7129bc90fba0c606327162a14f89fd4622d165a2ff161b26e6fbb59e
3
  size 3055
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5806ee760f93397337bb9a8c9234fc7d900c26bb857abd80187ccde2f46dde70
3
  size 3055
checkpoint-300/config.json DELETED
@@ -1,115 +0,0 @@
1
- {
2
- "_name_or_path": "KBLab/wav2vec2-large-voxrex",
3
- "activation_dropout": 0.1,
4
- "adapter_kernel_size": 3,
5
- "adapter_stride": 2,
6
- "add_adapter": false,
7
- "apply_spec_augment": true,
8
- "architectures": [
9
- "Wav2Vec2ForCTC"
10
- ],
11
- "attention_dropout": 0.0,
12
- "bos_token_id": 1,
13
- "classifier_proj_size": 256,
14
- "codevector_dim": 768,
15
- "contrastive_logits_temperature": 0.1,
16
- "conv_bias": true,
17
- "conv_dim": [
18
- 512,
19
- 512,
20
- 512,
21
- 512,
22
- 512,
23
- 512,
24
- 512
25
- ],
26
- "conv_kernel": [
27
- 10,
28
- 3,
29
- 3,
30
- 3,
31
- 3,
32
- 2,
33
- 2
34
- ],
35
- "conv_stride": [
36
- 5,
37
- 2,
38
- 2,
39
- 2,
40
- 2,
41
- 2,
42
- 2
43
- ],
44
- "ctc_loss_reduction": "mean",
45
- "ctc_zero_infinity": false,
46
- "diversity_loss_weight": 0.1,
47
- "do_stable_layer_norm": true,
48
- "eos_token_id": 2,
49
- "feat_extract_activation": "gelu",
50
- "feat_extract_dropout": 0.0,
51
- "feat_extract_norm": "layer",
52
- "feat_proj_dropout": 0.0,
53
- "feat_quantizer_dropout": 0.0,
54
- "final_dropout": 0.0,
55
- "hidden_act": "gelu",
56
- "hidden_dropout": 0.0,
57
- "hidden_size": 1024,
58
- "initializer_range": 0.02,
59
- "intermediate_size": 4096,
60
- "layer_norm_eps": 1e-05,
61
- "layerdrop": 0.0,
62
- "mask_channel_length": 10,
63
- "mask_channel_min_space": 1,
64
- "mask_channel_other": 0.0,
65
- "mask_channel_prob": 0.0,
66
- "mask_channel_selection": "static",
67
- "mask_feature_length": 64,
68
- "mask_feature_min_masks": 0,
69
- "mask_feature_prob": 0.25,
70
- "mask_time_length": 10,
71
- "mask_time_min_masks": 2,
72
- "mask_time_min_space": 1,
73
- "mask_time_other": 0.0,
74
- "mask_time_prob": 0.75,
75
- "mask_time_selection": "static",
76
- "model_type": "wav2vec2",
77
- "num_adapter_layers": 3,
78
- "num_attention_heads": 16,
79
- "num_codevector_groups": 2,
80
- "num_codevectors_per_group": 320,
81
- "num_conv_pos_embedding_groups": 16,
82
- "num_conv_pos_embeddings": 128,
83
- "num_feat_extract_layers": 7,
84
- "num_hidden_layers": 24,
85
- "num_negatives": 100,
86
- "output_hidden_size": 1024,
87
- "pad_token_id": 31,
88
- "proj_codevector_dim": 768,
89
- "tdnn_dilation": [
90
- 1,
91
- 2,
92
- 3,
93
- 1,
94
- 1
95
- ],
96
- "tdnn_dim": [
97
- 512,
98
- 512,
99
- 512,
100
- 512,
101
- 1500
102
- ],
103
- "tdnn_kernel": [
104
- 5,
105
- 3,
106
- 3,
107
- 1,
108
- 1
109
- ],
110
- "torch_dtype": "float32",
111
- "transformers_version": "4.17.0.dev0",
112
- "use_weighted_layer_sum": false,
113
- "vocab_size": 34,
114
- "xvector_output_dim": 512
115
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-300/optimizer.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:7ae9e41884d3305d9a0797fd14fd35fc8e619e12951eedb6e1396e3ead551313
3
- size 2490337809
 
 
 
 
checkpoint-300/preprocessor_config.json DELETED
@@ -1,9 +0,0 @@
1
- {
2
- "do_normalize": true,
3
- "feature_extractor_type": "Wav2Vec2FeatureExtractor",
4
- "feature_size": 1,
5
- "padding_side": "right",
6
- "padding_value": 0,
7
- "return_attention_mask": true,
8
- "sampling_rate": 16000
9
- }
 
 
 
 
 
 
 
 
 
 
checkpoint-300/pytorch_model.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:4ba896f27a39cdc0a9c70e56aeff43d05c53ba85e3a65d2c02f13edcce3b7ac8
3
- size 1262063089
 
 
 
 
checkpoint-300/rng_state.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:7dad8817bedcf4b45f9a2d36af4404126640a18d28d8189d505ec2ab56d4b6a1
3
- size 14503
 
 
 
 
checkpoint-300/scaler.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:0967b9f865f16344c55f5ccc3cf7d6e8e97ca61dda304e931ca6bad130f48dd1
3
- size 559
 
 
 
 
checkpoint-300/scheduler.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:303fe9412b2bbace437d42323a895571355b0ae20c611a474d9492be12287f9c
3
- size 623
 
 
 
 
checkpoint-300/trainer_state.json DELETED
@@ -1,160 +0,0 @@
1
- {
2
- "best_metric": null,
3
- "best_model_checkpoint": null,
4
- "epoch": 3.8434504792332267,
5
- "global_step": 300,
6
- "is_hyper_param_search": false,
7
- "is_local_process_zero": true,
8
- "is_world_process_zero": true,
9
- "log_history": [
10
- {
11
- "epoch": 0.26,
12
- "learning_rate": 0.0007307692307692308,
13
- "loss": 4.2559,
14
- "step": 20
15
- },
16
- {
17
- "epoch": 0.51,
18
- "learning_rate": 0.0007115384615384615,
19
- "loss": 3.068,
20
- "step": 40
21
- },
22
- {
23
- "epoch": 0.64,
24
- "eval_loss": 3.058549165725708,
25
- "eval_runtime": 3.3353,
26
- "eval_samples_per_second": 29.982,
27
- "eval_steps_per_second": 1.199,
28
- "eval_wer": 1.0,
29
- "step": 50
30
- },
31
- {
32
- "epoch": 0.77,
33
- "learning_rate": 0.0006923076923076924,
34
- "loss": 3.0637,
35
- "step": 60
36
- },
37
- {
38
- "epoch": 1.03,
39
- "learning_rate": 0.0006730769230769232,
40
- "loss": 3.0752,
41
- "step": 80
42
- },
43
- {
44
- "epoch": 1.28,
45
- "learning_rate": 0.0006538461538461538,
46
- "loss": 3.0083,
47
- "step": 100
48
- },
49
- {
50
- "epoch": 1.28,
51
- "eval_loss": 3.1246652603149414,
52
- "eval_runtime": 3.2285,
53
- "eval_samples_per_second": 30.974,
54
- "eval_steps_per_second": 1.239,
55
- "eval_wer": 1.0,
56
- "step": 100
57
- },
58
- {
59
- "epoch": 1.54,
60
- "learning_rate": 0.0006346153846153846,
61
- "loss": 3.0159,
62
- "step": 120
63
- },
64
- {
65
- "epoch": 1.79,
66
- "learning_rate": 0.0006153846153846154,
67
- "loss": 2.977,
68
- "step": 140
69
- },
70
- {
71
- "epoch": 1.92,
72
- "eval_loss": 2.973355770111084,
73
- "eval_runtime": 3.1716,
74
- "eval_samples_per_second": 31.53,
75
- "eval_steps_per_second": 1.261,
76
- "eval_wer": 1.0,
77
- "step": 150
78
- },
79
- {
80
- "epoch": 2.05,
81
- "learning_rate": 0.0005961538461538461,
82
- "loss": 3.0056,
83
- "step": 160
84
- },
85
- {
86
- "epoch": 2.31,
87
- "learning_rate": 0.000576923076923077,
88
- "loss": 2.9591,
89
- "step": 180
90
- },
91
- {
92
- "epoch": 2.56,
93
- "learning_rate": 0.0005576923076923078,
94
- "loss": 2.9398,
95
- "step": 200
96
- },
97
- {
98
- "epoch": 2.56,
99
- "eval_loss": 2.940675735473633,
100
- "eval_runtime": 3.1691,
101
- "eval_samples_per_second": 31.554,
102
- "eval_steps_per_second": 1.262,
103
- "eval_wer": 1.0,
104
- "step": 200
105
- },
106
- {
107
- "epoch": 2.82,
108
- "learning_rate": 0.0005384615384615384,
109
- "loss": 2.9295,
110
- "step": 220
111
- },
112
- {
113
- "epoch": 3.08,
114
- "learning_rate": 0.0005192307692307692,
115
- "loss": 2.9465,
116
- "step": 240
117
- },
118
- {
119
- "epoch": 3.2,
120
- "eval_loss": 2.835913896560669,
121
- "eval_runtime": 3.1824,
122
- "eval_samples_per_second": 31.423,
123
- "eval_steps_per_second": 1.257,
124
- "eval_wer": 1.0,
125
- "step": 250
126
- },
127
- {
128
- "epoch": 3.33,
129
- "learning_rate": 0.0005,
130
- "loss": 2.9053,
131
- "step": 260
132
- },
133
- {
134
- "epoch": 3.59,
135
- "learning_rate": 0.0004807692307692308,
136
- "loss": 2.899,
137
- "step": 280
138
- },
139
- {
140
- "epoch": 3.84,
141
- "learning_rate": 0.0004615384615384616,
142
- "loss": 2.8861,
143
- "step": 300
144
- },
145
- {
146
- "epoch": 3.84,
147
- "eval_loss": 2.8373122215270996,
148
- "eval_runtime": 3.1455,
149
- "eval_samples_per_second": 31.791,
150
- "eval_steps_per_second": 1.272,
151
- "eval_wer": 1.0,
152
- "step": 300
153
- }
154
- ],
155
- "max_steps": 780,
156
- "num_train_epochs": 10,
157
- "total_flos": 4.5237874175174973e+18,
158
- "trial_name": null,
159
- "trial_params": null
160
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-300/training_args.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:31becb5e425437ea470512000be6c31bb502b71fe15942ff8cf0cc01eb8267a0
3
- size 3055
 
 
 
 
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3628cb625fb06fb9b5feb8070ed125a0961b552a86df1fcdcbb45d1703f7757f
3
  size 1262063089
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d76176b1de3e024882e5dc97f4c62f8c353ad6bd2bb044b8780d02f878d5a8b
3
  size 1262063089
run.sh CHANGED
@@ -6,13 +6,11 @@ python run_speech_recognition_ctc.py \
6
  --eval_split_name="test" \
7
  --output_dir="./" \
8
  --overwrite_output_dir \
9
- --num_train_epochs="10" \
10
  --per_device_train_batch_size="32" \
11
  --per_device_eval_batch_size="32" \
12
  --gradient_accumulation_steps="4" \
13
  --learning_rate="7.5e-4" \
14
- --max_train_samples="10000" \
15
- --max_eval_samples="100" \
16
  --warmup_ratio="0.02" \
17
  --length_column_name="input_length" \
18
  --evaluation_strategy="steps" \
@@ -40,27 +38,26 @@ python run_speech_recognition_ctc.py \
40
 
41
  python run_speech_recognition_ctc.py \
42
  --dataset_name="mozilla-foundation/common_voice_8_0" \
43
- --model_name_or_path="KBLab/wav2vec2-large-voxrex" \
44
  --dataset_config_name="sv-SE" \
45
  --train_split_name="train+validation" \
46
  --eval_split_name="test" \
47
  --output_dir="./" \
48
- --num_train_epochs="10" \
 
49
  --per_device_train_batch_size="32" \
50
  --per_device_eval_batch_size="32" \
51
  --gradient_accumulation_steps="4" \
52
  --learning_rate="7.5e-5" \
53
- --warmup_steps="400" \
54
- --max_train_samples="10000" \
55
- --max_eval_samples="100" \
56
  --length_column_name="input_length" \
57
  --evaluation_strategy="steps" \
58
  --save_strategy="steps" \
59
- --eval_steps="20" \
60
- --save_steps="20" \
61
  --text_column_name="sentence" \
62
  --chars_to_ignore , ? . ! \- \; \: \" β€œ % β€˜ ” οΏ½ β€” ’ … – \
63
- --logging_steps="10" \
64
  --layerdrop="0.0" \
65
  --activation_dropout="0.1" \
66
  --save_total_limit="2" \
 
6
  --eval_split_name="test" \
7
  --output_dir="./" \
8
  --overwrite_output_dir \
9
+ --num_train_epochs="3" \
10
  --per_device_train_batch_size="32" \
11
  --per_device_eval_batch_size="32" \
12
  --gradient_accumulation_steps="4" \
13
  --learning_rate="7.5e-4" \
 
 
14
  --warmup_ratio="0.02" \
15
  --length_column_name="input_length" \
16
  --evaluation_strategy="steps" \
 
38
 
39
  python run_speech_recognition_ctc.py \
40
  --dataset_name="mozilla-foundation/common_voice_8_0" \
41
+ --model_name_or_path="marinone94/xls-r-300m-sv-robust" \
42
  --dataset_config_name="sv-SE" \
43
  --train_split_name="train+validation" \
44
  --eval_split_name="test" \
45
  --output_dir="./" \
46
+ --overwrite_output_dir \
47
+ --num_train_epochs="50" \
48
  --per_device_train_batch_size="32" \
49
  --per_device_eval_batch_size="32" \
50
  --gradient_accumulation_steps="4" \
51
  --learning_rate="7.5e-5" \
52
+ --warmup_steps="2000" \
 
 
53
  --length_column_name="input_length" \
54
  --evaluation_strategy="steps" \
55
  --save_strategy="steps" \
56
+ --eval_steps="500" \
57
+ --save_steps="500" \
58
  --text_column_name="sentence" \
59
  --chars_to_ignore , ? . ! \- \; \: \" β€œ % β€˜ ” οΏ½ β€” ’ … – \
60
+ --logging_steps="100" \
61
  --layerdrop="0.0" \
62
  --activation_dropout="0.1" \
63
  --save_total_limit="2" \
special_tokens_map.json CHANGED
@@ -1 +1 @@
1
- {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]", "additional_special_tokens": [{"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}]}
 
1
+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]", "additional_special_tokens": [{"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}]}
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ad06bcea7129bc90fba0c606327162a14f89fd4622d165a2ff161b26e6fbb59e
3
  size 3055
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5806ee760f93397337bb9a8c9234fc7d900c26bb857abd80187ccde2f46dde70
3
  size 3055