HoangHa committed
Commit b6b3c64
1 Parent(s): 090b768

Saving weights and logs of epoch 2

epoch_2/config.json CHANGED
@@ -1,26 +1,25 @@
 {
-  "_name_or_path": "roberta-base",
   "architectures": [
     "RobertaForMaskedLM"
   ],
   "attention_probs_dropout_prob": 0.1,
   "bos_token_id": 0,
-  "classifier_dropout": null,
+  "classifier_dropout": 0.1,
   "eos_token_id": 2,
   "hidden_act": "gelu",
   "hidden_dropout_prob": 0.1,
   "hidden_size": 768,
   "initializer_range": 0.02,
   "intermediate_size": 3072,
-  "layer_norm_eps": 1e-05,
-  "max_position_embeddings": 514,
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 130,
   "model_type": "roberta",
   "num_attention_heads": 12,
   "num_hidden_layers": 12,
   "pad_token_id": 1,
   "position_embedding_type": "absolute",
   "transformers_version": "4.20.0",
-  "type_vocab_size": 1,
+  "type_vocab_size": 2,
   "use_cache": true,
-  "vocab_size": 50265
+  "vocab_size": 3132
 }
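The new config drops the roberta-base provenance and points to a from-scratch pretraining setup: a 3,132-token vocabulary and 130 position embeddings (RoBERTa reserves two offset slots, so this corresponds to 128-token sequences), with BERT-style layer_norm_eps and type_vocab_size. A minimal sketch of loading this epoch's checkpoint, assuming a local clone of the repo with the LFS weights pulled; the printed values come from the diff above:

import jax  # transformers' Flax models run on JAX
from transformers import RobertaConfig, FlaxRobertaForMaskedLM

# Parse the updated config committed in this change.
config = RobertaConfig.from_json_file("epoch_2/config.json")
print(config.vocab_size, config.max_position_embeddings)  # 3132 130

# from_pretrained on the directory picks up flax_model.msgpack
# alongside config.json.
model = FlaxRobertaForMaskedLM.from_pretrained("epoch_2")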
epoch_2/flax_model.msgpack CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6f016afd7d6e0f852d85469fd98eebe11db3d079ba58b15ea859bf8363fab4f3
+oid sha256:390abddfa1b8f447f1b0ea7a3710ec3f866008662d7586b7eae5e3bf18ed46d8
 size 352639294
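Only the Git LFS pointer file changes in the commit itself; the 352 MB weight blob lives in LFS storage, keyed by the sha256 oid in the pointer. A quick way to check that a pulled file matches its pointer (lfs_oid is a hypothetical helper, not part of this repo):

import hashlib

def lfs_oid(path: str, chunk_size: int = 1 << 20) -> str:
    """Compute the sha256 digest Git LFS records as the pointer's oid."""
    h = hashlib.sha256()
    with open(path, "rb") as f:
        for chunk in iter(lambda: f.read(chunk_size), b""):
            h.update(chunk)
    return h.hexdigest()

# After `git lfs pull`, this should print the new oid from the diff:
# 390abddfa1b8f447f1b0ea7a3710ec3f866008662d7586b7eae5e3bf18ed46d8
print(lfs_oid("epoch_2/flax_model.msgpack"))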