blmoistawinde committed on
Commit
f121b87
1 Parent(s): 661a0fb

fix: bert->roformer

Browse files
Files changed (2) hide show
  1. config.json +4 -4
  2. pytorch_model.bin +2 -2
config.json CHANGED
@@ -1,11 +1,11 @@
1
  {
2
  "_name_or_path": "./chinese_roformer-sim-char-ft_L-12_H-768_A-12",
3
  "architectures": [
4
- "BertModel"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
- "classifier_dropout": null,
8
  "directionality": "bidi",
 
9
  "hidden_act": "gelu",
10
  "hidden_dropout_prob": 0.1,
11
  "hidden_size": 768,
@@ -13,7 +13,7 @@
13
  "intermediate_size": 3072,
14
  "layer_norm_eps": 1e-12,
15
  "max_position_embeddings": 512,
16
- "model_type": "bert",
17
  "num_attention_heads": 12,
18
  "num_hidden_layers": 12,
19
  "pad_token_id": 0,
@@ -22,7 +22,7 @@
22
  "pooler_num_fc_layers": 3,
23
  "pooler_size_per_head": 128,
24
  "pooler_type": "first_token_transform",
25
- "position_embedding_type": "absolute",
26
  "torch_dtype": "float32",
27
  "transformers_version": "4.19.3",
28
  "type_vocab_size": 2,
 
1
  {
2
  "_name_or_path": "./chinese_roformer-sim-char-ft_L-12_H-768_A-12",
3
  "architectures": [
4
+ "RoFormerModel"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
 
7
  "directionality": "bidi",
8
+ "embedding_size": 768,
9
  "hidden_act": "gelu",
10
  "hidden_dropout_prob": 0.1,
11
  "hidden_size": 768,
 
13
  "intermediate_size": 3072,
14
  "layer_norm_eps": 1e-12,
15
  "max_position_embeddings": 512,
16
+ "model_type": "roformer",
17
  "num_attention_heads": 12,
18
  "num_hidden_layers": 12,
19
  "pad_token_id": 0,
 
22
  "pooler_num_fc_layers": 3,
23
  "pooler_size_per_head": 128,
24
  "pooler_type": "first_token_transform",
25
+ "rotary_value": false,
26
  "torch_dtype": "float32",
27
  "transformers_version": "4.19.3",
28
  "type_vocab_size": 2,
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1a9bbc01a62c05c0f25c417f74da08d60eaac656e4f3bde4c6e833acda54ecac
3
- size 381095985
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf20794ca35c4c5706d2496bae0c0f362b75c67cc3c588cc69aa98688fb608b1
3
+ size 377286775