Pisethan committed on
Commit
2e904fd
·
verified ·
1 Parent(s): d4c62d0

Upload XLMRobertaForSequenceClassification

Browse files
Files changed (2) hide show
  1. config.json +16 -10
  2. model.safetensors +2 -2
config.json CHANGED
@@ -1,11 +1,12 @@
1
  {
2
  "_name_or_path": "./sangapac-math-model",
3
  "architectures": [
4
- "BertForSequenceClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
 
7
  "classifier_dropout": null,
8
- "gradient_checkpointing": false,
9
  "hidden_act": "gelu",
10
  "hidden_dropout_prob": 0.1,
11
  "hidden_size": 768,
@@ -13,7 +14,9 @@
13
  "0": "LABEL_0",
14
  "1": "LABEL_1",
15
  "2": "LABEL_2",
16
- "3": "LABEL_3"
 
 
17
  },
18
  "initializer_range": 0.02,
19
  "intermediate_size": 3072,
@@ -21,19 +24,22 @@
21
  "LABEL_0": 0,
22
  "LABEL_1": 1,
23
  "LABEL_2": 2,
24
- "LABEL_3": 3
 
 
25
  },
26
- "layer_norm_eps": 1e-12,
27
- "max_position_embeddings": 512,
28
- "model_type": "bert",
29
  "num_attention_heads": 12,
30
  "num_hidden_layers": 12,
31
- "pad_token_id": 0,
 
32
  "position_embedding_type": "absolute",
33
  "problem_type": "single_label_classification",
34
  "torch_dtype": "float32",
35
  "transformers_version": "4.46.2",
36
- "type_vocab_size": 2,
37
  "use_cache": true,
38
- "vocab_size": 30522
39
  }
 
1
  {
2
  "_name_or_path": "./sangapac-math-model",
3
  "architectures": [
4
+ "XLMRobertaForSequenceClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
  "classifier_dropout": null,
9
+ "eos_token_id": 2,
10
  "hidden_act": "gelu",
11
  "hidden_dropout_prob": 0.1,
12
  "hidden_size": 768,
 
14
  "0": "LABEL_0",
15
  "1": "LABEL_1",
16
  "2": "LABEL_2",
17
+ "3": "LABEL_3",
18
+ "4": "LABEL_4",
19
+ "5": "LABEL_5"
20
  },
21
  "initializer_range": 0.02,
22
  "intermediate_size": 3072,
 
24
  "LABEL_0": 0,
25
  "LABEL_1": 1,
26
  "LABEL_2": 2,
27
+ "LABEL_3": 3,
28
+ "LABEL_4": 4,
29
+ "LABEL_5": 5
30
  },
31
+ "layer_norm_eps": 1e-05,
32
+ "max_position_embeddings": 514,
33
+ "model_type": "xlm-roberta",
34
  "num_attention_heads": 12,
35
  "num_hidden_layers": 12,
36
+ "output_past": true,
37
+ "pad_token_id": 1,
38
  "position_embedding_type": "absolute",
39
  "problem_type": "single_label_classification",
40
  "torch_dtype": "float32",
41
  "transformers_version": "4.46.2",
42
+ "type_vocab_size": 1,
43
  "use_cache": true,
44
+ "vocab_size": 250002
45
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:301433b751ac4fb849bf30b12420c78ed039dd384d61fb384d113fc2147a73d9
3
- size 437964800
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6249813a6f00098952e1ed83f3f374b2ced66cd8297f10271ec66841f3befe2
3
+ size 1112217312