albertmartinez committed on
Commit
bfc98df
1 Parent(s): 5a5916f

Training in progress, step 500

Browse files
Files changed (5)
  1. config.json +39 -34
  2. model.safetensors +1 -1
  3. tokenizer.json +16 -2
  4. tokenizer_config.json +0 -2
  5. training_args.bin +2 -2
config.json CHANGED
@@ -1,52 +1,52 @@
1
  {
2
- "_name_or_path": "bert-base-multilingual-uncased",
3
- "_num_labels": 16,
4
  "architectures": [
5
  "BertForSequenceClassification"
6
  ],
7
  "attention_probs_dropout_prob": 0.1,
8
  "classifier_dropout": null,
9
- "gradient_checkpointing": false,
 
10
  "hidden_act": "gelu",
11
  "hidden_dropout_prob": 0.1,
12
  "hidden_size": 768,
13
  "id2label": {
14
  "0": "sdg1",
15
- "1": "sdg2",
16
- "2": "sdg3",
17
- "3": "sdg4",
18
- "4": "sdg5",
19
- "5": "sdg6",
20
- "6": "sdg7",
21
- "7": "sdg8",
22
- "8": "sdg9",
23
- "9": "sdg10",
24
- "10": "sdg11",
25
- "11": "sdg12",
26
- "12": "sdg13",
27
- "13": "sdg14",
28
- "14": "sdg15",
29
- "15": "sdg16"
30
  },
31
  "initializer_range": 0.02,
32
  "intermediate_size": 3072,
33
  "label2id": {
34
  "sdg1": 0,
35
- "sdg10": 9,
36
- "sdg11": 10,
37
- "sdg12": 11,
38
- "sdg13": 12,
39
- "sdg14": 13,
40
- "sdg15": 14,
41
- "sdg16": 15,
42
- "sdg2": 1,
43
- "sdg3": 2,
44
- "sdg4": 3,
45
- "sdg5": 4,
46
- "sdg6": 5,
47
- "sdg7": 6,
48
- "sdg8": 7,
49
- "sdg9": 8
50
  },
51
  "layer_norm_eps": 1e-12,
52
  "max_position_embeddings": 512,
@@ -54,10 +54,15 @@
54
  "num_attention_heads": 12,
55
  "num_hidden_layers": 12,
56
  "pad_token_id": 0,
 
 
 
 
 
57
  "position_embedding_type": "absolute",
58
  "problem_type": "single_label_classification",
59
  "torch_dtype": "float32",
60
- "transformers_version": "4.40.0",
61
  "type_vocab_size": 2,
62
  "use_cache": true,
63
  "vocab_size": 105879
 
1
  {
2
+ "_name_or_path": "google-bert/bert-base-multilingual-uncased",
 
3
  "architectures": [
4
  "BertForSequenceClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "classifier_dropout": null,
8
+ "directionality": "bidi",
9
+ "finetuning_task": "text-classification",
10
  "hidden_act": "gelu",
11
  "hidden_dropout_prob": 0.1,
12
  "hidden_size": 768,
13
  "id2label": {
14
  "0": "sdg1",
15
+ "1": "sdg10",
16
+ "2": "sdg11",
17
+ "3": "sdg12",
18
+ "4": "sdg13",
19
+ "5": "sdg14",
20
+ "6": "sdg15",
21
+ "7": "sdg16",
22
+ "8": "sdg2",
23
+ "9": "sdg3",
24
+ "10": "sdg4",
25
+ "11": "sdg5",
26
+ "12": "sdg6",
27
+ "13": "sdg7",
28
+ "14": "sdg8",
29
+ "15": "sdg9"
30
  },
31
  "initializer_range": 0.02,
32
  "intermediate_size": 3072,
33
  "label2id": {
34
  "sdg1": 0,
35
+ "sdg10": 1,
36
+ "sdg11": 2,
37
+ "sdg12": 3,
38
+ "sdg13": 4,
39
+ "sdg14": 5,
40
+ "sdg15": 6,
41
+ "sdg16": 7,
42
+ "sdg2": 8,
43
+ "sdg3": 9,
44
+ "sdg4": 10,
45
+ "sdg5": 11,
46
+ "sdg6": 12,
47
+ "sdg7": 13,
48
+ "sdg8": 14,
49
+ "sdg9": 15
50
  },
51
  "layer_norm_eps": 1e-12,
52
  "max_position_embeddings": 512,
 
54
  "num_attention_heads": 12,
55
  "num_hidden_layers": 12,
56
  "pad_token_id": 0,
57
+ "pooler_fc_size": 768,
58
+ "pooler_num_attention_heads": 12,
59
+ "pooler_num_fc_layers": 3,
60
+ "pooler_size_per_head": 128,
61
+ "pooler_type": "first_token_transform",
62
  "position_embedding_type": "absolute",
63
  "problem_type": "single_label_classification",
64
  "torch_dtype": "float32",
65
+ "transformers_version": "4.42.4",
66
  "type_vocab_size": 2,
67
  "use_cache": true,
68
  "vocab_size": 105879
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ec796ee78f016d404eb75c66d4f685952dde16e8cd9085b308829856b7bd319a
3
  size 669498432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:516fea04f25059c326209a4030621c6fcdc999a068f0ed2c13d162f42114d52b
3
  size 669498432
tokenizer.json CHANGED
@@ -1,7 +1,21 @@
1
  {
2
  "version": "1.0",
3
- "truncation": null,
4
- "padding": null,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  "added_tokens": [
6
  {
7
  "id": 0,
 
1
  {
2
  "version": "1.0",
3
+ "truncation": {
4
+ "direction": "Right",
5
+ "max_length": 512,
6
+ "strategy": "LongestFirst",
7
+ "stride": 0
8
+ },
9
+ "padding": {
10
+ "strategy": {
11
+ "Fixed": 512
12
+ },
13
+ "direction": "Right",
14
+ "pad_to_multiple_of": null,
15
+ "pad_id": 0,
16
+ "pad_type_id": 0,
17
+ "pad_token": "[PAD]"
18
+ },
19
  "added_tokens": [
20
  {
21
  "id": 0,
tokenizer_config.json CHANGED
@@ -43,11 +43,9 @@
43
  },
44
  "clean_up_tokenization_spaces": true,
45
  "cls_token": "[CLS]",
46
- "do_basic_tokenize": true,
47
  "do_lower_case": true,
48
  "mask_token": "[MASK]",
49
  "model_max_length": 512,
50
- "never_split": null,
51
  "pad_token": "[PAD]",
52
  "sep_token": "[SEP]",
53
  "strip_accents": null,
 
43
  },
44
  "clean_up_tokenization_spaces": true,
45
  "cls_token": "[CLS]",
 
46
  "do_lower_case": true,
47
  "mask_token": "[MASK]",
48
  "model_max_length": 512,
 
49
  "pad_token": "[PAD]",
50
  "sep_token": "[SEP]",
51
  "strip_accents": null,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:083cc43ec3c52d3d3f2909320ed7dfdd4cd56397a51ee1512c3811ac2a1fd11a
3
- size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7373b46fe45f2e461bb25799d911cf82ba24f3261a11f2d574c0c2008eafc1a0
3
+ size 5240