awlassche committed on
Commit
090da5b
·
verified ·
1 Parent(s): b72d9d9

gender-play-gysbert-4b

Browse files
Files changed (3) hide show
  1. README.md +9 -10
  2. config.json +5 -4
  3. model.safetensors +2 -2
README.md CHANGED
@@ -1,6 +1,5 @@
1
  ---
2
- license: mit
3
- base_model: emanjavacas/GysBERT
4
  tags:
5
  - generated_from_trainer
6
  metrics:
@@ -15,10 +14,10 @@ should probably proofread and complete it, then remove this comment. -->
15
 
16
  # results
17
 
18
- This model is a fine-tuned version of [emanjavacas/GysBERT](https://huggingface.co/emanjavacas/GysBERT) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
- - Loss: 0.6299
21
- - Accuracy: 0.6589
22
 
23
  ## Model description
24
 
@@ -49,14 +48,14 @@ The following hyperparameters were used during training:
49
 
50
  | Training Loss | Epoch | Step | Validation Loss | Accuracy |
51
  |:-------------:|:------:|:----:|:---------------:|:--------:|
52
- | 0.7228 | 0.7143 | 100 | 0.6931 | 0.4875 |
53
- | 0.7043 | 1.4286 | 200 | 0.6834 | 0.5357 |
54
- | 0.6531 | 2.1429 | 300 | 0.6321 | 0.6482 |
55
- | 0.5927 | 2.8571 | 400 | 0.6299 | 0.6589 |
56
 
57
 
58
  ### Framework versions
59
 
60
- - Transformers 4.41.1
61
  - Pytorch 2.3.0+cu121
62
  - Tokenizers 0.19.1
 
1
  ---
2
+ base_model: GroNLP/bert-base-dutch-cased
 
3
  tags:
4
  - generated_from_trainer
5
  metrics:
 
14
 
15
  # results
16
 
17
+ This model is a fine-tuned version of [GroNLP/bert-base-dutch-cased](https://huggingface.co/GroNLP/bert-base-dutch-cased) on an unknown dataset.
18
  It achieves the following results on the evaluation set:
19
+ - Loss: 0.9758
20
+ - Accuracy: 0.6464
21
 
22
  ## Model description
23
 
 
48
 
49
  | Training Loss | Epoch | Step | Validation Loss | Accuracy |
50
  |:-------------:|:------:|:----:|:---------------:|:--------:|
51
+ | 0.6817 | 0.7143 | 100 | 0.6938 | 0.5696 |
52
+ | 0.5836 | 1.4286 | 200 | 0.7187 | 0.6286 |
53
+ | 0.4291 | 2.1429 | 300 | 0.8203 | 0.6625 |
54
+ | 0.2009 | 2.8571 | 400 | 0.9758 | 0.6464 |
55
 
56
 
57
  ### Framework versions
58
 
59
+ - Transformers 4.41.2
60
  - Pytorch 2.3.0+cu121
61
  - Tokenizers 0.19.1
config.json CHANGED
@@ -1,10 +1,11 @@
1
  {
2
- "_name_or_path": "emanjavacas/GysBERT",
3
  "architectures": [
4
  "BertForSequenceClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "classifier_dropout": null,
 
8
  "hidden_act": "gelu",
9
  "hidden_dropout_prob": 0.1,
10
  "hidden_size": 768,
@@ -15,12 +16,12 @@
15
  "model_type": "bert",
16
  "num_attention_heads": 12,
17
  "num_hidden_layers": 12,
18
- "pad_token_id": 0,
19
  "position_embedding_type": "absolute",
20
  "problem_type": "single_label_classification",
21
  "torch_dtype": "float32",
22
- "transformers_version": "4.41.1",
23
  "type_vocab_size": 2,
24
  "use_cache": true,
25
- "vocab_size": 30522
26
  }
 
1
  {
2
+ "_name_or_path": "GroNLP/bert-base-dutch-cased",
3
  "architectures": [
4
  "BertForSequenceClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "classifier_dropout": null,
8
+ "gradient_checkpointing": false,
9
  "hidden_act": "gelu",
10
  "hidden_dropout_prob": 0.1,
11
  "hidden_size": 768,
 
16
  "model_type": "bert",
17
  "num_attention_heads": 12,
18
  "num_hidden_layers": 12,
19
+ "pad_token_id": 3,
20
  "position_embedding_type": "absolute",
21
  "problem_type": "single_label_classification",
22
  "torch_dtype": "float32",
23
+ "transformers_version": "4.41.2",
24
  "type_vocab_size": 2,
25
  "use_cache": true,
26
+ "vocab_size": 30073
27
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0294e5461fbfb174835f4e5191f3f4eb59b4801a9fbff17d30ad23011e8d7d3c
3
- size 437958648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b07394ba5d96ca47525d8f544181e8ab4d5e5a78db69e872439b7fd1bb42bf1
3
+ size 436579312