End of training

Browse files

Files changed (6) hide show

README.md +73 -0
config.json +51 -0
model.safetensors +3 -0
runs/Jun19_18-19-29_817494848e48/events.out.tfevents.1718821174.817494848e48.5078.0 +3 -0
runs/Jun19_18-21-25_817494848e48/events.out.tfevents.1718821288.817494848e48.5842.0 +3 -0
training_args.bin +3 -0

README.md ADDED Viewed

	@@ -0,0 +1,73 @@

+---
+license: mit
+base_model: indobenchmark/indobert-large-p2
+tags:
+- generated_from_trainer
+model-index:
+- name: pertama
+  results: []
+---
+<!-- This model card has been generated automatically according to the information the Trainer had access to. You
+should probably proofread and complete it, then remove this comment. -->
+# pertama
+This model is a fine-tuned version of [indobenchmark/indobert-large-p2](https://huggingface.co/indobenchmark/indobert-large-p2) on an unspecified dataset (no dataset name was recorded by the Trainer).
+It achieves the following results on the evaluation set:
+- Loss: 2.4507
+- F1 macro: 0.4131
+- Weighted: 0.5840
+- Balanced accuracy: 0.5423
+## Model description
+More information needed
+## Intended uses & limitations
+More information needed
+## Training and evaluation data
+More information needed
+## Training procedure
+### Training hyperparameters
+The following hyperparameters were used during training:
+- learning_rate: 1e-05
+- train_batch_size: 8
+- eval_batch_size: 8
+- seed: 42
+- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
+- lr_scheduler_type: linear
+- num_epochs: 14
+### Training results
+| Training Loss | Epoch | Step | Validation Loss | F1 macro | Weighted | Balanced accuracy |
+|:-------------:|:-----:|:----:|:---------------:|:--------:|:--------:|:-----------------:|
+| 1.3416        | 1.0   | 154  | 1.5603          | 0.2942   | 0.3462   | 0.4357            |
+| 0.941         | 2.0   | 308  | 1.3408          | 0.3530   | 0.5202   | 0.4807            |
+| 0.6965        | 3.0   | 462  | 1.3731          | 0.3747   | 0.5629   | 0.5101            |
+| 0.4375        | 4.0   | 616  | 1.3137          | 0.3904   | 0.5961   | 0.5002            |
+| 0.2491        | 5.0   | 770  | 1.5577          | 0.3772   | 0.5930   | 0.4978            |
+| 0.0793        | 6.0   | 924  | 2.1326          | 0.3923   | 0.5382   | 0.5401            |
+| 0.0488        | 7.0   | 1078 | 2.2000          | 0.3861   | 0.5483   | 0.5243            |
+| 0.0206        | 8.0   | 1232 | 2.1568          | 0.3914   | 0.5873   | 0.5096            |
+| 0.0243        | 9.0   | 1386 | 2.2272          | 0.4118   | 0.5851   | 0.5457            |
+| 0.0126        | 10.0  | 1540 | 2.3494          | 0.4029   | 0.5885   | 0.5346            |
+| 0.0449        | 11.0  | 1694 | 2.2914          | 0.4115   | 0.6037   | 0.5387            |
+| 0.0023        | 12.0  | 1848 | 2.5714          | 0.3962   | 0.5675   | 0.5334            |
+| 0.0023        | 13.0  | 2002 | 2.4491          | 0.4155   | 0.5878   | 0.5400            |
+| 0.0024        | 14.0  | 2156 | 2.4507          | 0.4131   | 0.5840   | 0.5423            |
+### Framework versions
+- Transformers 4.41.2
+- Pytorch 2.3.0+cu121
+- Datasets 2.20.0
+- Tokenizers 0.19.1

config.json ADDED Viewed

	@@ -0,0 +1,51 @@

+{
+  "_name_or_path": "indobenchmark/indobert-large-p2",
+  "_num_labels": 8,
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "directionality": "bidi",
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 1024,
+  "id2label": {
+    "0": "Sumber Daya Alam",
+    "1": "Politik",
+    "2": "Demografi",
+    "3": "Pertahanan dan Keamanan",
+    "4": "Ideologi",
+    "5": "Ekonomi",
+    "6": "Sosial Budaya",
+    "7": "Geografi"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 4096,
+  "label2id": {
+    "Demografi": 2,
+    "Ekonomi": 5,
+    "Geografi": 7,
+    "Ideologi": 4,
+    "Pertahanan dan Keamanan": 3,
+    "Politik": 1,
+    "Sosial Budaya": 6,
+    "Sumber Daya Alam": 0
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 16,
+  "num_hidden_layers": 24,
+  "output_past": true,
+  "pad_token_id": 0,
+  "pooler_fc_size": 768,
+  "pooler_num_attention_heads": 12,
+  "pooler_num_fc_layers": 3,
+  "pooler_size_per_head": 128,
+  "pooler_type": "first_token_transform",
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.41.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2d6c1bcd5e17797eeea5714de26ca4d87669e0e51d7f16531bd9866eea53295b
+size 1340647360

runs/Jun19_18-19-29_817494848e48/events.out.tfevents.1718821174.817494848e48.5078.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:516d1966d0e18f8e9b28294619c90da0427e3ec8084e75529867e4c411c53c3c
+size 6146

runs/Jun19_18-21-25_817494848e48/events.out.tfevents.1718821288.817494848e48.5842.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bd9bb7b19e1ec39c0885dd9a8ba0f849b52e9291ffd63678ecba849829d4a9e6
+size 57093

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:258efb47016f9103428380b1f9e4c7bf63d264c9c838fc35c6d9d2e2e670678c
+size 5112