End of training

Browse files

Files changed (7) hide show

README.md +16 -16
config.json +2 -2
model.safetensors +1 -1
runs/Feb23_16-22-54_dgx10/events.out.tfevents.1740324187.dgx10.4171446.0 +3 -0
runs/Feb23_16-33-39_dgx10/events.out.tfevents.1740324822.dgx10.4171446.1 +3 -0
runs/Feb23_16-33-39_dgx10/events.out.tfevents.1740366134.dgx10.4171446.2 +3 -0
training_args.bin +1 -1

README.md CHANGED Viewed

@@ -20,14 +20,14 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [xlm-roberta-large](https://huggingface.co/xlm-roberta-large) on the generator dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.4441
-- Accuracy: 0.9035
-- Micro Precision: 0.9035
-- Micro Recall: 0.9035
-- Micro F1: 0.9035
-- Macro Precision: 0.8681
-- Macro Recall: 0.8564
-- Macro F1: 0.8581
 ## Model description
@@ -61,14 +61,14 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch | Step   | Validation Loss | Accuracy | Micro Precision | Micro Recall | Micro F1 | Macro Precision | Macro Recall | Macro F1 |
 |:-------------:|:-----:|:------:|:---------------:|:--------:|:---------------:|:------------:|:--------:|:---------------:|:------------:|:--------:|
-| 0.506         | 1.0   | 15074  | 0.4465          | 0.8717   | 0.8717          | 0.8717       | 0.8717   | 0.8315          | 0.8249       | 0.8189   |
-| 0.4444        | 2.0   | 30148  | 0.4104          | 0.8797   | 0.8797          | 0.8797       | 0.8797   | 0.8369          | 0.8384       | 0.8268   |
-| 0.347         | 3.0   | 45222  | 0.3999          | 0.8918   | 0.8918          | 0.8918       | 0.8918   | 0.8593          | 0.8470       | 0.8458   |
-| 0.3004        | 4.0   | 60296  | 0.3732          | 0.8989   | 0.8989          | 0.8989       | 0.8989   | 0.8569          | 0.8628       | 0.8552   |
-| 0.2735        | 5.0   | 75370  | 0.3913          | 0.9013   | 0.9013          | 0.9013       | 0.9013   | 0.8596          | 0.8643       | 0.8569   |
-| 0.2294        | 6.0   | 90444  | 0.4118          | 0.9035   | 0.9035          | 0.9035       | 0.9035   | 0.8647          | 0.8730       | 0.8643   |
-| 0.187         | 7.0   | 105518 | 0.4153          | 0.9051   | 0.9051          | 0.9051       | 0.9051   | 0.8703          | 0.8743       | 0.8680   |
-| 0.172         | 8.0   | 120592 | 0.4362          | 0.9048   | 0.9048          | 0.9048       | 0.9048   | 0.8653          | 0.8723       | 0.8637   |
 ### Framework versions

 This model is a fine-tuned version of [xlm-roberta-large](https://huggingface.co/xlm-roberta-large) on the generator dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.6614
+- Accuracy: 0.9100
+- Micro Precision: 0.9100
+- Micro Recall: 0.9100
+- Micro F1: 0.9100
+- Macro Precision: 0.8823
+- Macro Recall: 0.8656
+- Macro F1: 0.8703
 ## Model description
 | Training Loss | Epoch | Step   | Validation Loss | Accuracy | Micro Precision | Micro Recall | Micro F1 | Macro Precision | Macro Recall | Macro F1 |
 |:-------------:|:-----:|:------:|:---------------:|:--------:|:---------------:|:------------:|:--------:|:---------------:|:------------:|:--------:|
+| 0.4142        | 1.0   | 15074  | 0.3827          | 0.8873   | 0.8873          | 0.8873       | 0.8873   | 0.8729          | 0.8334       | 0.8429   |
+| 0.3407        | 2.0   | 30148  | 0.3548          | 0.8965   | 0.8965          | 0.8965       | 0.8965   | 0.8663          | 0.8600       | 0.8586   |
+| 0.2327        | 3.0   | 45222  | 0.3800          | 0.9015   | 0.9015          | 0.9015       | 0.9015   | 0.8816          | 0.8550       | 0.8623   |
+| 0.1701        | 4.0   | 60296  | 0.4035          | 0.9062   | 0.9062          | 0.9062       | 0.9062   | 0.8730          | 0.8707       | 0.8684   |
+| 0.1281        | 5.0   | 75370  | 0.4522          | 0.9109   | 0.9109          | 0.9109       | 0.9109   | 0.8751          | 0.8833       | 0.8755   |
+| 0.1007        | 6.0   | 90444  | 0.5409          | 0.9109   | 0.9109          | 0.9109       | 0.9109   | 0.8741          | 0.8776       | 0.8723   |
+| 0.0598        | 7.0   | 105518 | 0.5965          | 0.9115   | 0.9115          | 0.9115       | 0.9115   | 0.8773          | 0.8803       | 0.8751   |
+| 0.0519        | 8.0   | 120592 | 0.6388          | 0.9131   | 0.9131          | 0.9131       | 0.9131   | 0.8736          | 0.8817       | 0.8738   |
 ### Framework versions

config.json CHANGED Viewed

@@ -3,12 +3,12 @@
   "architectures": [
     "RelationExtractionModel"
   ],
-  "attention_probs_dropout_prob": 0.25,
   "bos_token_id": 0,
   "classifier_dropout": null,
   "eos_token_id": 2,
   "hidden_act": "gelu",
-  "hidden_dropout_prob": 0.25,
   "hidden_size": 1024,
   "id2label": {
     "0": "P0 other",

   "architectures": [
     "RelationExtractionModel"
   ],
+  "attention_probs_dropout_prob": 0.1,
   "bos_token_id": 0,
   "classifier_dropout": null,
   "eos_token_id": 2,
   "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
   "hidden_size": 1024,
   "id2label": {
     "0": "P0 other",

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:263ed6385608569ac4c500dd907e5be45793f820784b0733c36ec8fc886dd32f
 size 2240416848

 version https://git-lfs.github.com/spec/v1
+oid sha256:4ed12f364660765f2470d20feaf19e2103a3bd41d4ce62f125489e8ed1951dd7
 size 2240416848

runs/Feb23_16-22-54_dgx10/events.out.tfevents.1740324187.dgx10.4171446.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:84d484c536cb07053e5b4c30adecb67acec8f6498e2ddc07d783ff08c948f5d6
+size 10718

runs/Feb23_16-33-39_dgx10/events.out.tfevents.1740324822.dgx10.4171446.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:34b8d63aa71c5022bd24016090246ad90f736b9d172a5f671513523f5dfad20d
+size 67238

runs/Feb23_16-33-39_dgx10/events.out.tfevents.1740366134.dgx10.4171446.2 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ce362229c2976044013002cb440c66e42ab14a5809228e03462689c76f416a76
+size 757

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b873ac0ed7c7180499ed7d0365eda1bcfba9f27ad41b0f08c7fbd9d29f25c37b
 size 5304

 version https://git-lfs.github.com/spec/v1
+oid sha256:304663f5f22a482e5f26a27058b5ec70058f0998a6ee6e274b1ea399fcde2625
 size 5304