Connor Finley committed on
Commit
686253f
1 Parent(s): 3b1e5ca
README.md CHANGED
@@ -16,7 +16,7 @@ model_index:
16
  metric:
17
  name: Accuracy
18
  type: accuracy
19
- value: 0.9860828488372093
20
  ---
21
 
22
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -26,11 +26,11 @@ should probably proofread and complete it, then remove this comment. -->
26
 
27
  This model is a fine-tuned version of [camembert-base](https://huggingface.co/camembert-base) on an unknown dataset.
28
  It achieves the following results on the evaluation set:
29
- - Loss: 0.0503
30
- - Precision: 0.9333
31
- - Recall: 0.9275
32
- - F1: 0.9304
33
- - Accuracy: 0.9861
34
 
35
  ## Model description
36
 
16
  metric:
17
  name: Accuracy
18
  type: accuracy
19
+ value: 0.991500810518732
20
  ---
21
 
22
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
26
 
27
  This model is a fine-tuned version of [camembert-base](https://huggingface.co/camembert-base) on an unknown dataset.
28
  It achieves the following results on the evaluation set:
29
+ - Loss: 0.0301
30
+ - Precision: 0.9601
31
+ - Recall: 0.9527
32
+ - F1: 0.9564
33
+ - Accuracy: 0.9915
34
 
35
  ## Model description
36
 
all_results.json CHANGED
@@ -1,25 +1,25 @@
1
  {
2
  "epoch": 3.0,
3
- "eval_accuracy": 0.9860828488372093,
4
- "eval_f1": 0.9304015991277484,
5
- "eval_loss": 0.05031319707632065,
6
- "eval_precision": 0.9332847247539191,
7
- "eval_recall": 0.927536231884058,
8
- "eval_runtime": 3.16,
9
- "eval_samples": 430,
10
- "eval_samples_per_second": 136.078,
11
- "eval_steps_per_second": 17.089,
12
- "predict_accuracy": 0.9901502991390632,
13
- "predict_f1": 0.952212389380531,
14
- "predict_loss": 0.03813100978732109,
15
- "predict_precision": 0.9662356321839081,
16
- "predict_recall": 0.9385903698534543,
17
- "predict_runtime": 3.1212,
18
- "predict_samples_per_second": 137.449,
19
- "predict_steps_per_second": 17.301,
20
- "train_loss": 0.059730371578719264,
21
- "train_runtime": 194.0601,
22
- "train_samples": 3434,
23
- "train_samples_per_second": 53.087,
24
- "train_steps_per_second": 3.324
25
  }
1
  {
2
  "epoch": 3.0,
3
+ "eval_accuracy": 0.991500810518732,
4
+ "eval_f1": 0.9564196794489446,
5
+ "eval_loss": 0.03012062981724739,
6
+ "eval_precision": 0.9601328903654485,
7
+ "eval_recall": 0.9527350787748687,
8
+ "eval_runtime": 30.7406,
9
+ "eval_samples": 4164,
10
+ "eval_samples_per_second": 135.456,
11
+ "eval_steps_per_second": 16.948,
12
+ "predict_accuracy": 0.9907505424296343,
13
+ "predict_f1": 0.952959144711722,
14
+ "predict_loss": 0.03142160549759865,
15
+ "predict_precision": 0.9562085743841232,
16
+ "predict_recall": 0.9497317249514822,
17
+ "predict_runtime": 31.6681,
18
+ "predict_samples_per_second": 131.457,
19
+ "predict_steps_per_second": 16.452,
20
+ "train_loss": 0.02315408722391657,
21
+ "train_runtime": 2017.0522,
22
+ "train_samples": 33304,
23
+ "train_samples_per_second": 49.534,
24
+ "train_steps_per_second": 3.097
25
  }
eval_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
  "epoch": 3.0,
3
- "eval_accuracy": 0.9860828488372093,
4
- "eval_f1": 0.9304015991277484,
5
- "eval_loss": 0.05031319707632065,
6
- "eval_precision": 0.9332847247539191,
7
- "eval_recall": 0.927536231884058,
8
- "eval_runtime": 3.16,
9
- "eval_samples": 430,
10
- "eval_samples_per_second": 136.078,
11
- "eval_steps_per_second": 17.089
12
  }
1
  {
2
  "epoch": 3.0,
3
+ "eval_accuracy": 0.991500810518732,
4
+ "eval_f1": 0.9564196794489446,
5
+ "eval_loss": 0.03012062981724739,
6
+ "eval_precision": 0.9601328903654485,
7
+ "eval_recall": 0.9527350787748687,
8
+ "eval_runtime": 30.7406,
9
+ "eval_samples": 4164,
10
+ "eval_samples_per_second": 135.456,
11
+ "eval_steps_per_second": 16.948
12
  }
predict_results.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "predict_accuracy": 0.9901502991390632,
3
- "predict_f1": 0.952212389380531,
4
- "predict_loss": 0.03813100978732109,
5
- "predict_precision": 0.9662356321839081,
6
- "predict_recall": 0.9385903698534543,
7
- "predict_runtime": 3.1212,
8
- "predict_samples_per_second": 137.449,
9
- "predict_steps_per_second": 17.301
10
  }
1
  {
2
+ "predict_accuracy": 0.9907505424296343,
3
+ "predict_f1": 0.952959144711722,
4
+ "predict_loss": 0.03142160549759865,
5
+ "predict_precision": 0.9562085743841232,
6
+ "predict_recall": 0.9497317249514822,
7
+ "predict_runtime": 31.6681,
8
+ "predict_samples_per_second": 131.457,
9
+ "predict_steps_per_second": 16.452
10
  }
predictions.txt CHANGED
The diff for this file is too large to render. See raw diff
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c841421b4991274dd8f2e12a18211934ea8b410a43b579a231ceaac23e3e5745
3
  size 440216305
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:799b6c8692bf8a5e41950b41508032b2c1a06cffe87aa6d980d208ade3975d39
3
  size 440216305
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 3.0,
3
- "train_loss": 0.059730371578719264,
4
- "train_runtime": 194.0601,
5
- "train_samples": 3434,
6
- "train_samples_per_second": 53.087,
7
- "train_steps_per_second": 3.324
8
  }
1
  {
2
  "epoch": 3.0,
3
+ "train_loss": 0.02315408722391657,
4
+ "train_runtime": 2017.0522,
5
+ "train_samples": 33304,
6
+ "train_samples_per_second": 49.534,
7
+ "train_steps_per_second": 3.097
8
  }
trainer_state.json CHANGED
@@ -2,30 +2,96 @@
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
  "epoch": 3.0,
5
- "global_step": 645,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 2.33,
12
- "learning_rate": 1.1240310077519382e-05,
13
- "loss": 0.0692,
14
  "step": 500
15
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
16
  {
17
  "epoch": 3.0,
18
- "step": 645,
19
- "total_flos": 675153499627752.0,
20
- "train_loss": 0.059730371578719264,
21
- "train_runtime": 194.0601,
22
- "train_samples_per_second": 53.087,
23
- "train_steps_per_second": 3.324
24
  }
25
  ],
26
- "max_steps": 645,
27
  "num_train_epochs": 3,
28
- "total_flos": 675153499627752.0,
29
  "trial_name": null,
30
  "trial_params": null
31
  }
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
  "epoch": 3.0,
5
+ "global_step": 6246,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 0.24,
12
+ "learning_rate": 4.599743836055075e-05,
13
+ "loss": 0.0731,
14
  "step": 500
15
  },
16
+ {
17
+ "epoch": 0.48,
18
+ "learning_rate": 4.1994876721101504e-05,
19
+ "loss": 0.0345,
20
+ "step": 1000
21
+ },
22
+ {
23
+ "epoch": 0.72,
24
+ "learning_rate": 3.7992315081652255e-05,
25
+ "loss": 0.0299,
26
+ "step": 1500
27
+ },
28
+ {
29
+ "epoch": 0.96,
30
+ "learning_rate": 3.398975344220301e-05,
31
+ "loss": 0.027,
32
+ "step": 2000
33
+ },
34
+ {
35
+ "epoch": 1.2,
36
+ "learning_rate": 2.998719180275376e-05,
37
+ "loss": 0.0199,
38
+ "step": 2500
39
+ },
40
+ {
41
+ "epoch": 1.44,
42
+ "learning_rate": 2.5984630163304517e-05,
43
+ "loss": 0.0183,
44
+ "step": 3000
45
+ },
46
+ {
47
+ "epoch": 1.68,
48
+ "learning_rate": 2.1982068523855268e-05,
49
+ "loss": 0.018,
50
+ "step": 3500
51
+ },
52
+ {
53
+ "epoch": 1.92,
54
+ "learning_rate": 1.797950688440602e-05,
55
+ "loss": 0.0175,
56
+ "step": 4000
57
+ },
58
+ {
59
+ "epoch": 2.16,
60
+ "learning_rate": 1.3976945244956775e-05,
61
+ "loss": 0.0132,
62
+ "step": 4500
63
+ },
64
+ {
65
+ "epoch": 2.4,
66
+ "learning_rate": 9.974383605507526e-06,
67
+ "loss": 0.0114,
68
+ "step": 5000
69
+ },
70
+ {
71
+ "epoch": 2.64,
72
+ "learning_rate": 5.971821966058277e-06,
73
+ "loss": 0.0108,
74
+ "step": 5500
75
+ },
76
+ {
77
+ "epoch": 2.88,
78
+ "learning_rate": 1.96926032660903e-06,
79
+ "loss": 0.0105,
80
+ "step": 6000
81
+ },
82
  {
83
  "epoch": 3.0,
84
+ "step": 6246,
85
+ "total_flos": 6623681170117440.0,
86
+ "train_loss": 0.02315408722391657,
87
+ "train_runtime": 2017.0522,
88
+ "train_samples_per_second": 49.534,
89
+ "train_steps_per_second": 3.097
90
  }
91
  ],
92
+ "max_steps": 6246,
93
  "num_train_epochs": 3,
94
+ "total_flos": 6623681170117440.0,
95
  "trial_name": null,
96
  "trial_params": null
97
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:82e501ebaafb54fa08b9cc6a6a337a7ed61a65191081ddd5bda8581472f0a7c2
3
  size 2607
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa1fa9ff04e58841c66e7e501162366a8cc278043ea6c602d8e2d809df1e4268
3
  size 2607