xshubhamx commited on
Commit
045df22
·
verified ·
1 Parent(s): 0cbefc7

Upload folder using huggingface_hub

Browse files
training_checkpoints/checkpoint-643/adapter_config.json CHANGED
@@ -21,8 +21,8 @@
21
  "revision": null,
22
  "target_modules": [
23
  "key",
24
- "dense",
25
  "value",
 
26
  "query"
27
  ],
28
  "task_type": "SEQ_CLS",
 
21
  "revision": null,
22
  "target_modules": [
23
  "key",
 
24
  "value",
25
+ "dense",
26
  "query"
27
  ],
28
  "task_type": "SEQ_CLS",
training_checkpoints/checkpoint-643/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c53182b2c2c69c0d0d5eced0d73bd90fb6351291f5abd2a3f553054ac412349b
3
  size 104549068
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:807626fbe31da1676bfb47c4e711c05c686ee9ed330a1aa1123f64f769be412f
3
  size 104549068
training_checkpoints/checkpoint-643/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f922e3622a510677ec7a22a5cfc432084a4335086bbca12acbf57a0b4e684c29
3
  size 21646778
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb13d7468a59df546c16ce0cf0e090673b2cafc0fcfcca2c1ccc7ac3de7586e6
3
  size 21646778
training_checkpoints/checkpoint-643/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6438ed6cfc5010cc62ed940c59c896be41c9578565a6a8d984b6ec712fc0303a
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74888fb227ac28db8dee18137a1df7903e74e06fc48019f644883eaf139f2072
3
  size 1064
training_checkpoints/checkpoint-643/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.4262450946907797,
3
- "best_model_checkpoint": "legal-bert-lora/checkpoint-482",
4
  "epoch": 4.0,
5
  "eval_steps": 500,
6
  "global_step": 643,
@@ -10,102 +10,102 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_accuracy": 0.6297443841982959,
14
- "eval_f1_macro": 0.274206359888179,
15
- "eval_f1_micro": 0.6297443841982959,
16
- "eval_f1_weighted": 0.5693924444438366,
17
- "eval_loss": 1.3252344131469727,
18
- "eval_macro_fpr": 0.04170202326759921,
19
- "eval_macro_sensitivity": 0.31095312319919677,
20
- "eval_macro_specificity": 0.9716859606487191,
21
- "eval_precision": 0.5643117258906628,
22
- "eval_precision_macro": 0.2864620870649182,
23
- "eval_recall": 0.6297443841982959,
24
- "eval_recall_macro": 0.31095312319919677,
25
- "eval_runtime": 29.2455,
26
- "eval_samples_per_second": 44.143,
27
- "eval_steps_per_second": 5.539,
28
- "eval_weighted_fpr": 0.0403035413153457,
29
- "eval_weighted_sensitivity": 0.6297443841982959,
30
- "eval_weighted_specificity": 0.945545025532491,
31
  "step": 160
32
  },
33
  {
34
  "epoch": 2.0,
35
- "eval_accuracy": 0.7312161115414407,
36
- "eval_f1_macro": 0.39668888106795264,
37
- "eval_f1_micro": 0.7312161115414407,
38
- "eval_f1_weighted": 0.6996238601563893,
39
- "eval_loss": 0.8870222568511963,
40
- "eval_macro_fpr": 0.025654492164758257,
41
- "eval_macro_sensitivity": 0.4525442260434048,
42
- "eval_macro_specificity": 0.9800113592544849,
43
- "eval_precision": 0.687310022738013,
44
- "eval_precision_macro": 0.37417463878901125,
45
- "eval_recall": 0.7312161115414407,
46
- "eval_recall_macro": 0.4525442260434048,
47
- "eval_runtime": 31.4769,
48
- "eval_samples_per_second": 41.014,
49
- "eval_steps_per_second": 5.147,
50
- "eval_weighted_fpr": 0.025584310255843103,
51
- "eval_weighted_sensitivity": 0.7312161115414407,
52
- "eval_weighted_specificity": 0.9689542772758329,
53
  "step": 321
54
  },
55
  {
56
  "epoch": 3.0,
57
- "eval_accuracy": 0.7482571649883811,
58
- "eval_f1_macro": 0.4262450946907797,
59
- "eval_f1_micro": 0.7482571649883811,
60
- "eval_f1_weighted": 0.7282078768513273,
61
- "eval_loss": 0.7794041037559509,
62
- "eval_macro_fpr": 0.023941075707085962,
63
- "eval_macro_sensitivity": 0.46803400264857875,
64
- "eval_macro_specificity": 0.9812882861560729,
65
- "eval_precision": 0.716881212213352,
66
- "eval_precision_macro": 0.40594566191566384,
67
- "eval_recall": 0.7482571649883811,
68
- "eval_recall_macro": 0.46803400264857875,
69
- "eval_runtime": 31.9176,
70
- "eval_samples_per_second": 40.448,
71
- "eval_steps_per_second": 5.076,
72
- "eval_weighted_fpr": 0.02346739836811322,
73
- "eval_weighted_sensitivity": 0.7482571649883811,
74
- "eval_weighted_specificity": 0.9710671273527125,
75
  "step": 482
76
  },
77
  {
78
  "epoch": 3.11,
79
- "learning_rate": 3.4375e-05,
80
- "loss": 1.2835,
81
  "step": 500
82
  },
83
  {
84
  "epoch": 4.0,
85
- "eval_accuracy": 0.7443841982958946,
86
- "eval_f1_macro": 0.4099967964216515,
87
- "eval_f1_micro": 0.7443841982958946,
88
- "eval_f1_weighted": 0.7145941103131069,
89
- "eval_loss": 0.7480739951133728,
90
- "eval_macro_fpr": 0.024347730036769315,
91
- "eval_macro_sensitivity": 0.45879715060247334,
92
- "eval_macro_specificity": 0.9809610383366641,
93
- "eval_precision": 0.7084810945380595,
94
- "eval_precision_macro": 0.39966194371515146,
95
- "eval_recall": 0.7443841982958946,
96
- "eval_recall_macro": 0.45879715060247334,
97
- "eval_runtime": 31.4007,
98
- "eval_samples_per_second": 41.114,
99
- "eval_steps_per_second": 5.159,
100
- "eval_weighted_fpr": 0.023940800928612886,
101
- "eval_weighted_sensitivity": 0.7443841982958946,
102
- "eval_weighted_specificity": 0.9700313767540658,
103
  "step": 643
104
  }
105
  ],
106
  "logging_steps": 500,
107
- "max_steps": 1600,
108
- "num_train_epochs": 10,
109
  "save_steps": 500,
110
  "total_flos": 5577944869453824.0,
111
  "trial_name": null,
 
1
  {
2
+ "best_metric": 0.46141164864389705,
3
+ "best_model_checkpoint": "legal-bert-lora/checkpoint-643",
4
  "epoch": 4.0,
5
  "eval_steps": 500,
6
  "global_step": 643,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_accuracy": 0.6374903175832688,
14
+ "eval_f1_macro": 0.3394539856434376,
15
+ "eval_f1_micro": 0.6374903175832688,
16
+ "eval_f1_weighted": 0.5765523433851403,
17
+ "eval_loss": 1.3127473592758179,
18
+ "eval_macro_fpr": 0.040137717078130394,
19
+ "eval_macro_sensitivity": 0.4017115530536667,
20
+ "eval_macro_specificity": 0.9725650393599338,
21
+ "eval_precision": 0.5466227876047401,
22
+ "eval_precision_macro": 0.31141306924471374,
23
+ "eval_recall": 0.6374903175832688,
24
+ "eval_recall_macro": 0.4017115530536667,
25
+ "eval_runtime": 44.4128,
26
+ "eval_samples_per_second": 29.068,
27
+ "eval_steps_per_second": 3.648,
28
+ "eval_weighted_fpr": 0.0390325271059216,
29
+ "eval_weighted_sensitivity": 0.6374903175832688,
30
+ "eval_weighted_specificity": 0.950985272815738,
31
  "step": 160
32
  },
33
  {
34
  "epoch": 2.0,
35
+ "eval_accuracy": 0.7273431448489543,
36
+ "eval_f1_macro": 0.3969800602789428,
37
+ "eval_f1_micro": 0.7273431448489543,
38
+ "eval_f1_weighted": 0.6960627383550935,
39
+ "eval_loss": 0.8160030841827393,
40
+ "eval_macro_fpr": 0.026417996388603746,
41
+ "eval_macro_sensitivity": 0.450135625445356,
42
+ "eval_macro_specificity": 0.9796396430402219,
43
+ "eval_precision": 0.6997929823446861,
44
+ "eval_precision_macro": 0.39453164470926966,
45
+ "eval_recall": 0.7273431448489543,
46
+ "eval_recall_macro": 0.450135625445356,
47
+ "eval_runtime": 34.3148,
48
+ "eval_samples_per_second": 37.622,
49
+ "eval_steps_per_second": 4.721,
50
+ "eval_weighted_fpr": 0.026077937472218107,
51
+ "eval_weighted_sensitivity": 0.7273431448489543,
52
+ "eval_weighted_specificity": 0.9672515007543734,
53
  "step": 321
54
  },
55
  {
56
  "epoch": 3.0,
57
+ "eval_accuracy": 0.7443841982958946,
58
+ "eval_f1_macro": 0.4210575074216338,
59
+ "eval_f1_micro": 0.7443841982958946,
60
+ "eval_f1_weighted": 0.7223603623418946,
61
+ "eval_loss": 0.7322217226028442,
62
+ "eval_macro_fpr": 0.024451015698283406,
63
+ "eval_macro_sensitivity": 0.46251578703813245,
64
+ "eval_macro_specificity": 0.9809603839363172,
65
+ "eval_precision": 0.711002444877192,
66
+ "eval_precision_macro": 0.4030436676815596,
67
+ "eval_recall": 0.7443841982958946,
68
+ "eval_recall_macro": 0.46251578703813245,
69
+ "eval_runtime": 32.8708,
70
+ "eval_samples_per_second": 39.275,
71
+ "eval_steps_per_second": 4.928,
72
+ "eval_weighted_fpr": 0.023940800928612886,
73
+ "eval_weighted_sensitivity": 0.7443841982958946,
74
+ "eval_weighted_specificity": 0.9700215607488639,
75
  "step": 482
76
  },
77
  {
78
  "epoch": 3.11,
79
+ "learning_rate": 3.958333333333333e-05,
80
+ "loss": 1.2229,
81
  "step": 500
82
  },
83
  {
84
  "epoch": 4.0,
85
+ "eval_accuracy": 0.7536793183578622,
86
+ "eval_f1_macro": 0.46141164864389705,
87
+ "eval_f1_micro": 0.7536793183578622,
88
+ "eval_f1_weighted": 0.7337325056665881,
89
+ "eval_loss": 0.7034952640533447,
90
+ "eval_macro_fpr": 0.023326126599014015,
91
+ "eval_macro_sensitivity": 0.4865735295815666,
92
+ "eval_macro_specificity": 0.9815978320880049,
93
+ "eval_precision": 0.7340611054176746,
94
+ "eval_precision_macro": 0.4982390488816621,
95
+ "eval_recall": 0.7536793183578622,
96
+ "eval_recall_macro": 0.4865735295815666,
97
+ "eval_runtime": 33.282,
98
+ "eval_samples_per_second": 38.79,
99
+ "eval_steps_per_second": 4.868,
100
+ "eval_weighted_fpr": 0.022812051649928264,
101
+ "eval_weighted_sensitivity": 0.7536793183578622,
102
+ "eval_weighted_specificity": 0.9702881629622103,
103
  "step": 643
104
  }
105
  ],
106
  "logging_steps": 500,
107
+ "max_steps": 2400,
108
+ "num_train_epochs": 15,
109
  "save_steps": 500,
110
  "total_flos": 5577944869453824.0,
111
  "trial_name": null,
training_checkpoints/checkpoint-643/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1be05b6bb510587fe353991f6f2836b34a5909cbc5adc58389938bd163228a1f
3
  size 4600
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36a33fe5941ace0a96599f0a2229d1ce6d7002fe79c5372925862ab481915414
3
  size 4600