sara-nabhani committed on
Commit
a8506d5
1 Parent(s): 2124686

Training in progress, step 12000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1dcf1e089fce6094a43a6df148dccae971c0758feecdb68eeeb7dc88e615426f
3
  size 1135685
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc52c0fda0953e9c5a430c827e292d874b1f843ff7773931f9c93cc6008fe891
3
  size 1135685
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6f0978cde5847e3dd7ce8a7f7c7c3254251303630f4b6281edb8558cea3d3d29
3
  size 307910149
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b2fe0ab2f310ff386ee37c2b5b780f689e9a8938176d4023a3a7ae780f91cae
3
  size 307910149
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:40593ea88f5e9169b2d59cd6aa5b2cd985839724b0346e888aae95e4bdf14a75
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8a619c5b75ad0de048a2974bf922da29a1e97a9cea67f262287c758eca45981
3
  size 14575
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:71a546360b22b38e65568c028955da704276b3a9551ee9dcac6165cd80d1258c
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f07e5c87a13181fdd91b70430838fde915aa2178a6a09686f68923b2683ae87
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": 1.7871696949005127,
3
  "best_model_checkpoint": "/home2/s5432073/nlp-final-project/results/google-flan-t5-small-e-snli-generation-label_and_explanation-selected-b64/checkpoint-2000",
4
- "epoch": 1.1649580615097856,
5
- "global_step": 10000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -116,11 +116,33 @@
116
  "eval_samples_per_second": 66.314,
117
  "eval_steps_per_second": 1.038,
118
  "step": 10000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
119
  }
120
  ],
121
  "max_steps": 85840,
122
  "num_train_epochs": 10,
123
- "total_flos": 1.3703196663877632e+16,
124
  "trial_name": null,
125
  "trial_params": null
126
  }
 
1
  {
2
  "best_metric": 1.7871696949005127,
3
  "best_model_checkpoint": "/home2/s5432073/nlp-final-project/results/google-flan-t5-small-e-snli-generation-label_and_explanation-selected-b64/checkpoint-2000",
4
+ "epoch": 1.3979496738117427,
5
+ "global_step": 12000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
116
  "eval_samples_per_second": 66.314,
117
  "eval_steps_per_second": 1.038,
118
  "step": 10000
119
+ },
120
+ {
121
+ "epoch": 1.4,
122
+ "learning_rate": 0.0009054789817040271,
123
+ "loss": 1.0913,
124
+ "step": 12000
125
+ },
126
+ {
127
+ "epoch": 1.4,
128
+ "eval_accuracy": 0.8691322901849218,
129
+ "eval_bertscore_f1": 0.9338201113503969,
130
+ "eval_bleu": 0.4012059786299585,
131
+ "eval_f1": 0.8686267742768865,
132
+ "eval_loss": 1.870266079902649,
133
+ "eval_rouge1": 0.6062872493545299,
134
+ "eval_rouge2": 0.39947246134905595,
135
+ "eval_rougeL": 0.5500107773403655,
136
+ "eval_rougeLsum": 0.5520562338476832,
137
+ "eval_runtime": 149.6673,
138
+ "eval_samples_per_second": 65.759,
139
+ "eval_steps_per_second": 1.029,
140
+ "step": 12000
141
  }
142
  ],
143
  "max_steps": 85840,
144
  "num_train_epochs": 10,
145
+ "total_flos": 1.6445151317200896e+16,
146
  "trial_name": null,
147
  "trial_params": null
148
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6f0978cde5847e3dd7ce8a7f7c7c3254251303630f4b6281edb8558cea3d3d29
3
  size 307910149
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b2fe0ab2f310ff386ee37c2b5b780f689e9a8938176d4023a3a7ae780f91cae
3
  size 307910149