arpanl commited on
Commit
8383219
1 Parent(s): c0826fa

Training in progress, epoch 1

Browse files
all_results.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
- "epoch": 3.0,
3
- "eval_accuracy": 0.42857142857142855,
4
- "eval_f1": 0.3151515151515151,
5
- "eval_loss": 1.3327875137329102,
6
- "eval_runtime": 8.6145,
7
- "eval_samples_per_second": 1.625,
8
- "eval_steps_per_second": 0.232,
9
- "total_flos": 3254926098493440.0,
10
- "train_loss": 1.865134557088216,
11
- "train_runtime": 21.8909,
12
- "train_samples_per_second": 1.919,
13
- "train_steps_per_second": 0.137
14
  }
 
1
  {
2
+ "epoch": 50.0,
3
+ "eval_accuracy": 0.14285714285714285,
4
+ "eval_f1": 0.024242424242424246,
5
+ "eval_loss": 3.5492660999298096,
6
+ "eval_runtime": 85.1371,
7
+ "eval_samples_per_second": 0.164,
8
+ "eval_steps_per_second": 0.023,
9
+ "total_flos": 4.2624032242176e+16,
10
+ "train_loss": 2.1595826721191407,
11
+ "train_runtime": 4004.6726,
12
+ "train_samples_per_second": 0.137,
13
+ "train_steps_per_second": 0.012
14
  }
eval_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "epoch": 3.0,
3
- "eval_accuracy": 0.42857142857142855,
4
- "eval_f1": 0.3151515151515151,
5
- "eval_loss": 1.3327875137329102,
6
- "eval_runtime": 8.6145,
7
- "eval_samples_per_second": 1.625,
8
- "eval_steps_per_second": 0.232
9
  }
 
1
  {
2
+ "epoch": 50.0,
3
+ "eval_accuracy": 0.14285714285714285,
4
+ "eval_f1": 0.024242424242424246,
5
+ "eval_loss": 3.5492660999298096,
6
+ "eval_runtime": 85.1371,
7
+ "eval_samples_per_second": 0.164,
8
+ "eval_steps_per_second": 0.023
9
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aa22762222dddcfa14f9b16baa16916e893778d17c40e6c7b3fa39824857ecc4
3
  size 343251660
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81a7149e941c65f576002c5da1477c635a8370338a45dd98d7d2ae0f50b8763e
3
  size 343251660
runs/Mar21_05-18-06_059120fe4fe5/events.out.tfevents.1711002445.059120fe4fe5.7249.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b80c48893b9de88097eb2b80a4bf2ccf3258f528eb4e7c642fe7e4fef96c6a0
3
+ size 450
runs/Mar21_08-27-06_059120fe4fe5/events.out.tfevents.1711009682.059120fe4fe5.7249.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f288e783db8e24c916c160b2c88c0f0e3dc77244d5d3153229e4133eccf1abca
3
+ size 5392
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.0,
3
- "total_flos": 3254926098493440.0,
4
- "train_loss": 1.865134557088216,
5
- "train_runtime": 21.8909,
6
- "train_samples_per_second": 1.919,
7
- "train_steps_per_second": 0.137
8
  }
 
1
  {
2
+ "epoch": 50.0,
3
+ "total_flos": 4.2624032242176e+16,
4
+ "train_loss": 2.1595826721191407,
5
+ "train_runtime": 4004.6726,
6
+ "train_samples_per_second": 0.137,
7
+ "train_steps_per_second": 0.012
8
  }
trainer_state.json CHANGED
@@ -1,29 +1,46 @@
1
  {
2
- "best_metric": null,
3
- "best_model_checkpoint": null,
4
- "epoch": 3.0,
5
- "eval_steps": 1000,
6
- "global_step": 3,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 3.0,
13
- "step": 3,
14
- "total_flos": 3254926098493440.0,
15
- "train_loss": 1.865134557088216,
16
- "train_runtime": 21.8909,
17
- "train_samples_per_second": 1.919,
18
- "train_steps_per_second": 0.137
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
19
  }
20
  ],
21
- "logging_steps": 1000,
22
- "max_steps": 3,
23
  "num_input_tokens_seen": 0,
24
- "num_train_epochs": 3,
25
- "save_steps": 1000,
26
- "total_flos": 3254926098493440.0,
27
  "train_batch_size": 32,
28
  "trial_name": null,
29
  "trial_params": null
 
1
  {
2
+ "best_metric": 4.275224208831787,
3
+ "best_model_checkpoint": "/content/drive/MyDrive/Arkiv_Fine_tuning/Model/checkpoint-50",
4
+ "epoch": 50.0,
5
+ "eval_steps": 50,
6
+ "global_step": 50,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 50.0,
13
+ "grad_norm": 0.10450424998998642,
14
+ "learning_rate": 2.1875e-05,
15
+ "loss": 2.1596,
16
+ "step": 50
17
+ },
18
+ {
19
+ "epoch": 50.0,
20
+ "eval_accuracy": 0.3333333333333333,
21
+ "eval_f1": 0.16666666666666666,
22
+ "eval_loss": 4.275224208831787,
23
+ "eval_runtime": 18.0209,
24
+ "eval_samples_per_second": 0.166,
25
+ "eval_steps_per_second": 0.055,
26
+ "step": 50
27
+ },
28
+ {
29
+ "epoch": 50.0,
30
+ "step": 50,
31
+ "total_flos": 4.2624032242176e+16,
32
+ "train_loss": 2.1595826721191407,
33
+ "train_runtime": 4004.6726,
34
+ "train_samples_per_second": 0.137,
35
+ "train_steps_per_second": 0.012
36
  }
37
  ],
38
+ "logging_steps": 50,
39
+ "max_steps": 50,
40
  "num_input_tokens_seen": 0,
41
+ "num_train_epochs": 50,
42
+ "save_steps": 50,
43
+ "total_flos": 4.2624032242176e+16,
44
  "train_batch_size": 32,
45
  "trial_name": null,
46
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:74c5ab8809bb1b7d6f20f532bb1058fead8dd042887e285e70237eb37db40d4e
3
  size 4984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3908d5c733eb4947919dc2d992cf34178e68045538e3bb37d69b69794607888
3
  size 4984