Shresthadev403 committed on
Commit
44aa160
1 Parent(s): 0371498

End of training

Browse files
logs/events.out.tfevents.1702885199.f99763f5b9a6.40910.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dfc2304108de57b732a5a6b519fefd1ff858ad98df8ac1ca52dcccec92c690eb
3
+ size 4661
logs/events.out.tfevents.1702885463.f99763f5b9a6.40910.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71161617aaf09a07e106669dc827138d37a6bea47350e527a500cfe19e550f39
3
+ size 4855
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9e7dc4954663319ae553f7c8324f0be8209074fd1a7d694d36b48d737871b3fb
3
  size 497918592
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bce1ad637c7a99828fc7e7d3601c659a5dd4de6c4967b5f8d19f044d6350570b
3
  size 497918592
trainer_state.json CHANGED
@@ -1,28 +1,28 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.25,
5
  "eval_steps": 10,
6
- "global_step": 1,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.25,
13
- "step": 1,
14
- "total_flos": 2090336256000.0,
15
- "train_loss": 1.2067252397537231,
16
- "train_runtime": 2.2969,
17
- "train_samples_per_second": 3.918,
18
- "train_steps_per_second": 0.435
19
  }
20
  ],
21
  "logging_steps": 10,
22
- "max_steps": 1,
23
  "num_train_epochs": 1,
24
  "save_steps": 10,
25
- "total_flos": 2090336256000.0,
26
  "trial_name": null,
27
  "trial_params": null
28
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.09375,
5
  "eval_steps": 10,
6
+ "global_step": 3,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.09,
13
+ "step": 3,
14
+ "total_flos": 6271008768000.0,
15
+ "train_loss": 1.1875303586324055,
16
+ "train_runtime": 2.2971,
17
+ "train_samples_per_second": 39.179,
18
+ "train_steps_per_second": 1.306
19
  }
20
  ],
21
  "logging_steps": 10,
22
+ "max_steps": 3,
23
  "num_train_epochs": 1,
24
  "save_steps": 10,
25
+ "total_flos": 6271008768000.0,
26
  "trial_name": null,
27
  "trial_params": null
28
  }