yhyhy3 committed on
Commit
ef3736e
1 Parent(s): 2c08fae

Add model files and configs

Browse files
README.md CHANGED
@@ -49,7 +49,7 @@ The following hyperparameters were used during training:
49
 
50
  ### Framework versions
51
 
52
- - Transformers 4.36.0.dev0
53
  - Pytorch 2.2.0.dev20231114
54
- - Datasets 2.14.6
55
- - Tokenizers 0.14.1
 
49
 
50
  ### Framework versions
51
 
52
+ - Transformers 4.35.2
53
  - Pytorch 2.2.0.dev20231114
54
+ - Datasets 2.15.0
55
+ - Tokenizers 0.15.0
all_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 3.0,
3
- "train_loss": 0.6294479370117188,
4
- "train_runtime": 14.4911,
5
- "train_samples_per_second": 8.074,
6
- "train_steps_per_second": 1.035
7
  }
 
1
  {
2
  "epoch": 3.0,
3
+ "train_loss": 0.5570555263095431,
4
+ "train_runtime": 17.3481,
5
+ "train_samples_per_second": 7.436,
6
+ "train_steps_per_second": 1.038
7
  }
config.json CHANGED
@@ -45,7 +45,7 @@
45
  ],
46
  "problem_type": "single_label_classification",
47
  "semantic_loss_ignore_index": 255,
48
- "transformers_version": "4.36.0.dev0",
49
  "use_absolute_position_embeddings": true,
50
  "use_auxiliary_head": true,
51
  "use_mask_token": true,
 
45
  ],
46
  "problem_type": "single_label_classification",
47
  "semantic_loss_ignore_index": 255,
48
+ "transformers_version": "4.35.2",
49
  "use_absolute_position_embeddings": true,
50
  "use_auxiliary_head": true,
51
  "use_mask_token": true,
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 3.0,
3
- "train_loss": 0.6294479370117188,
4
- "train_runtime": 14.4911,
5
- "train_samples_per_second": 8.074,
6
- "train_steps_per_second": 1.035
7
  }
 
1
  {
2
  "epoch": 3.0,
3
+ "train_loss": 0.5570555263095431,
4
+ "train_runtime": 17.3481,
5
+ "train_samples_per_second": 7.436,
6
+ "train_steps_per_second": 1.038
7
  }
trainer_state.json CHANGED
@@ -3,26 +3,26 @@
3
  "best_model_checkpoint": null,
4
  "epoch": 3.0,
5
  "eval_steps": 500,
6
- "global_step": 15,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 3.0,
13
- "step": 15,
14
- "total_flos": 9067617800736768.0,
15
- "train_loss": 0.6294479370117188,
16
- "train_runtime": 14.4911,
17
- "train_samples_per_second": 8.074,
18
- "train_steps_per_second": 1.035
19
  }
20
  ],
21
  "logging_steps": 500,
22
- "max_steps": 15,
23
  "num_train_epochs": 3,
24
  "save_steps": 500,
25
- "total_flos": 9067617800736768.0,
26
  "trial_name": null,
27
  "trial_params": null
28
  }
 
3
  "best_model_checkpoint": null,
4
  "epoch": 3.0,
5
  "eval_steps": 500,
6
+ "global_step": 18,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 3.0,
13
+ "step": 18,
14
+ "total_flos": 9997629882863616.0,
15
+ "train_loss": 0.5570555263095431,
16
+ "train_runtime": 17.3481,
17
+ "train_samples_per_second": 7.436,
18
+ "train_steps_per_second": 1.038
19
  }
20
  ],
21
  "logging_steps": 500,
22
+ "max_steps": 18,
23
  "num_train_epochs": 3,
24
  "save_steps": 500,
25
+ "total_flos": 9997629882863616.0,
26
  "trial_name": null,
27
  "trial_params": null
28
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6f0c1e74c85f426352c503551abb429faf8f58dc744bc1ea002e8c2ffac5493c
3
- size 4600
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2059d238b115f5ffcbcd8a5d04fc8803894e1dd28e3e8ed4f0d1fe4a199f846e
3
+ size 4536