Takeshi10Days committed on
Commit
ff17baf
1 Parent(s): 3575ada

Training in progress, step 1500

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:59aaa84190c52a039f51c36d7cdf7843a54ba9681c4aa7cdfc1a073f739fbed5
3
  size 268290900
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49ea815675a34cbac9041de1da9a12ba61041e70f135f09a49e7225458df2955
3
  size 268290900
run-0/checkpoint-1500/trainer_state.json CHANGED
@@ -11,9 +11,9 @@
11
  {
12
  "epoch": 1.0,
13
  "eval_loss": 0.4282287061214447,
14
- "eval_runtime": 3.2301,
15
- "eval_samples_per_second": 959.713,
16
- "eval_steps_per_second": 20.123,
17
  "step": 318
18
  },
19
  {
@@ -26,17 +26,17 @@
26
  {
27
  "epoch": 2.0,
28
  "eval_loss": 0.1691545695066452,
29
- "eval_runtime": 3.3122,
30
- "eval_samples_per_second": 935.929,
31
- "eval_steps_per_second": 19.624,
32
  "step": 636
33
  },
34
  {
35
  "epoch": 3.0,
36
  "eval_loss": 0.09601032733917236,
37
- "eval_runtime": 3.3191,
38
- "eval_samples_per_second": 933.993,
39
- "eval_steps_per_second": 19.584,
40
  "step": 954
41
  },
42
  {
@@ -49,9 +49,9 @@
49
  {
50
  "epoch": 4.0,
51
  "eval_loss": 0.07325955480337143,
52
- "eval_runtime": 3.3266,
53
- "eval_samples_per_second": 931.889,
54
- "eval_steps_per_second": 19.54,
55
  "step": 1272
56
  },
57
  {
@@ -71,7 +71,7 @@
71
  "train_batch_size": 48,
72
  "trial_name": null,
73
  "trial_params": {
74
- "alpha": 0.10630408646687006,
75
  "num_train_epochs": 9,
76
  "temperature": 2
77
  }
 
11
  {
12
  "epoch": 1.0,
13
  "eval_loss": 0.4282287061214447,
14
+ "eval_runtime": 3.2319,
15
+ "eval_samples_per_second": 959.178,
16
+ "eval_steps_per_second": 20.112,
17
  "step": 318
18
  },
19
  {
 
26
  {
27
  "epoch": 2.0,
28
  "eval_loss": 0.1691545695066452,
29
+ "eval_runtime": 3.2816,
30
+ "eval_samples_per_second": 944.667,
31
+ "eval_steps_per_second": 19.808,
32
  "step": 636
33
  },
34
  {
35
  "epoch": 3.0,
36
  "eval_loss": 0.09601032733917236,
37
+ "eval_runtime": 3.3082,
38
+ "eval_samples_per_second": 937.058,
39
+ "eval_steps_per_second": 19.648,
40
  "step": 954
41
  },
42
  {
 
49
  {
50
  "epoch": 4.0,
51
  "eval_loss": 0.07325955480337143,
52
+ "eval_runtime": 3.4009,
53
+ "eval_samples_per_second": 911.523,
54
+ "eval_steps_per_second": 19.113,
55
  "step": 1272
56
  },
57
  {
 
71
  "train_batch_size": 48,
72
  "trial_name": null,
73
  "trial_params": {
74
+ "alpha": 0.31661862639116345,
75
  "num_train_epochs": 9,
76
  "temperature": 2
77
  }