Takeshi10Days committed on
Commit
3575ada
1 Parent(s): 0b39063

Training in progress, step 1000

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c90a8343645a6bbe8931fb749f22a6c31331f90b9d81678d49817a28e1677bca
3
  size 268290900
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59aaa84190c52a039f51c36d7cdf7843a54ba9681c4aa7cdfc1a073f739fbed5
3
  size 268290900
run-0/checkpoint-1000/trainer_state.json CHANGED
@@ -11,9 +11,9 @@
11
  {
12
  "epoch": 1.0,
13
  "eval_loss": 0.4282287061214447,
14
- "eval_runtime": 3.2301,
15
- "eval_samples_per_second": 959.713,
16
- "eval_steps_per_second": 20.123,
17
  "step": 318
18
  },
19
  {
@@ -26,17 +26,17 @@
26
  {
27
  "epoch": 2.0,
28
  "eval_loss": 0.1691545695066452,
29
- "eval_runtime": 3.3122,
30
- "eval_samples_per_second": 935.929,
31
- "eval_steps_per_second": 19.624,
32
  "step": 636
33
  },
34
  {
35
  "epoch": 3.0,
36
  "eval_loss": 0.09601032733917236,
37
- "eval_runtime": 3.3191,
38
- "eval_samples_per_second": 933.993,
39
- "eval_steps_per_second": 19.584,
40
  "step": 954
41
  },
42
  {
@@ -56,7 +56,7 @@
56
  "train_batch_size": 48,
57
  "trial_name": null,
58
  "trial_params": {
59
- "alpha": 0.10630408646687006,
60
  "num_train_epochs": 9,
61
  "temperature": 2
62
  }
 
11
  {
12
  "epoch": 1.0,
13
  "eval_loss": 0.4282287061214447,
14
+ "eval_runtime": 3.2319,
15
+ "eval_samples_per_second": 959.178,
16
+ "eval_steps_per_second": 20.112,
17
  "step": 318
18
  },
19
  {
 
26
  {
27
  "epoch": 2.0,
28
  "eval_loss": 0.1691545695066452,
29
+ "eval_runtime": 3.2816,
30
+ "eval_samples_per_second": 944.667,
31
+ "eval_steps_per_second": 19.808,
32
  "step": 636
33
  },
34
  {
35
  "epoch": 3.0,
36
  "eval_loss": 0.09601032733917236,
37
+ "eval_runtime": 3.3082,
38
+ "eval_samples_per_second": 937.058,
39
+ "eval_steps_per_second": 19.648,
40
  "step": 954
41
  },
42
  {
 
56
  "train_batch_size": 48,
57
  "trial_name": null,
58
  "trial_params": {
59
+ "alpha": 0.31661862639116345,
60
  "num_train_epochs": 9,
61
  "temperature": 2
62
  }