fenguhao committed on
Commit
0243293
·
verified ·
1 Parent(s): 9dd5e1e

Model save

Browse files
all_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "epoch": 1.0,
3
  "total_flos": 5.19321114598441e+16,
4
- "train_loss": 0.29687737567084177,
5
- "train_runtime": 332.0278,
6
  "train_samples": 9000,
7
- "train_samples_per_second": 1.678,
8
- "train_steps_per_second": 0.105
9
  }
 
1
  {
2
  "epoch": 1.0,
3
  "total_flos": 5.19321114598441e+16,
4
+ "train_loss": 0.3596490706716265,
5
+ "train_runtime": 336.8523,
6
  "train_samples": 9000,
7
+ "train_samples_per_second": 1.657,
8
+ "train_steps_per_second": 0.104
9
  }
runs/Nov29_13-10-26_RLHF000/events.out.tfevents.1732885850.RLHF000.687743.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2581c00f4c1466bcf817413b6208387fb1ad5c48ea66e96a01ecf744c12266e5
3
- size 8570
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db5884ea7d51261793891b0ae9a0c23b9417bb6b1e0c193f6152171a47ee187d
3
+ size 9184
train_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "epoch": 1.0,
3
  "total_flos": 5.19321114598441e+16,
4
- "train_loss": 0.29687737567084177,
5
- "train_runtime": 332.0278,
6
  "train_samples": 9000,
7
- "train_samples_per_second": 1.678,
8
- "train_steps_per_second": 0.105
9
  }
 
1
  {
2
  "epoch": 1.0,
3
  "total_flos": 5.19321114598441e+16,
4
+ "train_loss": 0.3596490706716265,
5
+ "train_runtime": 336.8523,
6
  "train_samples": 9000,
7
+ "train_samples_per_second": 1.657,
8
+ "train_steps_per_second": 0.104
9
  }
trainer_state.json CHANGED
@@ -10,76 +10,76 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.02857142857142857,
13
- "grad_norm": 1.1770261526107788,
14
  "learning_rate": 5e-05,
15
- "loss": 0.781,
16
  "step": 1
17
  },
18
  {
19
  "epoch": 0.14285714285714285,
20
- "grad_norm": 0.7865971326828003,
21
  "learning_rate": 0.00019948693233918952,
22
- "loss": 0.6954,
23
  "step": 5
24
  },
25
  {
26
  "epoch": 0.2857142857142857,
27
- "grad_norm": 0.3400590717792511,
28
  "learning_rate": 0.00018207634412072764,
29
- "loss": 0.4525,
30
  "step": 10
31
  },
32
  {
33
  "epoch": 0.42857142857142855,
34
- "grad_norm": 0.24245862662792206,
35
  "learning_rate": 0.00014403941515576344,
36
- "loss": 0.306,
37
  "step": 15
38
  },
39
  {
40
  "epoch": 0.5714285714285714,
41
- "grad_norm": 0.23055194318294525,
42
  "learning_rate": 9.493508311612874e-05,
43
- "loss": 0.2153,
44
  "step": 20
45
  },
46
  {
47
  "epoch": 0.7142857142857143,
48
- "grad_norm": 0.25304117798805237,
49
  "learning_rate": 4.710359896730379e-05,
50
- "loss": 0.1602,
51
  "step": 25
52
  },
53
  {
54
  "epoch": 0.8571428571428571,
55
- "grad_norm": 0.2968534231185913,
56
  "learning_rate": 1.2565338385541792e-05,
57
- "loss": 0.1206,
58
  "step": 30
59
  },
60
  {
61
  "epoch": 1.0,
62
- "grad_norm": 0.11835439503192902,
63
  "learning_rate": 0.0,
64
- "loss": 0.111,
65
  "step": 35
66
  },
67
  {
68
  "epoch": 1.0,
69
- "eval_loss": 0.11065573990345001,
70
- "eval_runtime": 10.7768,
71
- "eval_samples_per_second": 5.66,
72
- "eval_steps_per_second": 0.371,
73
  "step": 35
74
  },
75
  {
76
  "epoch": 1.0,
77
  "step": 35,
78
  "total_flos": 5.19321114598441e+16,
79
- "train_loss": 0.29687737567084177,
80
- "train_runtime": 332.0278,
81
- "train_samples_per_second": 1.678,
82
- "train_steps_per_second": 0.105
83
  }
84
  ],
85
  "logging_steps": 5,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.02857142857142857,
13
+ "grad_norm": 1.1929763555526733,
14
  "learning_rate": 5e-05,
15
+ "loss": 0.842,
16
  "step": 1
17
  },
18
  {
19
  "epoch": 0.14285714285714285,
20
+ "grad_norm": 0.5904757380485535,
21
  "learning_rate": 0.00019948693233918952,
22
+ "loss": 0.7602,
23
  "step": 5
24
  },
25
  {
26
  "epoch": 0.2857142857142857,
27
+ "grad_norm": 0.35242587327957153,
28
  "learning_rate": 0.00018207634412072764,
29
+ "loss": 0.5166,
30
  "step": 10
31
  },
32
  {
33
  "epoch": 0.42857142857142855,
34
+ "grad_norm": 0.23204153776168823,
35
  "learning_rate": 0.00014403941515576344,
36
+ "loss": 0.3699,
37
  "step": 15
38
  },
39
  {
40
  "epoch": 0.5714285714285714,
41
+ "grad_norm": 0.21575891971588135,
42
  "learning_rate": 9.493508311612874e-05,
43
+ "loss": 0.2784,
44
  "step": 20
45
  },
46
  {
47
  "epoch": 0.7142857142857143,
48
+ "grad_norm": 0.27512410283088684,
49
  "learning_rate": 4.710359896730379e-05,
50
+ "loss": 0.222,
51
  "step": 25
52
  },
53
  {
54
  "epoch": 0.8571428571428571,
55
+ "grad_norm": 0.3192328214645386,
56
  "learning_rate": 1.2565338385541792e-05,
57
+ "loss": 0.1813,
58
  "step": 30
59
  },
60
  {
61
  "epoch": 1.0,
62
+ "grad_norm": 0.11489653587341309,
63
  "learning_rate": 0.0,
64
+ "loss": 0.1727,
65
  "step": 35
66
  },
67
  {
68
  "epoch": 1.0,
69
+ "eval_loss": 0.1722353994846344,
70
+ "eval_runtime": 11.0271,
71
+ "eval_samples_per_second": 5.623,
72
+ "eval_steps_per_second": 0.363,
73
  "step": 35
74
  },
75
  {
76
  "epoch": 1.0,
77
  "step": 35,
78
  "total_flos": 5.19321114598441e+16,
79
+ "train_loss": 0.3596490706716265,
80
+ "train_runtime": 336.8523,
81
+ "train_samples_per_second": 1.657,
82
+ "train_steps_per_second": 0.104
83
  }
84
  ],
85
  "logging_steps": 5,