chchen commited on
Commit
d85b286
1 Parent(s): 1d2f5ca

Training in progress, step 1500

Browse files
Files changed (2) hide show
  1. adapter_model.safetensors +1 -1
  2. trainer_log.jsonl +51 -0
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:83e947f37148f79b9e77f85e553930963ffb769e3088bd76132dd8f2ca6449e0
3
  size 83945296
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9bdcf36330c9e2459f73c25385bc4ff67646784dd6071b9c9a920838f7057efc
3
  size 83945296
trainer_log.jsonl CHANGED
@@ -100,3 +100,54 @@
100
  {"current_steps": 990, "total_steps": 1686, "loss": 0.8854, "accuracy": 0.5375000238418579, "learning_rate": 1.8239381598343576e-06, "epoch": 1.76039119804401, "percentage": 58.72, "elapsed_time": "2:45:53", "remaining_time": "1:56:37"}
101
  {"current_steps": 1000, "total_steps": 1686, "loss": 0.906, "accuracy": 0.5375000238418579, "learning_rate": 1.779207600392312e-06, "epoch": 1.7781729273171816, "percentage": 59.31, "elapsed_time": "2:47:35", "remaining_time": "1:54:58"}
102
  {"current_steps": 1000, "total_steps": 1686, "eval_loss": 0.903913676738739, "epoch": 1.7781729273171816, "percentage": 59.31, "elapsed_time": "2:50:44", "remaining_time": "1:57:07"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
100
  {"current_steps": 990, "total_steps": 1686, "loss": 0.8854, "accuracy": 0.5375000238418579, "learning_rate": 1.8239381598343576e-06, "epoch": 1.76039119804401, "percentage": 58.72, "elapsed_time": "2:45:53", "remaining_time": "1:56:37"}
101
  {"current_steps": 1000, "total_steps": 1686, "loss": 0.906, "accuracy": 0.5375000238418579, "learning_rate": 1.779207600392312e-06, "epoch": 1.7781729273171816, "percentage": 59.31, "elapsed_time": "2:47:35", "remaining_time": "1:54:58"}
102
  {"current_steps": 1000, "total_steps": 1686, "eval_loss": 0.903913676738739, "epoch": 1.7781729273171816, "percentage": 59.31, "elapsed_time": "2:50:44", "remaining_time": "1:57:07"}
103
+ {"current_steps": 1010, "total_steps": 1686, "loss": 0.9076, "accuracy": 0.512499988079071, "learning_rate": 1.7347273253353552e-06, "epoch": 1.7959546565903532, "percentage": 59.91, "elapsed_time": "2:52:25", "remaining_time": "1:55:24"}
104
+ {"current_steps": 1020, "total_steps": 1686, "loss": 0.9632, "accuracy": 0.574999988079071, "learning_rate": 1.690512779774029e-06, "epoch": 1.8137363858635251, "percentage": 60.5, "elapsed_time": "2:54:04", "remaining_time": "1:53:39"}
105
+ {"current_steps": 1030, "total_steps": 1686, "loss": 0.8807, "accuracy": 0.59375, "learning_rate": 1.6465793165482838e-06, "epoch": 1.831518115136697, "percentage": 61.09, "elapsed_time": "2:55:45", "remaining_time": "1:51:56"}
106
+ {"current_steps": 1040, "total_steps": 1686, "loss": 0.8817, "accuracy": 0.612500011920929, "learning_rate": 1.6029421908964305e-06, "epoch": 1.849299844409869, "percentage": 61.68, "elapsed_time": "2:57:18", "remaining_time": "1:50:08"}
107
+ {"current_steps": 1050, "total_steps": 1686, "loss": 0.9034, "accuracy": 0.543749988079071, "learning_rate": 1.559616555157985e-06, "epoch": 1.8670815736830408, "percentage": 62.28, "elapsed_time": "2:58:59", "remaining_time": "1:48:24"}
108
+ {"current_steps": 1060, "total_steps": 1686, "loss": 0.9475, "accuracy": 0.512499988079071, "learning_rate": 1.516617453512252e-06, "epoch": 1.8848633029562125, "percentage": 62.87, "elapsed_time": "3:00:38", "remaining_time": "1:46:40"}
109
+ {"current_steps": 1070, "total_steps": 1686, "loss": 0.8975, "accuracy": 0.5375000238418579, "learning_rate": 1.473959816754449e-06, "epoch": 1.9026450322293842, "percentage": 63.46, "elapsed_time": "3:02:13", "remaining_time": "1:44:54"}
110
+ {"current_steps": 1080, "total_steps": 1686, "loss": 0.9463, "accuracy": 0.550000011920929, "learning_rate": 1.4316584571112213e-06, "epoch": 1.920426761502556, "percentage": 64.06, "elapsed_time": "3:03:52", "remaining_time": "1:43:10"}
111
+ {"current_steps": 1090, "total_steps": 1686, "loss": 0.9165, "accuracy": 0.5874999761581421, "learning_rate": 1.389728063097306e-06, "epoch": 1.938208490775728, "percentage": 64.65, "elapsed_time": "3:05:33", "remaining_time": "1:41:27"}
112
+ {"current_steps": 1100, "total_steps": 1686, "loss": 0.9192, "accuracy": 0.6312500238418579, "learning_rate": 1.348183194415179e-06, "epoch": 1.9559902200488999, "percentage": 65.24, "elapsed_time": "3:07:07", "remaining_time": "1:39:41"}
113
+ {"current_steps": 1110, "total_steps": 1686, "loss": 0.9242, "accuracy": 0.543749988079071, "learning_rate": 1.3070382768994015e-06, "epoch": 1.9737719493220716, "percentage": 65.84, "elapsed_time": "3:08:48", "remaining_time": "1:37:58"}
114
+ {"current_steps": 1120, "total_steps": 1686, "loss": 0.8944, "accuracy": 0.5687500238418579, "learning_rate": 1.2663075975074746e-06, "epoch": 1.9915536785952432, "percentage": 66.43, "elapsed_time": "3:10:29", "remaining_time": "1:36:15"}
115
+ {"current_steps": 1130, "total_steps": 1686, "loss": 0.9847, "accuracy": 0.512499988079071, "learning_rate": 1.2260052993589034e-06, "epoch": 2.009335407868415, "percentage": 67.02, "elapsed_time": "3:12:09", "remaining_time": "1:34:32"}
116
+ {"current_steps": 1140, "total_steps": 1686, "loss": 0.8449, "accuracy": 0.643750011920929, "learning_rate": 1.1861453768242099e-06, "epoch": 2.027117137141587, "percentage": 67.62, "elapsed_time": "3:13:48", "remaining_time": "1:32:49"}
117
+ {"current_steps": 1150, "total_steps": 1686, "loss": 0.9851, "accuracy": 0.518750011920929, "learning_rate": 1.1467416706655982e-06, "epoch": 2.044898866414759, "percentage": 68.21, "elapsed_time": "3:15:32", "remaining_time": "1:31:08"}
118
+ {"current_steps": 1160, "total_steps": 1686, "loss": 0.8987, "accuracy": 0.543749988079071, "learning_rate": 1.1078078632309559e-06, "epoch": 2.062680595687931, "percentage": 68.8, "elapsed_time": "3:17:09", "remaining_time": "1:29:24"}
119
+ {"current_steps": 1170, "total_steps": 1686, "loss": 0.9292, "accuracy": 0.5249999761581421, "learning_rate": 1.0693574737028627e-06, "epoch": 2.0804623249611023, "percentage": 69.4, "elapsed_time": "3:18:50", "remaining_time": "1:27:41"}
120
+ {"current_steps": 1180, "total_steps": 1686, "loss": 0.8704, "accuracy": 0.550000011920929, "learning_rate": 1.0314038534042586e-06, "epoch": 2.098244054234274, "percentage": 69.99, "elapsed_time": "3:20:31", "remaining_time": "1:25:59"}
121
+ {"current_steps": 1190, "total_steps": 1686, "loss": 0.9141, "accuracy": 0.53125, "learning_rate": 9.939601811623946e-07, "epoch": 2.116025783507446, "percentage": 70.58, "elapsed_time": "3:22:07", "remaining_time": "1:24:14"}
122
+ {"current_steps": 1200, "total_steps": 1686, "loss": 0.8916, "accuracy": 0.6000000238418579, "learning_rate": 9.570394587326825e-07, "epoch": 2.133807512780618, "percentage": 71.17, "elapsed_time": "3:23:46", "remaining_time": "1:22:31"}
123
+ {"current_steps": 1210, "total_steps": 1686, "loss": 0.8573, "accuracy": 0.637499988079071, "learning_rate": 9.206545062840302e-07, "epoch": 2.15158924205379, "percentage": 71.77, "elapsed_time": "3:25:23", "remaining_time": "1:20:48"}
124
+ {"current_steps": 1220, "total_steps": 1686, "loss": 0.8803, "accuracy": 0.512499988079071, "learning_rate": 8.848179579472285e-07, "epoch": 2.1693709713269618, "percentage": 72.36, "elapsed_time": "3:27:03", "remaining_time": "1:19:05"}
125
+ {"current_steps": 1230, "total_steps": 1686, "loss": 0.8073, "accuracy": 0.637499988079071, "learning_rate": 8.495422574279403e-07, "epoch": 2.1871527006001332, "percentage": 72.95, "elapsed_time": "3:28:38", "remaining_time": "1:17:21"}
126
+ {"current_steps": 1240, "total_steps": 1686, "loss": 0.9162, "accuracy": 0.59375, "learning_rate": 8.148396536858063e-07, "epoch": 2.204934429873305, "percentage": 73.55, "elapsed_time": "3:30:17", "remaining_time": "1:15:38"}
127
+ {"current_steps": 1250, "total_steps": 1686, "loss": 0.9478, "accuracy": 0.5375000238418579, "learning_rate": 7.807221966811815e-07, "epoch": 2.222716159146477, "percentage": 74.14, "elapsed_time": "3:31:58", "remaining_time": "1:13:56"}
128
+ {"current_steps": 1260, "total_steps": 1686, "loss": 0.8614, "accuracy": 0.543749988079071, "learning_rate": 7.47201733190962e-07, "epoch": 2.240497888419649, "percentage": 74.73, "elapsed_time": "3:33:38", "remaining_time": "1:12:13"}
129
+ {"current_steps": 1270, "total_steps": 1686, "loss": 0.8802, "accuracy": 0.574999988079071, "learning_rate": 7.142899026949721e-07, "epoch": 2.258279617692821, "percentage": 75.33, "elapsed_time": "3:35:18", "remaining_time": "1:10:31"}
130
+ {"current_steps": 1280, "total_steps": 1686, "loss": 0.8761, "accuracy": 0.5625, "learning_rate": 6.819981333343273e-07, "epoch": 2.2760613469659923, "percentage": 75.92, "elapsed_time": "3:36:53", "remaining_time": "1:08:47"}
131
+ {"current_steps": 1290, "total_steps": 1686, "loss": 0.9673, "accuracy": 0.5062500238418579, "learning_rate": 6.503376379431839e-07, "epoch": 2.293843076239164, "percentage": 76.51, "elapsed_time": "3:38:32", "remaining_time": "1:07:05"}
132
+ {"current_steps": 1300, "total_steps": 1686, "loss": 0.8516, "accuracy": 0.606249988079071, "learning_rate": 6.193194101552502e-07, "epoch": 2.311624805512336, "percentage": 77.11, "elapsed_time": "3:40:13", "remaining_time": "1:05:23"}
133
+ {"current_steps": 1310, "total_steps": 1686, "loss": 0.9165, "accuracy": 0.6187499761581421, "learning_rate": 5.889542205864083e-07, "epoch": 2.329406534785508, "percentage": 77.7, "elapsed_time": "3:41:47", "remaining_time": "1:03:39"}
134
+ {"current_steps": 1320, "total_steps": 1686, "loss": 0.9403, "accuracy": 0.512499988079071, "learning_rate": 5.592526130947862e-07, "epoch": 2.34718826405868, "percentage": 78.29, "elapsed_time": "3:43:28", "remaining_time": "1:01:57"}
135
+ {"current_steps": 1330, "total_steps": 1686, "loss": 0.8828, "accuracy": 0.543749988079071, "learning_rate": 5.302249011195507e-07, "epoch": 2.3649699933318518, "percentage": 78.88, "elapsed_time": "3:45:00", "remaining_time": "1:00:13"}
136
+ {"current_steps": 1340, "total_steps": 1686, "loss": 0.9397, "accuracy": 0.574999988079071, "learning_rate": 5.018811640997307e-07, "epoch": 2.382751722605023, "percentage": 79.48, "elapsed_time": "3:46:44", "remaining_time": "0:58:32"}
137
+ {"current_steps": 1350, "total_steps": 1686, "loss": 0.9355, "accuracy": 0.550000011920929, "learning_rate": 4.7423124397427105e-07, "epoch": 2.400533451878195, "percentage": 80.07, "elapsed_time": "3:48:15", "remaining_time": "0:56:48"}
138
+ {"current_steps": 1360, "total_steps": 1686, "loss": 0.9027, "accuracy": 0.6000000238418579, "learning_rate": 4.472847417645787e-07, "epoch": 2.418315181151367, "percentage": 80.66, "elapsed_time": "3:49:50", "remaining_time": "0:55:05"}
139
+ {"current_steps": 1370, "total_steps": 1686, "loss": 0.8711, "accuracy": 0.574999988079071, "learning_rate": 4.210510142406993e-07, "epoch": 2.436096910424539, "percentage": 81.26, "elapsed_time": "3:51:26", "remaining_time": "0:53:22"}
140
+ {"current_steps": 1380, "total_steps": 1686, "loss": 0.9248, "accuracy": 0.550000011920929, "learning_rate": 3.9553917067232966e-07, "epoch": 2.4538786396977104, "percentage": 81.85, "elapsed_time": "3:53:02", "remaining_time": "0:51:40"}
141
+ {"current_steps": 1390, "total_steps": 1686, "loss": 0.8702, "accuracy": 0.606249988079071, "learning_rate": 3.707580696657509e-07, "epoch": 2.4716603689708823, "percentage": 82.44, "elapsed_time": "3:54:37", "remaining_time": "0:49:57"}
142
+ {"current_steps": 1400, "total_steps": 1686, "loss": 0.9252, "accuracy": 0.550000011920929, "learning_rate": 3.4671631608781815e-07, "epoch": 2.489442098244054, "percentage": 83.04, "elapsed_time": "3:56:09", "remaining_time": "0:48:14"}
143
+ {"current_steps": 1410, "total_steps": 1686, "loss": 0.8863, "accuracy": 0.5625, "learning_rate": 3.234222580780405e-07, "epoch": 2.507223827517226, "percentage": 83.63, "elapsed_time": "3:57:43", "remaining_time": "0:46:31"}
144
+ {"current_steps": 1420, "total_steps": 1686, "loss": 0.9167, "accuracy": 0.543749988079071, "learning_rate": 3.0088398414982375e-07, "epoch": 2.525005556790398, "percentage": 84.22, "elapsed_time": "3:59:20", "remaining_time": "0:44:50"}
145
+ {"current_steps": 1430, "total_steps": 1686, "loss": 0.9131, "accuracy": 0.625, "learning_rate": 2.7910932038184487e-07, "epoch": 2.54278728606357, "percentage": 84.82, "elapsed_time": "4:00:56", "remaining_time": "0:43:07"}
146
+ {"current_steps": 1440, "total_steps": 1686, "loss": 0.8714, "accuracy": 0.6000000238418579, "learning_rate": 2.5810582770057325e-07, "epoch": 2.5605690153367417, "percentage": 85.41, "elapsed_time": "4:02:38", "remaining_time": "0:41:27"}
147
+ {"current_steps": 1450, "total_steps": 1686, "loss": 0.9391, "accuracy": 0.5375000238418579, "learning_rate": 2.3788079925484402e-07, "epoch": 2.578350744609913, "percentage": 86.0, "elapsed_time": "4:04:21", "remaining_time": "0:39:46"}
148
+ {"current_steps": 1460, "total_steps": 1686, "loss": 0.8548, "accuracy": 0.643750011920929, "learning_rate": 2.1844125788342661e-07, "epoch": 2.596132473883085, "percentage": 86.6, "elapsed_time": "4:05:56", "remaining_time": "0:38:04"}
149
+ {"current_steps": 1470, "total_steps": 1686, "loss": 0.8624, "accuracy": 0.5625, "learning_rate": 1.9979395367644428e-07, "epoch": 2.613914203156257, "percentage": 87.19, "elapsed_time": "4:07:35", "remaining_time": "0:36:22"}
150
+ {"current_steps": 1480, "total_steps": 1686, "loss": 0.9134, "accuracy": 0.4749999940395355, "learning_rate": 1.81945361631512e-07, "epoch": 2.631695932429429, "percentage": 87.78, "elapsed_time": "4:09:11", "remaining_time": "0:34:41"}
151
+ {"current_steps": 1490, "total_steps": 1686, "loss": 0.8593, "accuracy": 0.625, "learning_rate": 1.6490167940538343e-07, "epoch": 2.6494776617026004, "percentage": 88.37, "elapsed_time": "4:10:52", "remaining_time": "0:33:00"}
152
+ {"current_steps": 1500, "total_steps": 1686, "loss": 0.9019, "accuracy": 0.5874999761581421, "learning_rate": 1.4866882516191339e-07, "epoch": 2.6672593909757722, "percentage": 88.97, "elapsed_time": "4:12:33", "remaining_time": "0:31:18"}
153
+ {"current_steps": 1500, "total_steps": 1686, "eval_loss": 0.8975116014480591, "epoch": 2.6672593909757722, "percentage": 88.97, "elapsed_time": "4:15:42", "remaining_time": "0:31:42"}