sedrickkeh commited on
Commit
083f06c
·
verified ·
1 Parent(s): c31822a

Training in progress, epoch 1

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e858c7e9437a518cb195a3d5f7209474be8c9bd059841282e253e7eda744a2e2
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80c9a3c249a9e8bf61e0a750e10ae5c8d1de16c2cc9c59ac9cf155b14505b741
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b3ea16e009a88e498da971b99a4e0b4a338e2fdd12aa1727b74f187bc1a989d4
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abe1007abc5d42275a2ab9d42d15d5f0bb24aab7cbd92e524fbfe88f4f2fdbea
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0de5772d061255baa17d95d009f73507b4e7c4a75e203543ed65b42afca71415
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52adcdb4d69e3e4b5ddd9e890a01601bdb61d736c76aead1a17f450b4f110f31
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a4d8775d8a34ec0f2ecc60880e4e8ac4fd9c4e6738f399e774daaef456ac55c2
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:899217975c8284eae7a22095717f797c40cdf00239d06a5e716977ebf2817f62
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -45,3 +45,45 @@
45
  {"current_steps": 45, "total_steps": 126, "loss": 0.7368, "lr": 8.14840211594757e-06, "epoch": 1.0627450980392157, "percentage": 35.71, "elapsed_time": "0:23:54", "remaining_time": "0:43:01"}
46
  {"current_steps": 46, "total_steps": 126, "loss": 0.7976, "lr": 8.039209983943201e-06, "epoch": 1.0862745098039215, "percentage": 36.51, "elapsed_time": "0:24:22", "remaining_time": "0:42:23"}
47
  {"current_steps": 47, "total_steps": 126, "loss": 0.7109, "lr": 7.927668892097288e-06, "epoch": 1.1098039215686275, "percentage": 37.3, "elapsed_time": "0:24:45", "remaining_time": "0:41:37"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
45
  {"current_steps": 45, "total_steps": 126, "loss": 0.7368, "lr": 8.14840211594757e-06, "epoch": 1.0627450980392157, "percentage": 35.71, "elapsed_time": "0:23:54", "remaining_time": "0:43:01"}
46
  {"current_steps": 46, "total_steps": 126, "loss": 0.7976, "lr": 8.039209983943201e-06, "epoch": 1.0862745098039215, "percentage": 36.51, "elapsed_time": "0:24:22", "remaining_time": "0:42:23"}
47
  {"current_steps": 47, "total_steps": 126, "loss": 0.7109, "lr": 7.927668892097288e-06, "epoch": 1.1098039215686275, "percentage": 37.3, "elapsed_time": "0:24:45", "remaining_time": "0:41:37"}
48
+ {"current_steps": 48, "total_steps": 126, "loss": 0.738, "lr": 7.81386504884782e-06, "epoch": 1.1333333333333333, "percentage": 38.1, "elapsed_time": "0:25:19", "remaining_time": "0:41:08"}
49
+ {"current_steps": 49, "total_steps": 126, "loss": 0.8269, "lr": 7.697886411479422e-06, "epoch": 1.156862745098039, "percentage": 38.89, "elapsed_time": "0:25:48", "remaining_time": "0:40:33"}
50
+ {"current_steps": 50, "total_steps": 126, "loss": 0.7993, "lr": 7.579822618142505e-06, "epoch": 1.1803921568627451, "percentage": 39.68, "elapsed_time": "0:26:19", "remaining_time": "0:40:01"}
51
+ {"current_steps": 51, "total_steps": 126, "loss": 0.8325, "lr": 7.459764918573264e-06, "epoch": 1.203921568627451, "percentage": 40.48, "elapsed_time": "0:26:52", "remaining_time": "0:39:31"}
52
+ {"current_steps": 52, "total_steps": 126, "loss": 0.73, "lr": 7.3378061035681415e-06, "epoch": 1.227450980392157, "percentage": 41.27, "elapsed_time": "0:27:19", "remaining_time": "0:38:53"}
53
+ {"current_steps": 53, "total_steps": 126, "loss": 0.7398, "lr": 7.2140404332671986e-06, "epoch": 1.2509803921568627, "percentage": 42.06, "elapsed_time": "0:27:47", "remaining_time": "0:38:16"}
54
+ {"current_steps": 54, "total_steps": 126, "loss": 0.8289, "lr": 7.088563564301874e-06, "epoch": 1.2745098039215685, "percentage": 42.86, "elapsed_time": "0:28:18", "remaining_time": "0:37:45"}
55
+ {"current_steps": 55, "total_steps": 126, "loss": 0.7454, "lr": 6.961472475863406e-06, "epoch": 1.2980392156862746, "percentage": 43.65, "elapsed_time": "0:28:57", "remaining_time": "0:37:22"}
56
+ {"current_steps": 56, "total_steps": 126, "loss": 0.6694, "lr": 6.832865394749065e-06, "epoch": 1.3215686274509804, "percentage": 44.44, "elapsed_time": "0:29:25", "remaining_time": "0:36:46"}
57
+ {"current_steps": 57, "total_steps": 126, "loss": 0.8093, "lr": 6.702841719444141e-06, "epoch": 1.3450980392156864, "percentage": 45.24, "elapsed_time": "0:29:57", "remaining_time": "0:36:16"}
58
+ {"current_steps": 58, "total_steps": 126, "loss": 0.7096, "lr": 6.571501943298335e-06, "epoch": 1.3686274509803922, "percentage": 46.03, "elapsed_time": "0:30:28", "remaining_time": "0:35:43"}
59
+ {"current_steps": 59, "total_steps": 126, "loss": 0.8138, "lr": 6.4389475768559675e-06, "epoch": 1.392156862745098, "percentage": 46.83, "elapsed_time": "0:30:56", "remaining_time": "0:35:07"}
60
+ {"current_steps": 60, "total_steps": 126, "loss": 0.6619, "lr": 6.305281069399989e-06, "epoch": 1.415686274509804, "percentage": 47.62, "elapsed_time": "0:31:19", "remaining_time": "0:34:27"}
61
+ {"current_steps": 61, "total_steps": 126, "loss": 0.693, "lr": 6.17060572977047e-06, "epoch": 1.4392156862745098, "percentage": 48.41, "elapsed_time": "0:31:51", "remaining_time": "0:33:56"}
62
+ {"current_steps": 62, "total_steps": 126, "loss": 0.7561, "lr": 6.035025646518747e-06, "epoch": 1.4627450980392158, "percentage": 49.21, "elapsed_time": "0:32:29", "remaining_time": "0:33:31"}
63
+ {"current_steps": 63, "total_steps": 126, "loss": 0.7799, "lr": 5.898645607458941e-06, "epoch": 1.4862745098039216, "percentage": 50.0, "elapsed_time": "0:32:57", "remaining_time": "0:32:57"}
64
+ {"current_steps": 64, "total_steps": 126, "loss": 0.7374, "lr": 5.761571018679025e-06, "epoch": 1.5098039215686274, "percentage": 50.79, "elapsed_time": "0:33:24", "remaining_time": "0:32:21"}
65
+ {"current_steps": 65, "total_steps": 126, "loss": 0.8134, "lr": 5.623907823074044e-06, "epoch": 1.5333333333333332, "percentage": 51.59, "elapsed_time": "0:34:01", "remaining_time": "0:31:56"}
66
+ {"current_steps": 66, "total_steps": 126, "loss": 0.7933, "lr": 5.48576241846443e-06, "epoch": 1.5568627450980392, "percentage": 52.38, "elapsed_time": "0:34:37", "remaining_time": "0:31:28"}
67
+ {"current_steps": 67, "total_steps": 126, "loss": 0.7209, "lr": 5.347241575362729e-06, "epoch": 1.5803921568627453, "percentage": 53.17, "elapsed_time": "0:35:09", "remaining_time": "0:30:57"}
68
+ {"current_steps": 68, "total_steps": 126, "loss": 0.7746, "lr": 5.208452354452275e-06, "epoch": 1.603921568627451, "percentage": 53.97, "elapsed_time": "0:35:45", "remaining_time": "0:30:29"}
69
+ {"current_steps": 69, "total_steps": 126, "loss": 0.7635, "lr": 5.069502023841576e-06, "epoch": 1.6274509803921569, "percentage": 54.76, "elapsed_time": "0:36:21", "remaining_time": "0:30:01"}
70
+ {"current_steps": 70, "total_steps": 126, "loss": 0.7708, "lr": 4.9304979761584256e-06, "epoch": 1.6509803921568627, "percentage": 55.56, "elapsed_time": "0:36:49", "remaining_time": "0:29:27"}
71
+ {"current_steps": 71, "total_steps": 126, "loss": 0.6827, "lr": 4.791547645547727e-06, "epoch": 1.6745098039215687, "percentage": 56.35, "elapsed_time": "0:37:17", "remaining_time": "0:28:53"}
72
+ {"current_steps": 72, "total_steps": 126, "loss": 0.794, "lr": 4.652758424637271e-06, "epoch": 1.6980392156862745, "percentage": 57.14, "elapsed_time": "0:37:49", "remaining_time": "0:28:22"}
73
+ {"current_steps": 73, "total_steps": 126, "loss": 0.7368, "lr": 4.514237581535571e-06, "epoch": 1.7215686274509805, "percentage": 57.94, "elapsed_time": "0:38:18", "remaining_time": "0:27:48"}
74
+ {"current_steps": 74, "total_steps": 126, "loss": 0.6936, "lr": 4.3760921769259585e-06, "epoch": 1.7450980392156863, "percentage": 58.73, "elapsed_time": "0:38:47", "remaining_time": "0:27:15"}
75
+ {"current_steps": 75, "total_steps": 126, "loss": 0.7475, "lr": 4.2384289813209754e-06, "epoch": 1.768627450980392, "percentage": 59.52, "elapsed_time": "0:39:15", "remaining_time": "0:26:41"}
76
+ {"current_steps": 76, "total_steps": 126, "loss": 0.7358, "lr": 4.101354392541061e-06, "epoch": 1.792156862745098, "percentage": 60.32, "elapsed_time": "0:39:46", "remaining_time": "0:26:09"}
77
+ {"current_steps": 77, "total_steps": 126, "loss": 0.7331, "lr": 3.964974353481254e-06, "epoch": 1.815686274509804, "percentage": 61.11, "elapsed_time": "0:40:16", "remaining_time": "0:25:37"}
78
+ {"current_steps": 78, "total_steps": 126, "loss": 0.7295, "lr": 3.829394270229531e-06, "epoch": 1.83921568627451, "percentage": 61.9, "elapsed_time": "0:40:48", "remaining_time": "0:25:06"}
79
+ {"current_steps": 79, "total_steps": 126, "loss": 0.642, "lr": 3.694718930600012e-06, "epoch": 1.8627450980392157, "percentage": 62.7, "elapsed_time": "0:41:22", "remaining_time": "0:24:37"}
80
+ {"current_steps": 80, "total_steps": 126, "loss": 0.7889, "lr": 3.5610524231440324e-06, "epoch": 1.8862745098039215, "percentage": 63.49, "elapsed_time": "0:41:56", "remaining_time": "0:24:06"}
81
+ {"current_steps": 81, "total_steps": 126, "loss": 0.7499, "lr": 3.428498056701665e-06, "epoch": 1.9098039215686273, "percentage": 64.29, "elapsed_time": "0:42:24", "remaining_time": "0:23:33"}
82
+ {"current_steps": 82, "total_steps": 126, "loss": 0.7663, "lr": 3.2971582805558622e-06, "epoch": 1.9333333333333333, "percentage": 65.08, "elapsed_time": "0:42:56", "remaining_time": "0:23:02"}
83
+ {"current_steps": 83, "total_steps": 126, "loss": 0.7652, "lr": 3.167134605250938e-06, "epoch": 1.9568627450980394, "percentage": 65.87, "elapsed_time": "0:43:27", "remaining_time": "0:22:30"}
84
+ {"current_steps": 84, "total_steps": 126, "loss": 0.7709, "lr": 3.0385275241365965e-06, "epoch": 1.9803921568627452, "percentage": 66.67, "elapsed_time": "0:44:03", "remaining_time": "0:22:01"}
85
+ {"current_steps": 85, "total_steps": 126, "loss": 1.2373, "lr": 2.9114364356981274e-06, "epoch": 2.007843137254902, "percentage": 67.46, "elapsed_time": "0:45:31", "remaining_time": "0:21:57"}
86
+ {"current_steps": 86, "total_steps": 126, "loss": 0.7255, "lr": 2.7859595667328027e-06, "epoch": 2.0313725490196077, "percentage": 68.25, "elapsed_time": "0:46:03", "remaining_time": "0:21:25"}
87
+ {"current_steps": 87, "total_steps": 126, "loss": 0.6407, "lr": 2.6621938964318593e-06, "epoch": 2.0549019607843135, "percentage": 69.05, "elapsed_time": "0:46:30", "remaining_time": "0:20:50"}
88
+ {"current_steps": 88, "total_steps": 126, "loss": 0.6873, "lr": 2.5402350814267364e-06, "epoch": 2.0784313725490198, "percentage": 69.84, "elapsed_time": "0:46:56", "remaining_time": "0:20:16"}
89
+ {"current_steps": 89, "total_steps": 126, "loss": 0.6542, "lr": 2.4201773818574956e-06, "epoch": 2.1019607843137256, "percentage": 70.63, "elapsed_time": "0:47:27", "remaining_time": "0:19:43"}