Rakancorle1 commited on
Commit
4e77a76
·
verified ·
1 Parent(s): 0917513

Training in progress, step 1000

Browse files
Files changed (2) hide show
  1. adapter_model.safetensors +1 -1
  2. trainer_log.jsonl +50 -0
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7b7cd1c6b84f5277c99e7a115a3ac3b4847b209eb9829b115ebf6760dbb74f8e
3
  size 42002584
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef6059da8352e52905470e3b9e7300b13a23926e02ba6acd33645b3f26b2d62c
3
  size 42002584
trainer_log.jsonl CHANGED
@@ -48,3 +48,53 @@
48
  {"current_steps": 480, "total_steps": 1875, "loss": 0.5039, "lr": 8.468266529064025e-05, "epoch": 0.768, "percentage": 25.6, "elapsed_time": "1:08:21", "remaining_time": "3:18:38"}
49
  {"current_steps": 490, "total_steps": 1875, "loss": 0.4737, "lr": 8.4074380635076e-05, "epoch": 0.784, "percentage": 26.13, "elapsed_time": "1:09:46", "remaining_time": "3:17:13"}
50
  {"current_steps": 500, "total_steps": 1875, "loss": 0.5296, "lr": 8.345653031794292e-05, "epoch": 0.8, "percentage": 26.67, "elapsed_time": "1:11:12", "remaining_time": "3:15:48"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
48
  {"current_steps": 480, "total_steps": 1875, "loss": 0.5039, "lr": 8.468266529064025e-05, "epoch": 0.768, "percentage": 25.6, "elapsed_time": "1:08:21", "remaining_time": "3:18:38"}
49
  {"current_steps": 490, "total_steps": 1875, "loss": 0.4737, "lr": 8.4074380635076e-05, "epoch": 0.784, "percentage": 26.13, "elapsed_time": "1:09:46", "remaining_time": "3:17:13"}
50
  {"current_steps": 500, "total_steps": 1875, "loss": 0.5296, "lr": 8.345653031794292e-05, "epoch": 0.8, "percentage": 26.67, "elapsed_time": "1:11:12", "remaining_time": "3:15:48"}
51
+ {"current_steps": 510, "total_steps": 1875, "loss": 0.4688, "lr": 8.282928778764783e-05, "epoch": 0.816, "percentage": 27.2, "elapsed_time": "1:12:47", "remaining_time": "3:14:49"}
52
+ {"current_steps": 520, "total_steps": 1875, "loss": 0.4675, "lr": 8.21928291292627e-05, "epoch": 0.832, "percentage": 27.73, "elapsed_time": "1:14:12", "remaining_time": "3:13:21"}
53
+ {"current_steps": 530, "total_steps": 1875, "loss": 0.4408, "lr": 8.154733301509248e-05, "epoch": 0.848, "percentage": 28.27, "elapsed_time": "1:15:37", "remaining_time": "3:11:54"}
54
+ {"current_steps": 540, "total_steps": 1875, "loss": 0.4608, "lr": 8.089298065451672e-05, "epoch": 0.864, "percentage": 28.8, "elapsed_time": "1:17:02", "remaining_time": "3:10:27"}
55
+ {"current_steps": 550, "total_steps": 1875, "loss": 0.4476, "lr": 8.022995574311876e-05, "epoch": 0.88, "percentage": 29.33, "elapsed_time": "1:18:26", "remaining_time": "3:08:58"}
56
+ {"current_steps": 560, "total_steps": 1875, "loss": 0.5027, "lr": 7.95584444111171e-05, "epoch": 0.896, "percentage": 29.87, "elapsed_time": "1:19:50", "remaining_time": "3:07:29"}
57
+ {"current_steps": 570, "total_steps": 1875, "loss": 0.4929, "lr": 7.887863517111338e-05, "epoch": 0.912, "percentage": 30.4, "elapsed_time": "1:21:15", "remaining_time": "3:06:01"}
58
+ {"current_steps": 580, "total_steps": 1875, "loss": 0.4739, "lr": 7.819071886517134e-05, "epoch": 0.928, "percentage": 30.93, "elapsed_time": "1:22:39", "remaining_time": "3:04:33"}
59
+ {"current_steps": 590, "total_steps": 1875, "loss": 0.4529, "lr": 7.7494888611242e-05, "epoch": 0.944, "percentage": 31.47, "elapsed_time": "1:24:03", "remaining_time": "3:03:05"}
60
+ {"current_steps": 600, "total_steps": 1875, "loss": 0.4619, "lr": 7.679133974894983e-05, "epoch": 0.96, "percentage": 32.0, "elapsed_time": "1:25:28", "remaining_time": "3:01:37"}
61
+ {"current_steps": 610, "total_steps": 1875, "loss": 0.462, "lr": 7.60802697847554e-05, "epoch": 0.976, "percentage": 32.53, "elapsed_time": "1:26:52", "remaining_time": "3:00:10"}
62
+ {"current_steps": 620, "total_steps": 1875, "loss": 0.4478, "lr": 7.536187833650947e-05, "epoch": 0.992, "percentage": 33.07, "elapsed_time": "1:28:17", "remaining_time": "2:58:43"}
63
+ {"current_steps": 630, "total_steps": 1875, "loss": 0.4304, "lr": 7.463636707741458e-05, "epoch": 1.008, "percentage": 33.6, "elapsed_time": "1:29:42", "remaining_time": "2:57:17"}
64
+ {"current_steps": 640, "total_steps": 1875, "loss": 0.4138, "lr": 7.390393967940962e-05, "epoch": 1.024, "percentage": 34.13, "elapsed_time": "1:31:07", "remaining_time": "2:55:50"}
65
+ {"current_steps": 650, "total_steps": 1875, "loss": 0.3909, "lr": 7.316480175599309e-05, "epoch": 1.04, "percentage": 34.67, "elapsed_time": "1:32:32", "remaining_time": "2:54:23"}
66
+ {"current_steps": 660, "total_steps": 1875, "loss": 0.3873, "lr": 7.241916080450163e-05, "epoch": 1.056, "percentage": 35.2, "elapsed_time": "1:33:56", "remaining_time": "2:52:56"}
67
+ {"current_steps": 670, "total_steps": 1875, "loss": 0.3744, "lr": 7.166722614785937e-05, "epoch": 1.072, "percentage": 35.73, "elapsed_time": "1:35:21", "remaining_time": "2:51:29"}
68
+ {"current_steps": 680, "total_steps": 1875, "loss": 0.3641, "lr": 7.090920887581506e-05, "epoch": 1.088, "percentage": 36.27, "elapsed_time": "1:36:45", "remaining_time": "2:50:02"}
69
+ {"current_steps": 690, "total_steps": 1875, "loss": 0.3708, "lr": 7.014532178568314e-05, "epoch": 1.104, "percentage": 36.8, "elapsed_time": "1:38:10", "remaining_time": "2:48:35"}
70
+ {"current_steps": 700, "total_steps": 1875, "loss": 0.4147, "lr": 6.937577932260515e-05, "epoch": 1.12, "percentage": 37.33, "elapsed_time": "1:39:34", "remaining_time": "2:47:08"}
71
+ {"current_steps": 710, "total_steps": 1875, "loss": 0.3698, "lr": 6.860079751934908e-05, "epoch": 1.1360000000000001, "percentage": 37.87, "elapsed_time": "1:40:59", "remaining_time": "2:45:42"}
72
+ {"current_steps": 720, "total_steps": 1875, "loss": 0.3768, "lr": 6.782059393566253e-05, "epoch": 1.152, "percentage": 38.4, "elapsed_time": "1:42:24", "remaining_time": "2:44:16"}
73
+ {"current_steps": 730, "total_steps": 1875, "loss": 0.3713, "lr": 6.70353875971976e-05, "epoch": 1.168, "percentage": 38.93, "elapsed_time": "1:43:48", "remaining_time": "2:42:49"}
74
+ {"current_steps": 740, "total_steps": 1875, "loss": 0.376, "lr": 6.624539893402382e-05, "epoch": 1.184, "percentage": 39.47, "elapsed_time": "1:45:12", "remaining_time": "2:41:22"}
75
+ {"current_steps": 750, "total_steps": 1875, "loss": 0.3762, "lr": 6.545084971874738e-05, "epoch": 1.2, "percentage": 40.0, "elapsed_time": "1:46:37", "remaining_time": "2:39:56"}
76
+ {"current_steps": 760, "total_steps": 1875, "loss": 0.3891, "lr": 6.465196300425287e-05, "epoch": 1.216, "percentage": 40.53, "elapsed_time": "1:48:01", "remaining_time": "2:38:29"}
77
+ {"current_steps": 770, "total_steps": 1875, "loss": 0.3772, "lr": 6.384896306108612e-05, "epoch": 1.232, "percentage": 41.07, "elapsed_time": "1:49:26", "remaining_time": "2:37:02"}
78
+ {"current_steps": 780, "total_steps": 1875, "loss": 0.3678, "lr": 6.304207531449486e-05, "epoch": 1.248, "percentage": 41.6, "elapsed_time": "1:50:50", "remaining_time": "2:35:36"}
79
+ {"current_steps": 790, "total_steps": 1875, "loss": 0.3648, "lr": 6.223152628114537e-05, "epoch": 1.264, "percentage": 42.13, "elapsed_time": "1:52:14", "remaining_time": "2:34:09"}
80
+ {"current_steps": 800, "total_steps": 1875, "loss": 0.3909, "lr": 6.141754350553279e-05, "epoch": 1.28, "percentage": 42.67, "elapsed_time": "1:53:39", "remaining_time": "2:32:44"}
81
+ {"current_steps": 810, "total_steps": 1875, "loss": 0.383, "lr": 6.0600355496102745e-05, "epoch": 1.296, "percentage": 43.2, "elapsed_time": "1:55:05", "remaining_time": "2:31:19"}
82
+ {"current_steps": 820, "total_steps": 1875, "loss": 0.3802, "lr": 5.9780191661102415e-05, "epoch": 1.312, "percentage": 43.73, "elapsed_time": "1:56:30", "remaining_time": "2:29:54"}
83
+ {"current_steps": 830, "total_steps": 1875, "loss": 0.423, "lr": 5.8957282244179124e-05, "epoch": 1.328, "percentage": 44.27, "elapsed_time": "1:57:56", "remaining_time": "2:28:29"}
84
+ {"current_steps": 840, "total_steps": 1875, "loss": 0.3641, "lr": 5.813185825974419e-05, "epoch": 1.3439999999999999, "percentage": 44.8, "elapsed_time": "1:59:21", "remaining_time": "2:27:03"}
85
+ {"current_steps": 850, "total_steps": 1875, "loss": 0.3519, "lr": 5.730415142812059e-05, "epoch": 1.3599999999999999, "percentage": 45.33, "elapsed_time": "2:00:46", "remaining_time": "2:25:38"}
86
+ {"current_steps": 860, "total_steps": 1875, "loss": 0.3732, "lr": 5.6474394110492344e-05, "epoch": 1.376, "percentage": 45.87, "elapsed_time": "2:02:12", "remaining_time": "2:24:13"}
87
+ {"current_steps": 870, "total_steps": 1875, "loss": 0.3954, "lr": 5.564281924367408e-05, "epoch": 1.392, "percentage": 46.4, "elapsed_time": "2:03:37", "remaining_time": "2:22:48"}
88
+ {"current_steps": 880, "total_steps": 1875, "loss": 0.3669, "lr": 5.480966027471889e-05, "epoch": 1.408, "percentage": 46.93, "elapsed_time": "2:05:02", "remaining_time": "2:21:23"}
89
+ {"current_steps": 890, "total_steps": 1875, "loss": 0.3994, "lr": 5.3975151095382995e-05, "epoch": 1.424, "percentage": 47.47, "elapsed_time": "2:06:28", "remaining_time": "2:19:57"}
90
+ {"current_steps": 900, "total_steps": 1875, "loss": 0.3904, "lr": 5.313952597646568e-05, "epoch": 1.44, "percentage": 48.0, "elapsed_time": "2:07:53", "remaining_time": "2:18:32"}
91
+ {"current_steps": 910, "total_steps": 1875, "loss": 0.3821, "lr": 5.230301950204262e-05, "epoch": 1.456, "percentage": 48.53, "elapsed_time": "2:09:18", "remaining_time": "2:17:07"}
92
+ {"current_steps": 920, "total_steps": 1875, "loss": 0.3713, "lr": 5.1465866503611426e-05, "epoch": 1.472, "percentage": 49.07, "elapsed_time": "2:10:42", "remaining_time": "2:15:41"}
93
+ {"current_steps": 930, "total_steps": 1875, "loss": 0.3785, "lr": 5.062830199416764e-05, "epoch": 1.488, "percentage": 49.6, "elapsed_time": "2:12:07", "remaining_time": "2:14:14"}
94
+ {"current_steps": 940, "total_steps": 1875, "loss": 0.3851, "lr": 4.979056110222981e-05, "epoch": 1.504, "percentage": 50.13, "elapsed_time": "2:13:31", "remaining_time": "2:12:48"}
95
+ {"current_steps": 950, "total_steps": 1875, "loss": 0.3991, "lr": 4.895287900583216e-05, "epoch": 1.52, "percentage": 50.67, "elapsed_time": "2:14:55", "remaining_time": "2:11:22"}
96
+ {"current_steps": 960, "total_steps": 1875, "loss": 0.3726, "lr": 4.811549086650327e-05, "epoch": 1.536, "percentage": 51.2, "elapsed_time": "2:16:20", "remaining_time": "2:09:57"}
97
+ {"current_steps": 970, "total_steps": 1875, "loss": 0.3703, "lr": 4.7278631763249554e-05, "epoch": 1.552, "percentage": 51.73, "elapsed_time": "2:17:45", "remaining_time": "2:08:31"}
98
+ {"current_steps": 980, "total_steps": 1875, "loss": 0.3462, "lr": 4.6442536626561675e-05, "epoch": 1.568, "percentage": 52.27, "elapsed_time": "2:19:09", "remaining_time": "2:07:05"}
99
+ {"current_steps": 990, "total_steps": 1875, "loss": 0.3486, "lr": 4.560744017246284e-05, "epoch": 1.584, "percentage": 52.8, "elapsed_time": "2:20:34", "remaining_time": "2:05:39"}
100
+ {"current_steps": 1000, "total_steps": 1875, "loss": 0.3384, "lr": 4.477357683661734e-05, "epoch": 1.6, "percentage": 53.33, "elapsed_time": "2:21:58", "remaining_time": "2:04:13"}