sumuks commited on
Commit
03304dc
·
verified ·
1 Parent(s): b0f92f6

Training in progress, step 1000

Browse files
Files changed (2) hide show
  1. adapter_model.safetensors +1 -1
  2. trainer_log.jsonl +51 -0
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fed271f1467dfe2955d0a83d772e7bc039e67576a4a78e40af30f04d40064dc9
3
  size 645976488
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e566f00233423ca5ec760737c8a1a42e020c5dc60749098b2a8c30f994f86381
3
  size 645976488
trainer_log.jsonl CHANGED
@@ -48,3 +48,54 @@
48
  {"current_steps": 480, "total_steps": 3573, "loss": 1.3579, "lr": 4.982255937758657e-05, "epoch": 0.40302267002518893, "percentage": 13.43, "elapsed_time": "0:10:04", "remaining_time": "1:04:56"}
49
  {"current_steps": 490, "total_steps": 3573, "loss": 1.348, "lr": 4.9792320583495975e-05, "epoch": 0.41141897565071367, "percentage": 13.71, "elapsed_time": "0:10:16", "remaining_time": "1:04:41"}
50
  {"current_steps": 500, "total_steps": 3573, "loss": 1.3474, "lr": 4.975971449912952e-05, "epoch": 0.41981528127623846, "percentage": 13.99, "elapsed_time": "0:10:29", "remaining_time": "1:04:26"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
48
  {"current_steps": 480, "total_steps": 3573, "loss": 1.3579, "lr": 4.982255937758657e-05, "epoch": 0.40302267002518893, "percentage": 13.43, "elapsed_time": "0:10:04", "remaining_time": "1:04:56"}
49
  {"current_steps": 490, "total_steps": 3573, "loss": 1.348, "lr": 4.9792320583495975e-05, "epoch": 0.41141897565071367, "percentage": 13.71, "elapsed_time": "0:10:16", "remaining_time": "1:04:41"}
50
  {"current_steps": 500, "total_steps": 3573, "loss": 1.3474, "lr": 4.975971449912952e-05, "epoch": 0.41981528127623846, "percentage": 13.99, "elapsed_time": "0:10:29", "remaining_time": "1:04:26"}
51
+ {"current_steps": 510, "total_steps": 3573, "loss": 1.3609, "lr": 4.972474423787331e-05, "epoch": 0.4282115869017632, "percentage": 14.27, "elapsed_time": "0:11:08", "remaining_time": "1:06:56"}
52
+ {"current_steps": 520, "total_steps": 3573, "loss": 1.3829, "lr": 4.9687413138856446e-05, "epoch": 0.436607892527288, "percentage": 14.55, "elapsed_time": "0:11:20", "remaining_time": "1:06:38"}
53
+ {"current_steps": 530, "total_steps": 3573, "loss": 1.3554, "lr": 4.964772476663222e-05, "epoch": 0.4450041981528128, "percentage": 14.83, "elapsed_time": "0:11:33", "remaining_time": "1:06:20"}
54
+ {"current_steps": 540, "total_steps": 3573, "loss": 1.3515, "lr": 4.960568291083772e-05, "epoch": 0.4534005037783375, "percentage": 15.11, "elapsed_time": "0:11:45", "remaining_time": "1:06:02"}
55
+ {"current_steps": 550, "total_steps": 3573, "loss": 1.3547, "lr": 4.956129158583199e-05, "epoch": 0.4617968094038623, "percentage": 15.39, "elapsed_time": "0:11:57", "remaining_time": "1:05:44"}
56
+ {"current_steps": 560, "total_steps": 3573, "loss": 1.329, "lr": 4.951455503031271e-05, "epoch": 0.47019311502938704, "percentage": 15.67, "elapsed_time": "0:12:09", "remaining_time": "1:05:27"}
57
+ {"current_steps": 570, "total_steps": 3573, "loss": 1.3547, "lr": 4.946547770691152e-05, "epoch": 0.47858942065491183, "percentage": 15.95, "elapsed_time": "0:12:22", "remaining_time": "1:05:09"}
58
+ {"current_steps": 580, "total_steps": 3573, "loss": 1.3421, "lr": 4.9414064301767786e-05, "epoch": 0.4869857262804366, "percentage": 16.23, "elapsed_time": "0:12:34", "remaining_time": "1:04:52"}
59
+ {"current_steps": 590, "total_steps": 3573, "loss": 1.3576, "lr": 4.9360319724081285e-05, "epoch": 0.49538203190596136, "percentage": 16.51, "elapsed_time": "0:12:46", "remaining_time": "1:04:35"}
60
+ {"current_steps": 600, "total_steps": 3573, "loss": 1.3667, "lr": 4.930424910564334e-05, "epoch": 0.5037783375314862, "percentage": 16.79, "elapsed_time": "0:12:58", "remaining_time": "1:04:19"}
61
+ {"current_steps": 600, "total_steps": 3573, "eval_loss": 1.3807679414749146, "epoch": 0.5037783375314862, "percentage": 16.79, "elapsed_time": "0:13:36", "remaining_time": "1:07:24"}
62
+ {"current_steps": 610, "total_steps": 3573, "loss": 1.3504, "lr": 4.92458578003469e-05, "epoch": 0.5121746431570109, "percentage": 17.07, "elapsed_time": "0:13:48", "remaining_time": "1:07:04"}
63
+ {"current_steps": 620, "total_steps": 3573, "loss": 1.339, "lr": 4.9185151383675246e-05, "epoch": 0.5205709487825357, "percentage": 17.35, "elapsed_time": "0:14:00", "remaining_time": "1:06:44"}
64
+ {"current_steps": 630, "total_steps": 3573, "loss": 1.3358, "lr": 4.912213565216966e-05, "epoch": 0.5289672544080605, "percentage": 17.63, "elapsed_time": "0:14:12", "remaining_time": "1:06:24"}
65
+ {"current_steps": 640, "total_steps": 3573, "loss": 1.3708, "lr": 4.905681662287595e-05, "epoch": 0.5373635600335852, "percentage": 17.91, "elapsed_time": "0:14:25", "remaining_time": "1:06:05"}
66
+ {"current_steps": 650, "total_steps": 3573, "loss": 1.363, "lr": 4.898920053276989e-05, "epoch": 0.5457598656591099, "percentage": 18.19, "elapsed_time": "0:14:37", "remaining_time": "1:05:46"}
67
+ {"current_steps": 660, "total_steps": 3573, "loss": 1.3993, "lr": 4.891929383816169e-05, "epoch": 0.5541561712846348, "percentage": 18.47, "elapsed_time": "0:14:49", "remaining_time": "1:05:26"}
68
+ {"current_steps": 670, "total_steps": 3573, "loss": 1.351, "lr": 4.8847103214079524e-05, "epoch": 0.5625524769101595, "percentage": 18.75, "elapsed_time": "0:15:01", "remaining_time": "1:05:07"}
69
+ {"current_steps": 680, "total_steps": 3573, "loss": 1.3494, "lr": 4.877263555363216e-05, "epoch": 0.5709487825356843, "percentage": 19.03, "elapsed_time": "0:15:14", "remaining_time": "1:04:48"}
70
+ {"current_steps": 690, "total_steps": 3573, "loss": 1.3699, "lr": 4.869589796735078e-05, "epoch": 0.5793450881612091, "percentage": 19.31, "elapsed_time": "0:15:26", "remaining_time": "1:04:30"}
71
+ {"current_steps": 700, "total_steps": 3573, "loss": 1.3358, "lr": 4.8616897782510006e-05, "epoch": 0.5877413937867338, "percentage": 19.59, "elapsed_time": "0:15:38", "remaining_time": "1:04:12"}
72
+ {"current_steps": 710, "total_steps": 3573, "loss": 1.3417, "lr": 4.853564254242831e-05, "epoch": 0.5961376994122586, "percentage": 19.87, "elapsed_time": "0:15:50", "remaining_time": "1:03:54"}
73
+ {"current_steps": 720, "total_steps": 3573, "loss": 1.3633, "lr": 4.845214000574768e-05, "epoch": 0.6045340050377834, "percentage": 20.15, "elapsed_time": "0:16:03", "remaining_time": "1:03:36"}
74
+ {"current_steps": 730, "total_steps": 3573, "loss": 1.3582, "lr": 4.8366398145692824e-05, "epoch": 0.6129303106633082, "percentage": 20.43, "elapsed_time": "0:16:15", "remaining_time": "1:03:18"}
75
+ {"current_steps": 740, "total_steps": 3573, "loss": 1.3702, "lr": 4.827842514930985e-05, "epoch": 0.6213266162888329, "percentage": 20.71, "elapsed_time": "0:16:27", "remaining_time": "1:03:00"}
76
+ {"current_steps": 750, "total_steps": 3573, "loss": 1.3807, "lr": 4.81882294166845e-05, "epoch": 0.6297229219143576, "percentage": 20.99, "elapsed_time": "0:16:39", "remaining_time": "1:02:43"}
77
+ {"current_steps": 760, "total_steps": 3573, "loss": 1.3593, "lr": 4.8095819560140096e-05, "epoch": 0.6381192275398825, "percentage": 21.27, "elapsed_time": "0:16:51", "remaining_time": "1:02:25"}
78
+ {"current_steps": 770, "total_steps": 3573, "loss": 1.3583, "lr": 4.8001204403415204e-05, "epoch": 0.6465155331654072, "percentage": 21.55, "elapsed_time": "0:17:04", "remaining_time": "1:02:08"}
79
+ {"current_steps": 780, "total_steps": 3573, "loss": 1.3478, "lr": 4.7904392980821035e-05, "epoch": 0.654911838790932, "percentage": 21.83, "elapsed_time": "0:17:16", "remaining_time": "1:01:50"}
80
+ {"current_steps": 790, "total_steps": 3573, "loss": 1.361, "lr": 4.78053945363789e-05, "epoch": 0.6633081444164568, "percentage": 22.11, "elapsed_time": "0:17:28", "remaining_time": "1:01:33"}
81
+ {"current_steps": 800, "total_steps": 3573, "loss": 1.3445, "lr": 4.770421852293746e-05, "epoch": 0.6717044500419815, "percentage": 22.39, "elapsed_time": "0:17:40", "remaining_time": "1:01:17"}
82
+ {"current_steps": 810, "total_steps": 3573, "loss": 1.3328, "lr": 4.760087460127019e-05, "epoch": 0.6801007556675063, "percentage": 22.67, "elapsed_time": "0:17:53", "remaining_time": "1:01:00"}
83
+ {"current_steps": 820, "total_steps": 3573, "loss": 1.327, "lr": 4.749537263915288e-05, "epoch": 0.6884970612930311, "percentage": 22.95, "elapsed_time": "0:18:05", "remaining_time": "1:00:43"}
84
+ {"current_steps": 830, "total_steps": 3573, "loss": 1.3508, "lr": 4.7387722710421414e-05, "epoch": 0.6968933669185559, "percentage": 23.23, "elapsed_time": "0:18:17", "remaining_time": "1:00:26"}
85
+ {"current_steps": 840, "total_steps": 3573, "loss": 1.331, "lr": 4.7277935094009896e-05, "epoch": 0.7052896725440806, "percentage": 23.51, "elapsed_time": "0:18:29", "remaining_time": "1:00:09"}
86
+ {"current_steps": 850, "total_steps": 3573, "loss": 1.3398, "lr": 4.716602027296916e-05, "epoch": 0.7136859781696053, "percentage": 23.79, "elapsed_time": "0:18:41", "remaining_time": "0:59:53"}
87
+ {"current_steps": 860, "total_steps": 3573, "loss": 1.3557, "lr": 4.705198893346578e-05, "epoch": 0.7220822837951302, "percentage": 24.07, "elapsed_time": "0:18:53", "remaining_time": "0:59:36"}
88
+ {"current_steps": 870, "total_steps": 3573, "loss": 1.3422, "lr": 4.693585196376171e-05, "epoch": 0.7304785894206549, "percentage": 24.35, "elapsed_time": "0:19:05", "remaining_time": "0:59:20"}
89
+ {"current_steps": 880, "total_steps": 3573, "loss": 1.3767, "lr": 4.681762045317464e-05, "epoch": 0.7388748950461796, "percentage": 24.63, "elapsed_time": "0:19:18", "remaining_time": "0:59:03"}
90
+ {"current_steps": 890, "total_steps": 3573, "loss": 1.3459, "lr": 4.6697305691019105e-05, "epoch": 0.7472712006717045, "percentage": 24.91, "elapsed_time": "0:19:30", "remaining_time": "0:58:47"}
91
+ {"current_steps": 900, "total_steps": 3573, "loss": 1.3253, "lr": 4.6574919165528567e-05, "epoch": 0.7556675062972292, "percentage": 25.19, "elapsed_time": "0:19:42", "remaining_time": "0:58:31"}
92
+ {"current_steps": 910, "total_steps": 3573, "loss": 1.3419, "lr": 4.645047256275839e-05, "epoch": 0.764063811922754, "percentage": 25.47, "elapsed_time": "0:19:54", "remaining_time": "0:58:15"}
93
+ {"current_steps": 920, "total_steps": 3573, "loss": 1.3478, "lr": 4.632397776547011e-05, "epoch": 0.7724601175482787, "percentage": 25.75, "elapsed_time": "0:20:06", "remaining_time": "0:57:59"}
94
+ {"current_steps": 930, "total_steps": 3573, "loss": 1.3391, "lr": 4.619544685199669e-05, "epoch": 0.7808564231738035, "percentage": 26.03, "elapsed_time": "0:20:18", "remaining_time": "0:57:43"}
95
+ {"current_steps": 940, "total_steps": 3573, "loss": 1.3445, "lr": 4.6064892095089326e-05, "epoch": 0.7892527287993283, "percentage": 26.31, "elapsed_time": "0:20:30", "remaining_time": "0:57:27"}
96
+ {"current_steps": 950, "total_steps": 3573, "loss": 1.3167, "lr": 4.59323259607455e-05, "epoch": 0.797649034424853, "percentage": 26.59, "elapsed_time": "0:20:42", "remaining_time": "0:57:11"}
97
+ {"current_steps": 960, "total_steps": 3573, "loss": 1.3383, "lr": 4.5797761107018754e-05, "epoch": 0.8060453400503779, "percentage": 26.87, "elapsed_time": "0:20:54", "remaining_time": "0:56:55"}
98
+ {"current_steps": 970, "total_steps": 3573, "loss": 1.3404, "lr": 4.566121038280995e-05, "epoch": 0.8144416456759026, "percentage": 27.15, "elapsed_time": "0:21:07", "remaining_time": "0:56:40"}
99
+ {"current_steps": 980, "total_steps": 3573, "loss": 1.3333, "lr": 4.552268682664045e-05, "epoch": 0.8228379513014273, "percentage": 27.43, "elapsed_time": "0:21:19", "remaining_time": "0:56:24"}
100
+ {"current_steps": 990, "total_steps": 3573, "loss": 1.3182, "lr": 4.538220366540713e-05, "epoch": 0.8312342569269522, "percentage": 27.71, "elapsed_time": "0:21:31", "remaining_time": "0:56:09"}
101
+ {"current_steps": 1000, "total_steps": 3573, "loss": 1.3494, "lr": 4.52397743131194e-05, "epoch": 0.8396305625524769, "percentage": 27.99, "elapsed_time": "0:21:43", "remaining_time": "0:55:53"}