vapo_lora_all_data_iter_2 / trainer_log.jsonl
DongfuJiang's picture
Upload trainer_log.jsonl with huggingface_hub
dbad76e verified
{"current_steps": 5, "total_steps": 88, "loss": 0.8881, "accuracy": 1.0, "learning_rate": 2.7777777777777783e-06, "epoch": 0.05653710247349823, "percentage": 5.68, "elapsed_time": "0:02:05", "remaining_time": "0:34:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 10, "total_steps": 88, "loss": 0.8913, "accuracy": 1.0, "learning_rate": 4.998023493068255e-06, "epoch": 0.11307420494699646, "percentage": 11.36, "elapsed_time": "0:04:22", "remaining_time": "0:34:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 15, "total_steps": 88, "loss": 0.8848, "accuracy": 1.0, "learning_rate": 4.929173350101025e-06, "epoch": 0.1696113074204947, "percentage": 17.05, "elapsed_time": "0:06:31", "remaining_time": "0:31:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 20, "total_steps": 88, "loss": 0.8808, "accuracy": 1.0, "learning_rate": 4.764600984163809e-06, "epoch": 0.22614840989399293, "percentage": 22.73, "elapsed_time": "0:08:41", "remaining_time": "0:29:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 25, "total_steps": 88, "loss": 0.8694, "accuracy": 0.987500011920929, "learning_rate": 4.510791413176912e-06, "epoch": 0.2826855123674912, "percentage": 28.41, "elapsed_time": "0:10:54", "remaining_time": "0:27:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 30, "total_steps": 88, "loss": 0.864, "accuracy": 1.0, "learning_rate": 4.177746070897593e-06, "epoch": 0.3392226148409894, "percentage": 34.09, "elapsed_time": "0:12:58", "remaining_time": "0:25:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 35, "total_steps": 88, "loss": 0.8575, "accuracy": 0.9750000238418579, "learning_rate": 3.7785886977585562e-06, "epoch": 0.3957597173144876, "percentage": 39.77, "elapsed_time": "0:14:55", "remaining_time": "0:22:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 40, "total_steps": 88, "loss": 0.853, "accuracy": 0.987500011920929, "learning_rate": 3.32904819638017e-06, "epoch": 0.45229681978798586, "percentage": 45.45, "elapsed_time": "0:17:05", "remaining_time": "0:20:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 45, "total_steps": 88, "loss": 0.8404, "accuracy": 1.0, "learning_rate": 2.8468388299726714e-06, "epoch": 0.508833922261484, "percentage": 51.14, "elapsed_time": "0:19:11", "remaining_time": "0:18:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 50, "total_steps": 88, "loss": 0.8421, "accuracy": 1.0, "learning_rate": 2.3509621870754505e-06, "epoch": 0.5653710247349824, "percentage": 56.82, "elapsed_time": "0:21:13", "remaining_time": "0:16:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 55, "total_steps": 88, "loss": 0.8195, "accuracy": 1.0, "learning_rate": 1.8609584188988135e-06, "epoch": 0.6219081272084805, "percentage": 62.5, "elapsed_time": "0:23:29", "remaining_time": "0:14:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 60, "total_steps": 88, "loss": 0.825, "accuracy": 1.0, "learning_rate": 1.3961362544602215e-06, "epoch": 0.6784452296819788, "percentage": 68.18, "elapsed_time": "0:25:35", "remaining_time": "0:11:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 65, "total_steps": 88, "loss": 0.8111, "accuracy": 0.987500011920929, "learning_rate": 9.74812134973689e-07, "epoch": 0.734982332155477, "percentage": 73.86, "elapsed_time": "0:27:40", "remaining_time": "0:09:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 70, "total_steps": 88, "loss": 0.8105, "accuracy": 1.0, "learning_rate": 6.135884496044245e-07, "epoch": 0.7915194346289752, "percentage": 79.55, "elapsed_time": "0:29:47", "remaining_time": "0:07:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 75, "total_steps": 88, "loss": 0.798, "accuracy": 0.987500011920929, "learning_rate": 3.266993139010438e-07, "epoch": 0.8480565371024735, "percentage": 85.23, "elapsed_time": "0:31:59", "remaining_time": "0:05:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 80, "total_steps": 88, "loss": 0.81, "accuracy": 0.987500011920929, "learning_rate": 1.2544967068054332e-07, "epoch": 0.9045936395759717, "percentage": 90.91, "elapsed_time": "0:34:06", "remaining_time": "0:03:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 85, "total_steps": 88, "loss": 0.8108, "accuracy": 0.987500011920929, "learning_rate": 1.7769815745066476e-08, "epoch": 0.9611307420494699, "percentage": 96.59, "elapsed_time": "0:36:18", "remaining_time": "0:01:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 88, "total_steps": 88, "epoch": 0.995053003533569, "percentage": 100.0, "elapsed_time": "0:37:39", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}