Text Generation
Safetensors
Chinese
English
conversational
Aurora / trainer_log.jsonl
wangrongsheng's picture
Upload 13 files
7981383
{"current_steps": 10100, "total_steps": 16548, "loss": 0.7798, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.6514942107947466e-05, "epoch": 1.83, "percentage": 61.03, "elapsed_time": "1:07:59", "remaining_time": "0:43:24"}
{"current_steps": 10200, "total_steps": 16548, "loss": 0.786, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.6070052506635487e-05, "epoch": 1.85, "percentage": 61.64, "elapsed_time": "2:16:17", "remaining_time": "1:24:49"}
{"current_steps": 10300, "total_steps": 16548, "loss": 0.7912, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.5628381339135647e-05, "epoch": 1.87, "percentage": 62.24, "elapsed_time": "3:24:38", "remaining_time": "2:04:08"}
{"current_steps": 10400, "total_steps": 16548, "loss": 0.7767, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.5190087787729873e-05, "epoch": 1.89, "percentage": 62.85, "elapsed_time": "4:32:38", "remaining_time": "2:41:10"}
{"current_steps": 10500, "total_steps": 16548, "loss": 0.7891, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.4755329817376672e-05, "epoch": 1.9, "percentage": 63.45, "elapsed_time": "5:40:49", "remaining_time": "3:16:19"}
{"current_steps": 10600, "total_steps": 16548, "loss": 0.7885, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.4324264118779218e-05, "epoch": 1.92, "percentage": 64.06, "elapsed_time": "6:49:27", "remaining_time": "3:49:45"}
{"current_steps": 10700, "total_steps": 16548, "loss": 0.7969, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.389704605191254e-05, "epoch": 1.94, "percentage": 64.66, "elapsed_time": "7:57:33", "remaining_time": "4:21:00"}
{"current_steps": 10800, "total_steps": 16548, "loss": 0.788, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.3473829590030412e-05, "epoch": 1.96, "percentage": 65.26, "elapsed_time": "9:05:45", "remaining_time": "4:50:27"}
{"current_steps": 10900, "total_steps": 16548, "loss": 0.7861, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.3054767264171989e-05, "epoch": 1.98, "percentage": 65.87, "elapsed_time": "10:14:07", "remaining_time": "5:18:13"}
{"current_steps": 11000, "total_steps": 16548, "loss": 0.7864, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.2640010108188234e-05, "epoch": 1.99, "percentage": 66.47, "elapsed_time": "11:22:31", "remaining_time": "5:44:14"}
{"current_steps": 11100, "total_steps": 16548, "loss": 0.7989, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.2229707604308002e-05, "epoch": 2.01, "percentage": 67.08, "elapsed_time": "12:30:42", "remaining_time": "6:08:27"}
{"current_steps": 11200, "total_steps": 16548, "loss": 0.7764, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.1824007629263217e-05, "epoch": 2.03, "percentage": 67.68, "elapsed_time": "13:39:17", "remaining_time": "6:31:12"}
{"current_steps": 11300, "total_steps": 16548, "loss": 0.7934, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.1423056400992816e-05, "epoch": 2.05, "percentage": 68.29, "elapsed_time": "14:47:57", "remaining_time": "6:52:23"}
{"current_steps": 11400, "total_steps": 16548, "loss": 0.786, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.1026998425944449e-05, "epoch": 2.07, "percentage": 68.89, "elapsed_time": "15:55:38", "remaining_time": "7:11:32"}
{"current_steps": 11500, "total_steps": 16548, "loss": 0.7922, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.0635976446993102e-05, "epoch": 2.08, "percentage": 69.49, "elapsed_time": "17:03:23", "remaining_time": "7:29:13"}
{"current_steps": 11600, "total_steps": 16548, "loss": 0.7842, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.02501313919952e-05, "epoch": 2.1, "percentage": 70.1, "elapsed_time": "18:11:23", "remaining_time": "7:45:32"}
{"current_steps": 11700, "total_steps": 16548, "loss": 0.7932, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.869602322996985e-06, "epoch": 2.12, "percentage": 70.7, "elapsed_time": "19:19:45", "remaining_time": "8:00:33"}
{"current_steps": 11800, "total_steps": 16548, "loss": 0.7754, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.494526386115285e-06, "epoch": 2.14, "percentage": 71.31, "elapsed_time": "20:28:09", "remaining_time": "8:14:10"}
{"current_steps": 11900, "total_steps": 16548, "loss": 0.7921, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.125038762108796e-06, "epoch": 2.16, "percentage": 71.91, "elapsed_time": "21:36:12", "remaining_time": "8:26:17"}
{"current_steps": 12000, "total_steps": 16548, "loss": 0.7935, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.76127261765777e-06, "epoch": 2.18, "percentage": 72.52, "elapsed_time": "22:43:56", "remaining_time": "8:36:56"}
{"current_steps": 12100, "total_steps": 16548, "loss": 0.7857, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.403359057369443e-06, "epoch": 2.19, "percentage": 73.12, "elapsed_time": "23:51:48", "remaining_time": "8:46:20"}
{"current_steps": 12200, "total_steps": 16548, "loss": 0.7884, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.05142707652685e-06, "epoch": 2.21, "percentage": 73.72, "elapsed_time": "1 day, 0:59:54", "remaining_time": "8:54:33"}
{"current_steps": 12300, "total_steps": 16548, "loss": 0.7896, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.705603514597697e-06, "epoch": 2.23, "percentage": 74.33, "elapsed_time": "1 day, 2:08:30", "remaining_time": "9:01:42"}
{"current_steps": 12400, "total_steps": 16548, "loss": 0.7823, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.366013009520287e-06, "epoch": 2.25, "percentage": 74.93, "elapsed_time": "1 day, 3:16:13", "remaining_time": "9:07:20"}
{"current_steps": 12500, "total_steps": 16548, "loss": 0.7743, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.032777952782879e-06, "epoch": 2.27, "percentage": 75.54, "elapsed_time": "1 day, 4:24:50", "remaining_time": "9:12:05"}
{"current_steps": 12600, "total_steps": 16548, "loss": 0.7912, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.7060184453127065e-06, "epoch": 2.28, "percentage": 76.14, "elapsed_time": "1 day, 5:32:19", "remaining_time": "9:15:19"}
{"current_steps": 12700, "total_steps": 16548, "loss": 0.7814, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.385852254190483e-06, "epoch": 2.3, "percentage": 76.75, "elapsed_time": "1 day, 6:40:35", "remaining_time": "9:17:41"}
{"current_steps": 12800, "total_steps": 16548, "loss": 0.7882, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.072394770206108e-06, "epoch": 2.32, "percentage": 77.35, "elapsed_time": "1 day, 7:48:48", "remaining_time": "9:18:55"}
{"current_steps": 12900, "total_steps": 16548, "loss": 0.7895, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.7657589662707655e-06, "epoch": 2.34, "percentage": 77.96, "elapsed_time": "1 day, 8:57:09", "remaining_time": "9:19:07"}
{"current_steps": 13000, "total_steps": 16548, "loss": 0.7872, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.4660553567005e-06, "epoch": 2.36, "percentage": 78.56, "elapsed_time": "1 day, 10:05:42", "remaining_time": "9:18:19"}
{"current_steps": 13100, "total_steps": 16548, "loss": 0.7932, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.173391957385812e-06, "epoch": 2.37, "percentage": 79.16, "elapsed_time": "1 day, 11:14:51", "remaining_time": "9:16:38"}
{"current_steps": 13200, "total_steps": 16548, "loss": 0.7979, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.887874246861776e-06, "epoch": 2.39, "percentage": 79.77, "elapsed_time": "1 day, 12:23:48", "remaining_time": "9:13:53"}
{"current_steps": 13300, "total_steps": 16548, "loss": 0.7816, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.609605128292627e-06, "epoch": 2.41, "percentage": 80.37, "elapsed_time": "1 day, 13:32:19", "remaining_time": "9:10:02"}
{"current_steps": 13400, "total_steps": 16548, "loss": 0.798, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.33868489238452e-06, "epoch": 2.43, "percentage": 80.98, "elapsed_time": "1 day, 14:40:15", "remaining_time": "9:05:05"}
{"current_steps": 13500, "total_steps": 16548, "loss": 0.7787, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.0752111812398825e-06, "epoch": 2.45, "percentage": 81.58, "elapsed_time": "1 day, 15:48:12", "remaining_time": "8:59:12"}
{"current_steps": 13600, "total_steps": 16548, "loss": 0.7929, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.819278953166247e-06, "epoch": 2.47, "percentage": 82.19, "elapsed_time": "1 day, 16:56:45", "remaining_time": "8:52:32"}
{"current_steps": 13700, "total_steps": 16548, "loss": 0.7856, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.570980448452507e-06, "epoch": 2.48, "percentage": 82.79, "elapsed_time": "1 day, 18:05:27", "remaining_time": "8:44:59"}
{"current_steps": 13800, "total_steps": 16548, "loss": 0.7891, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.3304051561246193e-06, "epoch": 2.5, "percentage": 83.39, "elapsed_time": "1 day, 19:13:47", "remaining_time": "8:36:30"}
{"current_steps": 13900, "total_steps": 16548, "loss": 0.7871, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.0976397816929847e-06, "epoch": 2.52, "percentage": 84.0, "elapsed_time": "1 day, 20:22:06", "remaining_time": "8:27:08"}
{"current_steps": 14000, "total_steps": 16548, "loss": 0.7771, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.872768215902963e-06, "epoch": 2.54, "percentage": 84.6, "elapsed_time": "1 day, 21:30:41", "remaining_time": "8:16:59"}
{"current_steps": 14100, "total_steps": 16548, "loss": 0.7852, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.6558715044999407e-06, "epoch": 2.56, "percentage": 85.21, "elapsed_time": "1 day, 22:39:11", "remaining_time": "8:05:59"}
{"current_steps": 14200, "total_steps": 16548, "loss": 0.7848, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.4470278190196565e-06, "epoch": 2.57, "percentage": 85.81, "elapsed_time": "1 day, 23:47:32", "remaining_time": "7:54:09"}
{"current_steps": 14300, "total_steps": 16548, "loss": 0.7832, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.246312428614519e-06, "epoch": 2.59, "percentage": 86.42, "elapsed_time": "2 days, 1:03:36", "remaining_time": "7:42:44"}
{"current_steps": 14400, "total_steps": 16548, "loss": 0.7903, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.0537976729258834e-06, "epoch": 2.61, "percentage": 87.02, "elapsed_time": "2 days, 2:12:23", "remaining_time": "7:29:20"}
{"current_steps": 14500, "total_steps": 16548, "loss": 0.7787, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.8695529360122367e-06, "epoch": 2.63, "percentage": 87.62, "elapsed_time": "2 days, 3:21:24", "remaining_time": "7:15:13"}
{"current_steps": 14600, "total_steps": 16548, "loss": 0.7867, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.6936446213425079e-06, "epoch": 2.65, "percentage": 88.23, "elapsed_time": "2 days, 4:30:24", "remaining_time": "7:00:20"}
{"current_steps": 14700, "total_steps": 16548, "loss": 0.7915, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.5261361278636949e-06, "epoch": 2.66, "percentage": 88.83, "elapsed_time": "2 days, 5:39:16", "remaining_time": "6:44:42"}
{"current_steps": 14800, "total_steps": 16548, "loss": 0.7798, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.367087827151284e-06, "epoch": 2.68, "percentage": 89.44, "elapsed_time": "2 days, 6:47:40", "remaining_time": "6:28:18"}
{"current_steps": 14900, "total_steps": 16548, "loss": 0.78, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.2165570416508038e-06, "epoch": 2.7, "percentage": 90.04, "elapsed_time": "2 days, 7:56:27", "remaining_time": "6:11:14"}
{"current_steps": 15000, "total_steps": 16548, "loss": 0.7942, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.074598024018303e-06, "epoch": 2.72, "percentage": 90.65, "elapsed_time": "2 days, 9:04:47", "remaining_time": "5:53:26"}
{"current_steps": 15100, "total_steps": 16548, "loss": 0.7871, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.412619375671838e-07, "epoch": 2.74, "percentage": 91.25, "elapsed_time": "2 days, 10:13:09", "remaining_time": "5:34:58"}
{"current_steps": 15200, "total_steps": 16548, "loss": 0.7874, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.165968378284899e-07, "epoch": 2.76, "percentage": 91.85, "elapsed_time": "2 days, 11:21:29", "remaining_time": "5:15:50"}
{"current_steps": 15300, "total_steps": 16548, "loss": 0.8047, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.006476552312597e-07, "epoch": 2.77, "percentage": 92.46, "elapsed_time": "2 days, 12:29:53", "remaining_time": "4:56:05"}
{"current_steps": 15400, "total_steps": 16548, "loss": 0.7972, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.934561789092075e-07, "epoch": 2.79, "percentage": 93.06, "elapsed_time": "2 days, 13:38:20", "remaining_time": "4:35:41"}
{"current_steps": 15500, "total_steps": 16548, "loss": 0.7809, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.950610416395052e-07, "epoch": 2.81, "percentage": 93.67, "elapsed_time": "2 days, 14:47:01", "remaining_time": "4:14:41"}
{"current_steps": 15600, "total_steps": 16548, "loss": 0.7863, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.0549770591921944e-07, "epoch": 2.83, "percentage": 94.27, "elapsed_time": "2 days, 15:55:42", "remaining_time": "3:53:05"}
{"current_steps": 15700, "total_steps": 16548, "loss": 0.7823, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.2479845118428556e-07, "epoch": 2.85, "percentage": 94.88, "elapsed_time": "2 days, 17:04:06", "remaining_time": "3:30:52"}
{"current_steps": 15800, "total_steps": 16548, "loss": 0.7795, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.529923621757052e-07, "epoch": 2.86, "percentage": 95.48, "elapsed_time": "2 days, 18:12:29", "remaining_time": "3:08:03"}
{"current_steps": 15900, "total_steps": 16548, "loss": 0.7921, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.901053184571594e-07, "epoch": 2.88, "percentage": 96.08, "elapsed_time": "2 days, 19:20:22", "remaining_time": "2:44:39"}
{"current_steps": 16000, "total_steps": 16548, "loss": 0.7846, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.361599850877665e-07, "epoch": 2.9, "percentage": 96.69, "elapsed_time": "2 days, 20:29:03", "remaining_time": "2:20:44"}
{"current_steps": 16100, "total_steps": 16548, "loss": 0.7781, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.117580445338892e-08, "epoch": 2.92, "percentage": 97.29, "elapsed_time": "2 days, 21:37:43", "remaining_time": "1:56:14"}
{"current_steps": 16200, "total_steps": 16548, "loss": 0.7865, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.5168989259429816e-08, "epoch": 2.94, "percentage": 97.9, "elapsed_time": "2 days, 22:45:51", "remaining_time": "1:31:12"}
{"current_steps": 16300, "total_steps": 16548, "loss": 0.7831, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.81525166876212e-08, "epoch": 2.95, "percentage": 98.5, "elapsed_time": "2 days, 23:53:55", "remaining_time": "1:05:38"}
{"current_steps": 16400, "total_steps": 16548, "loss": 0.7788, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.01361237189318e-08, "epoch": 2.97, "percentage": 99.11, "elapsed_time": "3 days, 1:02:52", "remaining_time": "0:39:33"}
{"current_steps": 16500, "total_steps": 16548, "loss": 0.7937, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.1263036242797898e-09, "epoch": 2.99, "percentage": 99.71, "elapsed_time": "3 days, 2:11:01", "remaining_time": "0:12:56"}
{"current_steps": 16548, "total_steps": 16548, "loss": null, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "3 days, 2:43:51", "remaining_time": "0:00:00"}