{ "best_metric": null, "best_model_checkpoint": null, "epoch": 167.0, "eval_steps": 2500, "global_step": 30060, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.28, "learning_rate": 3.060545575515636e-07, "loss": 19.8566, "step": 50 }, { "epoch": 0.56, "learning_rate": 6.187624750499002e-07, "loss": 20.7169, "step": 100 }, { "epoch": 0.83, "learning_rate": 9.31470392548237e-07, "loss": 20.377, "step": 150 }, { "epoch": 1.11, "learning_rate": 1.2508316699933468e-06, "loss": 20.2675, "step": 200 }, { "epoch": 1.39, "learning_rate": 1.5701929474384566e-06, "loss": 19.7473, "step": 250 }, { "epoch": 1.67, "learning_rate": 1.862940785096474e-06, "loss": 18.7224, "step": 300 }, { "epoch": 1.94, "learning_rate": 2.1823020625415835e-06, "loss": 18.1483, "step": 350 }, { "epoch": 2.22, "learning_rate": 2.5016633399866937e-06, "loss": 17.4886, "step": 400 }, { "epoch": 2.5, "learning_rate": 2.801064537591484e-06, "loss": 17.7605, "step": 450 }, { "epoch": 2.78, "learning_rate": 3.127079174983367e-06, "loss": 17.7922, "step": 500 }, { "epoch": 3.06, "learning_rate": 3.4464404524284766e-06, "loss": 17.5965, "step": 550 }, { "epoch": 3.33, "learning_rate": 3.7658017298735864e-06, "loss": 17.9381, "step": 600 }, { "epoch": 3.61, "learning_rate": 4.078509647371924e-06, "loss": 17.1456, "step": 650 }, { "epoch": 3.89, "learning_rate": 4.4045242847638055e-06, "loss": 17.705, "step": 700 }, { "epoch": 4.17, "learning_rate": 4.703925482368596e-06, "loss": 17.0541, "step": 750 }, { "epoch": 4.44, "learning_rate": 5.023286759813706e-06, "loss": 17.998, "step": 800 }, { "epoch": 4.72, "learning_rate": 5.32934131736527e-06, "loss": 17.9034, "step": 850 }, { "epoch": 5.0, "learning_rate": 5.642049234863607e-06, "loss": 16.9998, "step": 900 }, { "epoch": 5.28, "learning_rate": 5.928143712574851e-06, "loss": 17.4889, "step": 950 }, { "epoch": 5.56, "learning_rate": 6.254158349966734e-06, "loss": 17.1789, "step": 1000 }, { "epoch": 5.83, "learning_rate": 6.5801729873586165e-06, "loss": 17.7747, "step": 1050 }, { "epoch": 6.11, "learning_rate": 6.899534264803727e-06, "loss": 17.4186, "step": 1100 }, { "epoch": 6.39, "learning_rate": 7.198935462408517e-06, "loss": 17.1787, "step": 1150 }, { "epoch": 6.67, "learning_rate": 7.518296739853627e-06, "loss": 17.7217, "step": 1200 }, { "epoch": 6.94, "learning_rate": 7.844311377245509e-06, "loss": 17.8271, "step": 1250 }, { "epoch": 7.22, "learning_rate": 8.16367265469062e-06, "loss": 17.8748, "step": 1300 }, { "epoch": 7.5, "learning_rate": 8.476380572188956e-06, "loss": 17.1441, "step": 1350 }, { "epoch": 7.78, "learning_rate": 8.802395209580839e-06, "loss": 17.5028, "step": 1400 }, { "epoch": 8.06, "learning_rate": 9.10179640718563e-06, "loss": 17.6395, "step": 1450 }, { "epoch": 8.33, "learning_rate": 9.427811044577513e-06, "loss": 17.7263, "step": 1500 }, { "epoch": 8.61, "learning_rate": 9.72055888223553e-06, "loss": 17.5629, "step": 1550 }, { "epoch": 8.89, "learning_rate": 1.0046573519627412e-05, "loss": 17.3875, "step": 1600 }, { "epoch": 9.17, "learning_rate": 1.0372588157019297e-05, "loss": 17.6111, "step": 1650 }, { "epoch": 9.44, "learning_rate": 1.0685296074517632e-05, "loss": 17.3748, "step": 1700 }, { "epoch": 9.72, "learning_rate": 1.0998003992015969e-05, "loss": 17.0905, "step": 1750 }, { "epoch": 10.0, "learning_rate": 1.1310711909514306e-05, "loss": 17.9498, "step": 1800 }, { "epoch": 10.28, "learning_rate": 1.1630073186959416e-05, "loss": 18.0702, "step": 1850 }, { "epoch": 10.56, "learning_rate": 1.1929474384564205e-05, "loss": 17.0911, "step": 1900 }, { "epoch": 10.83, "learning_rate": 1.2242182302062542e-05, "loss": 17.8286, "step": 1950 }, { "epoch": 11.11, "learning_rate": 1.2568196939454425e-05, "loss": 17.4852, "step": 2000 }, { "epoch": 11.39, "learning_rate": 1.2880904856952763e-05, "loss": 17.8215, "step": 2050 }, { "epoch": 11.67, "learning_rate": 1.3206919494344646e-05, "loss": 17.0628, "step": 2100 }, { "epoch": 11.94, "learning_rate": 1.3519627411842981e-05, "loss": 17.4526, "step": 2150 }, { "epoch": 12.22, "learning_rate": 1.3832335329341318e-05, "loss": 17.7588, "step": 2200 }, { "epoch": 12.5, "learning_rate": 1.4131736526946109e-05, "loss": 17.0106, "step": 2250 }, { "epoch": 12.78, "learning_rate": 1.4464404524284766e-05, "loss": 18.0131, "step": 2300 }, { "epoch": 13.06, "learning_rate": 1.4763805721889555e-05, "loss": 17.2767, "step": 2350 }, { "epoch": 13.33, "learning_rate": 1.5083166999334667e-05, "loss": 17.6692, "step": 2400 }, { "epoch": 13.61, "learning_rate": 1.5395874916833004e-05, "loss": 17.5548, "step": 2450 }, { "epoch": 13.89, "learning_rate": 1.5715236194278113e-05, "loss": 17.348, "step": 2500 }, { "epoch": 13.89, "eval_loss": 26.116436004638672, "eval_runtime": 6.8523, "eval_samples_per_second": 207.228, "eval_steps_per_second": 12.988, "eval_wer": 1.0, "step": 2500 }, { "epoch": 14.17, "learning_rate": 1.6034597471723222e-05, "loss": 17.1037, "step": 2550 }, { "epoch": 14.44, "learning_rate": 1.635395874916833e-05, "loss": 17.4847, "step": 2600 }, { "epoch": 14.72, "learning_rate": 1.6553559547571525e-05, "loss": 17.0939, "step": 2650 }, { "epoch": 15.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 2700 }, { "epoch": 15.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 2750 }, { "epoch": 15.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 2800 }, { "epoch": 15.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 2850 }, { "epoch": 16.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 2900 }, { "epoch": 16.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 2950 }, { "epoch": 16.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 3000 }, { "epoch": 16.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 3050 }, { "epoch": 17.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 3100 }, { "epoch": 17.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 3150 }, { "epoch": 17.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 3200 }, { "epoch": 18.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 3250 }, { "epoch": 18.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 3300 }, { "epoch": 18.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 3350 }, { "epoch": 18.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 3400 }, { "epoch": 19.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 3450 }, { "epoch": 19.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 3500 }, { "epoch": 19.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 3550 }, { "epoch": 20.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 3600 }, { "epoch": 20.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 3650 }, { "epoch": 20.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 3700 }, { "epoch": 20.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 3750 }, { "epoch": 21.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 3800 }, { "epoch": 21.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 3850 }, { "epoch": 21.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 3900 }, { "epoch": 21.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 3950 }, { "epoch": 22.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 4000 }, { "epoch": 22.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 4050 }, { "epoch": 22.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 4100 }, { "epoch": 23.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 4150 }, { "epoch": 23.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 4200 }, { "epoch": 23.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 4250 }, { "epoch": 23.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 4300 }, { "epoch": 24.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 4350 }, { "epoch": 24.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 4400 }, { "epoch": 24.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 4450 }, { "epoch": 25.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 4500 }, { "epoch": 25.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 4550 }, { "epoch": 25.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 4600 }, { "epoch": 25.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 4650 }, { "epoch": 26.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 4700 }, { "epoch": 26.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 4750 }, { "epoch": 26.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 4800 }, { "epoch": 26.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 4850 }, { "epoch": 27.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 4900 }, { "epoch": 27.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 4950 }, { "epoch": 27.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 5000 }, { "epoch": 27.78, "eval_loss": NaN, "eval_runtime": 5.8183, "eval_samples_per_second": 244.06, "eval_steps_per_second": 15.297, "eval_wer": 1.0, "step": 5000 }, { "epoch": 28.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 5050 }, { "epoch": 28.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 5100 }, { "epoch": 28.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 5150 }, { "epoch": 28.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 5200 }, { "epoch": 29.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 5250 }, { "epoch": 29.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 5300 }, { "epoch": 29.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 5350 }, { "epoch": 30.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 5400 }, { "epoch": 30.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 5450 }, { "epoch": 30.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 5500 }, { "epoch": 30.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 5550 }, { "epoch": 31.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 5600 }, { "epoch": 31.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 5650 }, { "epoch": 31.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 5700 }, { "epoch": 31.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 5750 }, { "epoch": 32.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 5800 }, { "epoch": 32.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 5850 }, { "epoch": 32.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 5900 }, { "epoch": 33.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 5950 }, { "epoch": 33.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 6000 }, { "epoch": 33.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 6050 }, { "epoch": 33.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 6100 }, { "epoch": 34.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 6150 }, { "epoch": 34.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 6200 }, { "epoch": 34.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 6250 }, { "epoch": 35.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 6300 }, { "epoch": 35.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 6350 }, { "epoch": 35.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 6400 }, { "epoch": 35.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 6450 }, { "epoch": 36.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 6500 }, { "epoch": 36.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 6550 }, { "epoch": 36.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 6600 }, { "epoch": 36.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 6650 }, { "epoch": 37.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 6700 }, { "epoch": 37.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 6750 }, { "epoch": 37.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 6800 }, { "epoch": 38.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 6850 }, { "epoch": 38.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 6900 }, { "epoch": 38.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 6950 }, { "epoch": 38.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 7000 }, { "epoch": 39.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 7050 }, { "epoch": 39.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 7100 }, { "epoch": 39.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 7150 }, { "epoch": 40.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 7200 }, { "epoch": 40.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 7250 }, { "epoch": 40.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 7300 }, { "epoch": 40.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 7350 }, { "epoch": 41.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 7400 }, { "epoch": 41.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 7450 }, { "epoch": 41.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 7500 }, { "epoch": 41.67, "eval_loss": NaN, "eval_runtime": 5.5711, "eval_samples_per_second": 254.885, "eval_steps_per_second": 15.975, "eval_wer": 1.0, "step": 7500 }, { "epoch": 41.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 7550 }, { "epoch": 42.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 7600 }, { "epoch": 42.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 7650 }, { "epoch": 42.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 7700 }, { "epoch": 43.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 7750 }, { "epoch": 43.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 7800 }, { "epoch": 43.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 7850 }, { "epoch": 43.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 7900 }, { "epoch": 44.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 7950 }, { "epoch": 44.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 8000 }, { "epoch": 44.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 8050 }, { "epoch": 45.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 8100 }, { "epoch": 45.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 8150 }, { "epoch": 45.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 8200 }, { "epoch": 45.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 8250 }, { "epoch": 46.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 8300 }, { "epoch": 46.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 8350 }, { "epoch": 46.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 8400 }, { "epoch": 46.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 8450 }, { "epoch": 47.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 8500 }, { "epoch": 47.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 8550 }, { "epoch": 47.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 8600 }, { "epoch": 48.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 8650 }, { "epoch": 48.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 8700 }, { "epoch": 48.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 8750 }, { "epoch": 48.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 8800 }, { "epoch": 49.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 8850 }, { "epoch": 49.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 8900 }, { "epoch": 49.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 8950 }, { "epoch": 50.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 9000 }, { "epoch": 50.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 9050 }, { "epoch": 50.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 9100 }, { "epoch": 50.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 9150 }, { "epoch": 51.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 9200 }, { "epoch": 51.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 9250 }, { "epoch": 51.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 9300 }, { "epoch": 51.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 9350 }, { "epoch": 52.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 9400 }, { "epoch": 52.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 9450 }, { "epoch": 52.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 9500 }, { "epoch": 53.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 9550 }, { "epoch": 53.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 9600 }, { "epoch": 53.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 9650 }, { "epoch": 53.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 9700 }, { "epoch": 54.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 9750 }, { "epoch": 54.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 9800 }, { "epoch": 54.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 9850 }, { "epoch": 55.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 9900 }, { "epoch": 55.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 9950 }, { "epoch": 55.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 10000 }, { "epoch": 55.56, "eval_loss": NaN, "eval_runtime": 5.5572, "eval_samples_per_second": 255.523, "eval_steps_per_second": 16.015, "eval_wer": 1.0, "step": 10000 }, { "epoch": 55.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 10050 }, { "epoch": 56.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 10100 }, { "epoch": 56.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 10150 }, { "epoch": 56.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 10200 }, { "epoch": 56.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 10250 }, { "epoch": 57.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 10300 }, { "epoch": 57.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 10350 }, { "epoch": 57.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 10400 }, { "epoch": 58.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 10450 }, { "epoch": 58.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 10500 }, { "epoch": 58.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 10550 }, { "epoch": 58.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 10600 }, { "epoch": 59.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 10650 }, { "epoch": 59.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 10700 }, { "epoch": 59.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 10750 }, { "epoch": 60.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 10800 }, { "epoch": 60.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 10850 }, { "epoch": 60.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 10900 }, { "epoch": 60.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 10950 }, { "epoch": 61.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 11000 }, { "epoch": 61.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 11050 }, { "epoch": 61.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 11100 }, { "epoch": 61.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 11150 }, { "epoch": 62.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 11200 }, { "epoch": 62.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 11250 }, { "epoch": 62.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 11300 }, { "epoch": 63.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 11350 }, { "epoch": 63.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 11400 }, { "epoch": 63.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 11450 }, { "epoch": 63.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 11500 }, { "epoch": 64.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 11550 }, { "epoch": 64.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 11600 }, { "epoch": 64.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 11650 }, { "epoch": 65.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 11700 }, { "epoch": 65.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 11750 }, { "epoch": 65.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 11800 }, { "epoch": 65.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 11850 }, { "epoch": 66.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 11900 }, { "epoch": 66.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 11950 }, { "epoch": 66.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 12000 }, { "epoch": 66.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 12050 }, { "epoch": 67.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 12100 }, { "epoch": 67.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 12150 }, { "epoch": 67.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 12200 }, { "epoch": 68.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 12250 }, { "epoch": 68.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 12300 }, { "epoch": 68.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 12350 }, { "epoch": 68.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 12400 }, { "epoch": 69.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 12450 }, { "epoch": 69.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 12500 }, { "epoch": 69.44, "eval_loss": NaN, "eval_runtime": 5.6675, "eval_samples_per_second": 250.554, "eval_steps_per_second": 15.704, "eval_wer": 1.0, "step": 12500 }, { "epoch": 69.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 12550 }, { "epoch": 70.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 12600 }, { "epoch": 70.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 12650 }, { "epoch": 70.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 12700 }, { "epoch": 70.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 12750 }, { "epoch": 71.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 12800 }, { "epoch": 71.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 12850 }, { "epoch": 71.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 12900 }, { "epoch": 71.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 12950 }, { "epoch": 72.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 13000 }, { "epoch": 72.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 13050 }, { "epoch": 72.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 13100 }, { "epoch": 73.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 13150 }, { "epoch": 73.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 13200 }, { "epoch": 73.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 13250 }, { "epoch": 73.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 13300 }, { "epoch": 74.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 13350 }, { "epoch": 74.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 13400 }, { "epoch": 74.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 13450 }, { "epoch": 75.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 13500 }, { "epoch": 75.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 13550 }, { "epoch": 75.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 13600 }, { "epoch": 75.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 13650 }, { "epoch": 76.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 13700 }, { "epoch": 76.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 13750 }, { "epoch": 76.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 13800 }, { "epoch": 76.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 13850 }, { "epoch": 77.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 13900 }, { "epoch": 77.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 13950 }, { "epoch": 77.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 14000 }, { "epoch": 78.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 14050 }, { "epoch": 78.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 14100 }, { "epoch": 78.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 14150 }, { "epoch": 78.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 14200 }, { "epoch": 79.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 14250 }, { "epoch": 79.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 14300 }, { "epoch": 79.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 14350 }, { "epoch": 80.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 14400 }, { "epoch": 80.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 14450 }, { "epoch": 80.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 14500 }, { "epoch": 80.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 14550 }, { "epoch": 81.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 14600 }, { "epoch": 81.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 14650 }, { "epoch": 81.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 14700 }, { "epoch": 81.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 14750 }, { "epoch": 82.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 14800 }, { "epoch": 82.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 14850 }, { "epoch": 82.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 14900 }, { "epoch": 83.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 14950 }, { "epoch": 83.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 15000 }, { "epoch": 83.33, "eval_loss": NaN, "eval_runtime": 5.6544, "eval_samples_per_second": 251.132, "eval_steps_per_second": 15.74, "eval_wer": 1.0, "step": 15000 }, { "epoch": 83.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 15050 }, { "epoch": 83.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 15100 }, { "epoch": 84.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 15150 }, { "epoch": 84.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 15200 }, { "epoch": 84.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 15250 }, { "epoch": 85.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 15300 }, { "epoch": 85.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 15350 }, { "epoch": 85.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 15400 }, { "epoch": 85.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 15450 }, { "epoch": 86.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 15500 }, { "epoch": 86.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 15550 }, { "epoch": 86.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 15600 }, { "epoch": 86.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 15650 }, { "epoch": 87.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 15700 }, { "epoch": 87.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 15750 }, { "epoch": 87.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 15800 }, { "epoch": 88.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 15850 }, { "epoch": 88.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 15900 }, { "epoch": 88.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 15950 }, { "epoch": 88.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 16000 }, { "epoch": 89.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 16050 }, { "epoch": 89.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 16100 }, { "epoch": 89.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 16150 }, { "epoch": 90.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 16200 }, { "epoch": 90.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 16250 }, { "epoch": 90.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 16300 }, { "epoch": 90.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 16350 }, { "epoch": 91.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 16400 }, { "epoch": 91.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 16450 }, { "epoch": 91.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 16500 }, { "epoch": 91.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 16550 }, { "epoch": 92.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 16600 }, { "epoch": 92.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 16650 }, { "epoch": 92.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 16700 }, { "epoch": 93.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 16750 }, { "epoch": 93.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 16800 }, { "epoch": 93.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 16850 }, { "epoch": 93.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 16900 }, { "epoch": 94.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 16950 }, { "epoch": 94.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 17000 }, { "epoch": 94.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 17050 }, { "epoch": 95.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 17100 }, { "epoch": 95.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 17150 }, { "epoch": 95.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 17200 }, { "epoch": 95.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 17250 }, { "epoch": 96.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 17300 }, { "epoch": 96.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 17350 }, { "epoch": 96.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 17400 }, { "epoch": 96.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 17450 }, { "epoch": 97.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 17500 }, { "epoch": 97.22, "eval_loss": NaN, "eval_runtime": 5.6567, "eval_samples_per_second": 251.03, "eval_steps_per_second": 15.734, "eval_wer": 1.0, "step": 17500 }, { "epoch": 97.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 17550 }, { "epoch": 97.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 17600 }, { "epoch": 98.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 17650 }, { "epoch": 98.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 17700 }, { "epoch": 98.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 17750 }, { "epoch": 98.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 17800 }, { "epoch": 99.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 17850 }, { "epoch": 99.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 17900 }, { "epoch": 99.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 17950 }, { "epoch": 100.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 18000 }, { "epoch": 100.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 18050 }, { "epoch": 100.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 18100 }, { "epoch": 100.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 18150 }, { "epoch": 101.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 18200 }, { "epoch": 101.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 18250 }, { "epoch": 101.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 18300 }, { "epoch": 101.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 18350 }, { "epoch": 102.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 18400 }, { "epoch": 102.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 18450 }, { "epoch": 102.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 18500 }, { "epoch": 103.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 18550 }, { "epoch": 103.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 18600 }, { "epoch": 103.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 18650 }, { "epoch": 103.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 18700 }, { "epoch": 104.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 18750 }, { "epoch": 104.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 18800 }, { "epoch": 104.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 18850 }, { "epoch": 105.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 18900 }, { "epoch": 105.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 18950 }, { "epoch": 105.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 19000 }, { "epoch": 105.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 19050 }, { "epoch": 106.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 19100 }, { "epoch": 106.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 19150 }, { "epoch": 106.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 19200 }, { "epoch": 106.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 19250 }, { "epoch": 107.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 19300 }, { "epoch": 107.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 19350 }, { "epoch": 107.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 19400 }, { "epoch": 108.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 19450 }, { "epoch": 108.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 19500 }, { "epoch": 108.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 19550 }, { "epoch": 108.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 19600 }, { "epoch": 109.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 19650 }, { "epoch": 109.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 19700 }, { "epoch": 109.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 19750 }, { "epoch": 110.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 19800 }, { "epoch": 110.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 19850 }, { "epoch": 110.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 19900 }, { "epoch": 110.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 19950 }, { "epoch": 111.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 20000 }, { "epoch": 111.11, "eval_loss": NaN, "eval_runtime": 5.6012, "eval_samples_per_second": 253.518, "eval_steps_per_second": 15.889, "eval_wer": 1.0, "step": 20000 }, { "epoch": 111.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 20050 }, { "epoch": 111.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 20100 }, { "epoch": 111.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 20150 }, { "epoch": 112.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 20200 }, { "epoch": 112.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 20250 }, { "epoch": 112.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 20300 }, { "epoch": 113.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 20350 }, { "epoch": 113.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 20400 }, { "epoch": 113.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 20450 }, { "epoch": 113.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 20500 }, { "epoch": 114.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 20550 }, { "epoch": 114.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 20600 }, { "epoch": 114.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 20650 }, { "epoch": 115.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 20700 }, { "epoch": 115.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 20750 }, { "epoch": 115.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 20800 }, { "epoch": 115.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 20850 }, { "epoch": 116.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 20900 }, { "epoch": 116.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 20950 }, { "epoch": 116.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 21000 }, { "epoch": 116.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 21050 }, { "epoch": 117.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 21100 }, { "epoch": 117.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 21150 }, { "epoch": 117.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 21200 }, { "epoch": 118.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 21250 }, { "epoch": 118.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 21300 }, { "epoch": 118.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 21350 }, { "epoch": 118.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 21400 }, { "epoch": 119.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 21450 }, { "epoch": 119.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 21500 }, { "epoch": 119.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 21550 }, { "epoch": 120.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 21600 }, { "epoch": 120.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 21650 }, { "epoch": 120.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 21700 }, { "epoch": 120.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 21750 }, { "epoch": 121.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 21800 }, { "epoch": 121.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 21850 }, { "epoch": 121.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 21900 }, { "epoch": 121.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 21950 }, { "epoch": 122.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 22000 }, { "epoch": 122.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 22050 }, { "epoch": 122.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 22100 }, { "epoch": 123.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 22150 }, { "epoch": 123.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 22200 }, { "epoch": 123.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 22250 }, { "epoch": 123.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 22300 }, { "epoch": 124.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 22350 }, { "epoch": 124.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 22400 }, { "epoch": 124.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 22450 }, { "epoch": 125.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 22500 }, { "epoch": 125.0, "eval_loss": NaN, "eval_runtime": 5.5493, "eval_samples_per_second": 255.89, "eval_steps_per_second": 16.038, "eval_wer": 1.0, "step": 22500 }, { "epoch": 125.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 22550 }, { "epoch": 125.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 22600 }, { "epoch": 125.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 22650 }, { "epoch": 126.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 22700 }, { "epoch": 126.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 22750 }, { "epoch": 126.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 22800 }, { "epoch": 126.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 22850 }, { "epoch": 127.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 22900 }, { "epoch": 127.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 22950 }, { "epoch": 127.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 23000 }, { "epoch": 128.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 23050 }, { "epoch": 128.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 23100 }, { "epoch": 128.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 23150 }, { "epoch": 128.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 23200 }, { "epoch": 129.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 23250 }, { "epoch": 129.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 23300 }, { "epoch": 129.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 23350 }, { "epoch": 130.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 23400 }, { "epoch": 130.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 23450 }, { "epoch": 130.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 23500 }, { "epoch": 130.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 23550 }, { "epoch": 131.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 23600 }, { "epoch": 131.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 23650 }, { "epoch": 131.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 23700 }, { "epoch": 131.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 23750 }, { "epoch": 132.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 23800 }, { "epoch": 132.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 23850 }, { "epoch": 132.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 23900 }, { "epoch": 133.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 23950 }, { "epoch": 133.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 24000 }, { "epoch": 133.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 24050 }, { "epoch": 133.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 24100 }, { "epoch": 134.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 24150 }, { "epoch": 134.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 24200 }, { "epoch": 134.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 24250 }, { "epoch": 135.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 24300 }, { "epoch": 135.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 24350 }, { "epoch": 135.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 24400 }, { "epoch": 135.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 24450 }, { "epoch": 136.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 24500 }, { "epoch": 136.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 24550 }, { "epoch": 136.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 24600 }, { "epoch": 136.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 24650 }, { "epoch": 137.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 24700 }, { "epoch": 137.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 24750 }, { "epoch": 137.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 24800 }, { "epoch": 138.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 24850 }, { "epoch": 138.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 24900 }, { "epoch": 138.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 24950 }, { "epoch": 138.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 25000 }, { "epoch": 138.89, "eval_loss": NaN, "eval_runtime": 5.5573, "eval_samples_per_second": 255.522, "eval_steps_per_second": 16.015, "eval_wer": 1.0, "step": 25000 }, { "epoch": 139.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 25050 }, { "epoch": 139.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 25100 }, { "epoch": 139.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 25150 }, { "epoch": 140.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 25200 }, { "epoch": 140.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 25250 }, { "epoch": 140.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 25300 }, { "epoch": 140.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 25350 }, { "epoch": 141.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 25400 }, { "epoch": 141.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 25450 }, { "epoch": 141.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 25500 }, { "epoch": 141.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 25550 }, { "epoch": 142.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 25600 }, { "epoch": 142.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 25650 }, { "epoch": 142.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 25700 }, { "epoch": 143.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 25750 }, { "epoch": 143.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 25800 }, { "epoch": 143.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 25850 }, { "epoch": 143.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 25900 }, { "epoch": 144.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 25950 }, { "epoch": 144.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 26000 }, { "epoch": 144.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 26050 }, { "epoch": 145.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 26100 }, { "epoch": 145.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 26150 }, { "epoch": 145.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 26200 }, { "epoch": 145.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 26250 }, { "epoch": 146.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 26300 }, { "epoch": 146.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 26350 }, { "epoch": 146.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 26400 }, { "epoch": 146.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 26450 }, { "epoch": 147.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 26500 }, { "epoch": 147.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 26550 }, { "epoch": 147.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 26600 }, { "epoch": 148.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 26650 }, { "epoch": 148.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 26700 }, { "epoch": 148.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 26750 }, { "epoch": 148.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 26800 }, { "epoch": 149.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 26850 }, { "epoch": 149.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 26900 }, { "epoch": 149.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 26950 }, { "epoch": 150.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 27000 }, { "epoch": 150.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 27050 }, { "epoch": 150.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 27100 }, { "epoch": 150.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 27150 }, { "epoch": 151.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 27200 }, { "epoch": 151.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 27250 }, { "epoch": 151.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 27300 }, { "epoch": 151.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 27350 }, { "epoch": 152.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 27400 }, { "epoch": 152.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 27450 }, { "epoch": 152.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 27500 }, { "epoch": 152.78, "eval_loss": NaN, "eval_runtime": 5.5583, "eval_samples_per_second": 255.472, "eval_steps_per_second": 16.012, "eval_wer": 1.0, "step": 27500 }, { "epoch": 153.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 27550 }, { "epoch": 153.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 27600 }, { "epoch": 153.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 27650 }, { "epoch": 153.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 27700 }, { "epoch": 154.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 27750 }, { "epoch": 154.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 27800 }, { "epoch": 154.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 27850 }, { "epoch": 155.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 27900 }, { "epoch": 155.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 27950 }, { "epoch": 155.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 28000 }, { "epoch": 155.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 28050 }, { "epoch": 156.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 28100 }, { "epoch": 156.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 28150 }, { "epoch": 156.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 28200 }, { "epoch": 156.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 28250 }, { "epoch": 157.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 28300 }, { "epoch": 157.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 28350 }, { "epoch": 157.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 28400 }, { "epoch": 158.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 28450 }, { "epoch": 158.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 28500 }, { "epoch": 158.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 28550 }, { "epoch": 158.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 28600 }, { "epoch": 159.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 28650 }, { "epoch": 159.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 28700 }, { "epoch": 159.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 28750 }, { "epoch": 160.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 28800 }, { "epoch": 160.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 28850 }, { "epoch": 160.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 28900 }, { "epoch": 160.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 28950 }, { "epoch": 161.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 29000 }, { "epoch": 161.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 29050 }, { "epoch": 161.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 29100 }, { "epoch": 161.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 29150 }, { "epoch": 162.22, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 29200 }, { "epoch": 162.5, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 29250 }, { "epoch": 162.78, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 29300 }, { "epoch": 163.06, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 29350 }, { "epoch": 163.33, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 29400 }, { "epoch": 163.61, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 29450 }, { "epoch": 163.89, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 29500 }, { "epoch": 164.17, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 29550 }, { "epoch": 164.44, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 29600 }, { "epoch": 164.72, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 29650 }, { "epoch": 165.0, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 29700 }, { "epoch": 165.28, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 29750 }, { "epoch": 165.56, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 29800 }, { "epoch": 165.83, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 29850 }, { "epoch": 166.11, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 29900 }, { "epoch": 166.39, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 29950 }, { "epoch": 166.67, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 30000 }, { "epoch": 166.67, "eval_loss": NaN, "eval_runtime": 5.6665, "eval_samples_per_second": 250.595, "eval_steps_per_second": 15.706, "eval_wer": 1.0, "step": 30000 }, { "epoch": 166.94, "learning_rate": 1.6553559547571525e-05, "loss": 0.0, "step": 30050 }, { "epoch": 167.0, "step": 30060, "total_flos": 3.424005261030641e+20, "train_loss": 1.5698537292277424, "train_runtime": 13564.7724, "train_samples_per_second": 88.444, "train_steps_per_second": 2.216 } ], "logging_steps": 50, "max_steps": 30060, "num_train_epochs": 167, "save_steps": 500, "total_flos": 3.424005261030641e+20, "trial_name": null, "trial_params": null }