|
{ |
|
"best_metric": 3.5358800888061523, |
|
"best_model_checkpoint": "/mnt/output/projects/sca-xiaoke-v3/amlt-results/7300886566.81622-380c5407-4540-4a74-b6ec-7def0683f098/checkpoint-185000", |
|
"epoch": 82.67879288962381, |
|
"global_step": 200000, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"_prepare_inputs_in_ms": 10.839506983757019, |
|
"compute_loss_in_ms": 1584.6049636602402, |
|
"epoch": 0.0, |
|
"learning_rate/full": 0.0, |
|
"loss": 8.622, |
|
"step": 1, |
|
"training_step_in_ms": 2253.9908327162266 |
|
}, |
|
{ |
|
"epoch": 0.0, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 8.927019119262695, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.023580759441051608, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 150.659, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 5.31, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.166, |
|
"step": 1 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.052688444062369, |
|
"compute_loss_in_ms": 266.6276198354092, |
|
"epoch": 0.41, |
|
"learning_rate/full": 0.0003999851506717227, |
|
"loss": 4.9777, |
|
"step": 1000, |
|
"training_step_in_ms": 963.7469428184035 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.001575957983732, |
|
"compute_loss_in_ms": 266.9940203540027, |
|
"epoch": 0.83, |
|
"learning_rate/full": 0.0003999221107895784, |
|
"loss": 4.4794, |
|
"step": 2000, |
|
"training_step_in_ms": 964.067553780973 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.017723824828863, |
|
"compute_loss_in_ms": 266.8530354350805, |
|
"epoch": 1.24, |
|
"learning_rate/full": 0.0003998096443163716, |
|
"loss": 4.3589, |
|
"step": 3000, |
|
"training_step_in_ms": 964.8137692287564 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 3.9884973876178265, |
|
"compute_loss_in_ms": 266.8117158599198, |
|
"epoch": 1.65, |
|
"learning_rate/full": 0.0003996477790571026, |
|
"loss": 4.2668, |
|
"step": 4000, |
|
"training_step_in_ms": 963.3689811453223 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.001692395657301, |
|
"compute_loss_in_ms": 267.8194024413824, |
|
"epoch": 2.07, |
|
"learning_rate/full": 0.0003994365550295963, |
|
"loss": 4.2092, |
|
"step": 5000, |
|
"training_step_in_ms": 965.0005767121911 |
|
}, |
|
{ |
|
"epoch": 2.07, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 4.066258430480957, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.19624665436714503, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 81.5743, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 9.807, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.306, |
|
"step": 5000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.123009167066434, |
|
"compute_loss_in_ms": 267.90184961631894, |
|
"epoch": 2.48, |
|
"learning_rate/full": 0.0003991760244546079, |
|
"loss": 4.1535, |
|
"step": 6000, |
|
"training_step_in_ms": 963.1004312746227 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.096908804029226, |
|
"compute_loss_in_ms": 268.2109449021518, |
|
"epoch": 2.89, |
|
"learning_rate/full": 0.00039886625174291286, |
|
"loss": 4.1103, |
|
"step": 7000, |
|
"training_step_in_ms": 965.0139690972865 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.150357250124216, |
|
"compute_loss_in_ms": 269.2836431860924, |
|
"epoch": 3.31, |
|
"learning_rate/full": 0.0003985073134793826, |
|
"loss": 4.0761, |
|
"step": 8000, |
|
"training_step_in_ms": 969.6529387235641 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.171766873449087, |
|
"compute_loss_in_ms": 268.9554896838963, |
|
"epoch": 3.72, |
|
"learning_rate/full": 0.00039809973090042857, |
|
"loss": 4.0582, |
|
"step": 9000, |
|
"training_step_in_ms": 964.8072783201933 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.219205696135759, |
|
"compute_loss_in_ms": 268.6923326961696, |
|
"epoch": 4.13, |
|
"learning_rate/full": 0.00039764327017710485, |
|
"loss": 4.0324, |
|
"step": 10000, |
|
"training_step_in_ms": 962.4501793310046 |
|
}, |
|
{ |
|
"epoch": 4.13, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.913562059402466, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.22121572228147113, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 79.9476, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.007, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.313, |
|
"step": 10000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.152017308444512, |
|
"compute_loss_in_ms": 268.094536613673, |
|
"epoch": 4.55, |
|
"learning_rate/full": 0.0003971380439342646, |
|
"loss": 4.0153, |
|
"step": 11000, |
|
"training_step_in_ms": 964.2485933154821 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.1431227289140224, |
|
"compute_loss_in_ms": 268.42261432111263, |
|
"epoch": 4.96, |
|
"learning_rate/full": 0.00039658359808291836, |
|
"loss": 4.0053, |
|
"step": 12000, |
|
"training_step_in_ms": 965.7689935192466 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.223931197077036, |
|
"compute_loss_in_ms": 268.6585740670562, |
|
"epoch": 5.37, |
|
"learning_rate/full": 0.00039598117829320827, |
|
"loss": 3.9802, |
|
"step": 13000, |
|
"training_step_in_ms": 960.5111146196723 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.1840940825641155, |
|
"compute_loss_in_ms": 268.2862157560885, |
|
"epoch": 5.79, |
|
"learning_rate/full": 0.00039533040308028367, |
|
"loss": 3.9633, |
|
"step": 14000, |
|
"training_step_in_ms": 968.1838200092316 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.200506843626499, |
|
"compute_loss_in_ms": 268.91191502287984, |
|
"epoch": 6.2, |
|
"learning_rate/full": 0.0003946307092543998, |
|
"loss": 3.941, |
|
"step": 15000, |
|
"training_step_in_ms": 968.3050900287926 |
|
}, |
|
{ |
|
"epoch": 6.2, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.8218424320220947, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2321593168121597, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.2057, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.229, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.32, |
|
"step": 15000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.21836834491753, |
|
"compute_loss_in_ms": 268.7001321054995, |
|
"epoch": 6.61, |
|
"learning_rate/full": 0.0003938844405523341, |
|
"loss": 3.9323, |
|
"step": 16000, |
|
"training_step_in_ms": 984.531311199069 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.2030105367302895, |
|
"compute_loss_in_ms": 268.3060254715383, |
|
"epoch": 7.03, |
|
"learning_rate/full": 0.00039308879047835453, |
|
"loss": 3.9216, |
|
"step": 17000, |
|
"training_step_in_ms": 961.8699175454676 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.2327940091490746, |
|
"compute_loss_in_ms": 269.27323868498206, |
|
"epoch": 7.44, |
|
"learning_rate/full": 0.00039224627037346294, |
|
"loss": 3.8992, |
|
"step": 18000, |
|
"training_step_in_ms": 967.632270719856 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.229459121823311, |
|
"compute_loss_in_ms": 268.5666101500392, |
|
"epoch": 7.85, |
|
"learning_rate/full": 0.00039135631637799936, |
|
"loss": 3.8984, |
|
"step": 19000, |
|
"training_step_in_ms": 963.238344412297 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.240339521318674, |
|
"compute_loss_in_ms": 268.11582005023956, |
|
"epoch": 8.27, |
|
"learning_rate/full": 0.00039041818639024787, |
|
"loss": 3.8907, |
|
"step": 20000, |
|
"training_step_in_ms": 960.5583217255771 |
|
}, |
|
{ |
|
"epoch": 8.27, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.7651355266571045, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2403944760451539, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 80.0701, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 9.991, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.312, |
|
"step": 20000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.2025597829644274, |
|
"compute_loss_in_ms": 267.9062583371997, |
|
"epoch": 8.68, |
|
"learning_rate/full": 0.00038943398810118026, |
|
"loss": 3.8736, |
|
"step": 21000, |
|
"training_step_in_ms": 962.8509967587888 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.1947984509170055, |
|
"compute_loss_in_ms": 268.05593667179346, |
|
"epoch": 9.09, |
|
"learning_rate/full": 0.00038840304981011036, |
|
"loss": 3.8689, |
|
"step": 22000, |
|
"training_step_in_ms": 965.0497910194099 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.219467684626579, |
|
"compute_loss_in_ms": 268.2473221644759, |
|
"epoch": 9.51, |
|
"learning_rate/full": 0.0003873256258856351, |
|
"loss": 3.8553, |
|
"step": 23000, |
|
"training_step_in_ms": 967.3452698886395 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.203684389591217, |
|
"compute_loss_in_ms": 268.0240872502327, |
|
"epoch": 9.92, |
|
"learning_rate/full": 0.00038620312995292836, |
|
"loss": 3.8464, |
|
"step": 24000, |
|
"training_step_in_ms": 960.33872378245 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.218942817300558, |
|
"compute_loss_in_ms": 268.9947931431234, |
|
"epoch": 10.33, |
|
"learning_rate/full": 0.0003850323958934377, |
|
"loss": 3.8356, |
|
"step": 25000, |
|
"training_step_in_ms": 967.6199573352933 |
|
}, |
|
{ |
|
"epoch": 10.33, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.71928071975708, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.24336343080593542, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 79.8751, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.016, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.313, |
|
"step": 25000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.202740984718974, |
|
"compute_loss_in_ms": 268.5807599723339, |
|
"epoch": 10.75, |
|
"learning_rate/full": 0.0003838183948306088, |
|
"loss": 3.8328, |
|
"step": 26000, |
|
"training_step_in_ms": 961.2188336364925 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.2269067615270615, |
|
"compute_loss_in_ms": 267.7264535538852, |
|
"epoch": 11.16, |
|
"learning_rate/full": 0.00038255656126572534, |
|
"loss": 3.8214, |
|
"step": 27000, |
|
"training_step_in_ms": 960.6881345175207 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.240487921983004, |
|
"compute_loss_in_ms": 268.31112349405885, |
|
"epoch": 11.58, |
|
"learning_rate/full": 0.00038125092378570903, |
|
"loss": 3.8196, |
|
"step": 28000, |
|
"training_step_in_ms": 964.0034716315567 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.273211572319269, |
|
"compute_loss_in_ms": 268.9577633589506, |
|
"epoch": 11.99, |
|
"learning_rate/full": 0.0003798991913473777, |
|
"loss": 3.8171, |
|
"step": 29000, |
|
"training_step_in_ms": 973.0124748162925 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.244079362601042, |
|
"compute_loss_in_ms": 267.9022591896355, |
|
"epoch": 12.4, |
|
"learning_rate/full": 0.0003785058191464291, |
|
"loss": 3.8013, |
|
"step": 30000, |
|
"training_step_in_ms": 962.8623519428074 |
|
}, |
|
{ |
|
"epoch": 12.4, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.687087297439575, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.24789182257436765, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.5068, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.19, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.318, |
|
"step": 30000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.183955312502094, |
|
"compute_loss_in_ms": 267.3523456119001, |
|
"epoch": 12.82, |
|
"learning_rate/full": 0.00037706702930065926, |
|
"loss": 3.8065, |
|
"step": 31000, |
|
"training_step_in_ms": 957.8949020504951 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.198232229799032, |
|
"compute_loss_in_ms": 267.4514962993562, |
|
"epoch": 13.23, |
|
"learning_rate/full": 0.0003755830450857345, |
|
"loss": 3.7986, |
|
"step": 32000, |
|
"training_step_in_ms": 963.8669461458921 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.18659433722496, |
|
"compute_loss_in_ms": 268.10614936053753, |
|
"epoch": 13.64, |
|
"learning_rate/full": 0.0003740572005600189, |
|
"loss": 3.7923, |
|
"step": 33000, |
|
"training_step_in_ms": 965.2572022378445 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.225778687745333, |
|
"compute_loss_in_ms": 268.18950264155865, |
|
"epoch": 14.06, |
|
"learning_rate/full": 0.00037248681827609586, |
|
"loss": 3.7947, |
|
"step": 34000, |
|
"training_step_in_ms": 960.6446040645242 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.189065434038639, |
|
"compute_loss_in_ms": 267.6565695255995, |
|
"epoch": 14.47, |
|
"learning_rate/full": 0.00037087542640234865, |
|
"loss": 3.7849, |
|
"step": 35000, |
|
"training_step_in_ms": 964.44107465446 |
|
}, |
|
{ |
|
"epoch": 14.47, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.6763927936553955, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.246958162767791, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.6323, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.305, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.322, |
|
"step": 35000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.164576116131573, |
|
"compute_loss_in_ms": 267.3913585655391, |
|
"epoch": 14.88, |
|
"learning_rate/full": 0.0003692218735740006, |
|
"loss": 3.7838, |
|
"step": 36000, |
|
"training_step_in_ms": 965.0988348089159 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.195226285606623, |
|
"compute_loss_in_ms": 268.244338080287, |
|
"epoch": 15.3, |
|
"learning_rate/full": 0.00036752484999829976, |
|
"loss": 3.7779, |
|
"step": 37000, |
|
"training_step_in_ms": 966.1850301101804 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.189992021769285, |
|
"compute_loss_in_ms": 267.8583819307387, |
|
"epoch": 15.71, |
|
"learning_rate/full": 0.0003657881683678541, |
|
"loss": 3.7748, |
|
"step": 38000, |
|
"training_step_in_ms": 963.9664278812706 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.199680101126432, |
|
"compute_loss_in_ms": 268.06280748173594, |
|
"epoch": 16.12, |
|
"learning_rate/full": 0.00036401058098760525, |
|
"loss": 3.7695, |
|
"step": 39000, |
|
"training_step_in_ms": 967.5451415590942 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.182811006903648, |
|
"compute_loss_in_ms": 267.7034317664802, |
|
"epoch": 16.54, |
|
"learning_rate/full": 0.00036219252645064074, |
|
"loss": 3.7688, |
|
"step": 40000, |
|
"training_step_in_ms": 967.6426770947874 |
|
}, |
|
{ |
|
"epoch": 16.54, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.658348321914673, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.25104865208221006, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.4516, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.329, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.323, |
|
"step": 40000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.188235598366435, |
|
"compute_loss_in_ms": 267.2028581239283, |
|
"epoch": 16.95, |
|
"learning_rate/full": 0.0003603344533347134, |
|
"loss": 3.761, |
|
"step": 41000, |
|
"training_step_in_ms": 958.9369925446808 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.214274771511555, |
|
"compute_loss_in_ms": 267.64739087969065, |
|
"epoch": 17.36, |
|
"learning_rate/full": 0.00035843490089475537, |
|
"loss": 3.7527, |
|
"step": 42000, |
|
"training_step_in_ms": 966.9140360169113 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.22203628346324, |
|
"compute_loss_in_ms": 268.2027486599982, |
|
"epoch": 17.78, |
|
"learning_rate/full": 0.00035650009493379324, |
|
"loss": 3.7569, |
|
"step": 43000, |
|
"training_step_in_ms": 965.1608090028167 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.219520688056946, |
|
"compute_loss_in_ms": 268.0517144687474, |
|
"epoch": 18.19, |
|
"learning_rate/full": 0.00035452275921920933, |
|
"loss": 3.7513, |
|
"step": 44000, |
|
"training_step_in_ms": 965.6609862968326 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.1790814362466335, |
|
"compute_loss_in_ms": 267.46442713588476, |
|
"epoch": 18.6, |
|
"learning_rate/full": 0.0003525092554160055, |
|
"loss": 3.7467, |
|
"step": 45000, |
|
"training_step_in_ms": 965.7583395838737 |
|
}, |
|
{ |
|
"epoch": 18.6, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.6469690799713135, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.25092950859358, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.5468, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.185, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.318, |
|
"step": 45000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.220321690890847, |
|
"compute_loss_in_ms": 267.56717593222857, |
|
"epoch": 19.02, |
|
"learning_rate/full": 0.0003504601940692656, |
|
"loss": 3.7497, |
|
"step": 46000, |
|
"training_step_in_ms": 964.2354487106204 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.205725617706776, |
|
"compute_loss_in_ms": 268.48560455814004, |
|
"epoch": 19.43, |
|
"learning_rate/full": 0.0003483698657658315, |
|
"loss": 3.7388, |
|
"step": 47000, |
|
"training_step_in_ms": 967.1772802136838 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.253620557487011, |
|
"compute_loss_in_ms": 267.8220782019198, |
|
"epoch": 19.84, |
|
"learning_rate/full": 0.0003462450012513184, |
|
"loss": 3.744, |
|
"step": 48000, |
|
"training_step_in_ms": 962.239847779274 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.241022698581219, |
|
"compute_loss_in_ms": 268.39736769348383, |
|
"epoch": 20.26, |
|
"learning_rate/full": 0.00034408405297105753, |
|
"loss": 3.7372, |
|
"step": 49000, |
|
"training_step_in_ms": 966.1254425011575 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.21300457790494, |
|
"compute_loss_in_ms": 268.7097208276391, |
|
"epoch": 20.67, |
|
"learning_rate/full": 0.0003418853377786221, |
|
"loss": 3.7334, |
|
"step": 50000, |
|
"training_step_in_ms": 968.8591329194605 |
|
}, |
|
{ |
|
"epoch": 20.67, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.632450580596924, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.253658040934189, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.9084, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.268, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.321, |
|
"step": 50000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.228368219805927, |
|
"compute_loss_in_ms": 268.4243040457368, |
|
"epoch": 21.08, |
|
"learning_rate/full": 0.0003396560466114797, |
|
"loss": 3.7438, |
|
"step": 51000, |
|
"training_step_in_ms": 964.8838895820081 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.233973186463118, |
|
"compute_loss_in_ms": 268.22105176746845, |
|
"epoch": 21.5, |
|
"learning_rate/full": 0.0003373900810764743, |
|
"loss": 3.728, |
|
"step": 52000, |
|
"training_step_in_ms": 962.5837270207703 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.230040587484837, |
|
"compute_loss_in_ms": 267.9561189264059, |
|
"epoch": 21.91, |
|
"learning_rate/full": 0.0003350878976336386, |
|
"loss": 3.7287, |
|
"step": 53000, |
|
"training_step_in_ms": 964.1780665256083 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.2476331405341625, |
|
"compute_loss_in_ms": 268.6795903816819, |
|
"epoch": 22.32, |
|
"learning_rate/full": 0.0003327546685845955, |
|
"loss": 3.7223, |
|
"step": 54000, |
|
"training_step_in_ms": 967.9701336547732 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.220093585550785, |
|
"compute_loss_in_ms": 267.76603213325143, |
|
"epoch": 22.74, |
|
"learning_rate/full": 0.00033038868430752995, |
|
"loss": 3.7261, |
|
"step": 55000, |
|
"training_step_in_ms": 962.9226383566856 |
|
}, |
|
{ |
|
"epoch": 22.74, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.6242456436157227, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.25521777862203787, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.5774, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.181, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.318, |
|
"step": 55000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.227604019205745, |
|
"compute_loss_in_ms": 267.647510971874, |
|
"epoch": 23.15, |
|
"learning_rate/full": 0.00032799052857365924, |
|
"loss": 3.7232, |
|
"step": 56000, |
|
"training_step_in_ms": 963.1331409327686 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.1824629083275795, |
|
"compute_loss_in_ms": 267.5452450104058, |
|
"epoch": 23.56, |
|
"learning_rate/full": 0.0003255583453025672, |
|
"loss": 3.7153, |
|
"step": 57000, |
|
"training_step_in_ms": 965.8048706538975 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.190924048423767, |
|
"compute_loss_in_ms": 268.4611966535449, |
|
"epoch": 23.98, |
|
"learning_rate/full": 0.0003230975988657048, |
|
"loss": 3.72, |
|
"step": 58000, |
|
"training_step_in_ms": 965.0302759557962 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.20093110203743, |
|
"compute_loss_in_ms": 267.884086355567, |
|
"epoch": 24.39, |
|
"learning_rate/full": 0.0003206064799382713, |
|
"loss": 3.7127, |
|
"step": 59000, |
|
"training_step_in_ms": 964.0987507812679 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.210771672427654, |
|
"compute_loss_in_ms": 267.6700286902487, |
|
"epoch": 24.8, |
|
"learning_rate/full": 0.00031808560316658635, |
|
"loss": 3.7115, |
|
"step": 60000, |
|
"training_step_in_ms": 965.6994955539703 |
|
}, |
|
{ |
|
"epoch": 24.8, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.61262583732605, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.259026039077661, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.8405, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.277, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.321, |
|
"step": 60000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.141795973225338, |
|
"compute_loss_in_ms": 267.2422932982445, |
|
"epoch": 25.22, |
|
"learning_rate/full": 0.0003155330235866319, |
|
"loss": 3.7085, |
|
"step": 61000, |
|
"training_step_in_ms": 965.9709356427193 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.12061008810997, |
|
"compute_loss_in_ms": 268.04699283093214, |
|
"epoch": 25.63, |
|
"learning_rate/full": 0.000312954476063518, |
|
"loss": 3.7031, |
|
"step": 62000, |
|
"training_step_in_ms": 964.8432326950133 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.14773878082633, |
|
"compute_loss_in_ms": 268.0800936706364, |
|
"epoch": 26.04, |
|
"learning_rate/full": 0.00031035068146119334, |
|
"loss": 3.7053, |
|
"step": 63000, |
|
"training_step_in_ms": 964.9066540151834 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.157721221446991, |
|
"compute_loss_in_ms": 267.8991154767573, |
|
"epoch": 26.46, |
|
"learning_rate/full": 0.00030771441463138695, |
|
"loss": 3.6991, |
|
"step": 64000, |
|
"training_step_in_ms": 966.7548437044024 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.127573002129793, |
|
"compute_loss_in_ms": 268.0769842043519, |
|
"epoch": 26.87, |
|
"learning_rate/full": 0.00030505419362911944, |
|
"loss": 3.7026, |
|
"step": 65000, |
|
"training_step_in_ms": 966.6518254801631 |
|
}, |
|
{ |
|
"epoch": 26.87, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.604250907897949, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2600293381296915, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.2046, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.362, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.324, |
|
"step": 65000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.138722216210714, |
|
"compute_loss_in_ms": 268.0730670392513, |
|
"epoch": 27.28, |
|
"learning_rate/full": 0.0003023653504808654, |
|
"loss": 3.6903, |
|
"step": 66000, |
|
"training_step_in_ms": 965.3969647027552 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.153087247163057, |
|
"compute_loss_in_ms": 268.1363028138876, |
|
"epoch": 27.7, |
|
"learning_rate/full": 0.0002996566527388639, |
|
"loss": 3.6969, |
|
"step": 67000, |
|
"training_step_in_ms": 965.2745163962245 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.149796262383461, |
|
"compute_loss_in_ms": 267.83912086486816, |
|
"epoch": 28.11, |
|
"learning_rate/full": 0.0002969179137925403, |
|
"loss": 3.6937, |
|
"step": 68000, |
|
"training_step_in_ms": 968.0436515249312 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.1318743117153645, |
|
"compute_loss_in_ms": 268.5812944062054, |
|
"epoch": 28.52, |
|
"learning_rate/full": 0.0002941579883457959, |
|
"loss": 3.6891, |
|
"step": 69000, |
|
"training_step_in_ms": 964.7220857255161 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.13500452041626, |
|
"compute_loss_in_ms": 267.81502260267735, |
|
"epoch": 28.94, |
|
"learning_rate/full": 0.0002913748308243434, |
|
"loss": 3.6864, |
|
"step": 70000, |
|
"training_step_in_ms": 964.9831298328936 |
|
}, |
|
{ |
|
"epoch": 28.94, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5996363162994385, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.26106738202465474, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 79.1905, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.102, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.316, |
|
"step": 70000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.127892008641871, |
|
"compute_loss_in_ms": 267.3319378942251, |
|
"epoch": 29.35, |
|
"learning_rate/full": 0.000288569127930656, |
|
"loss": 3.6864, |
|
"step": 71000, |
|
"training_step_in_ms": 964.4970440678298 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.127237547188997, |
|
"compute_loss_in_ms": 267.12262638285756, |
|
"epoch": 29.76, |
|
"learning_rate/full": 0.0002857387308278068, |
|
"loss": 3.688, |
|
"step": 72000, |
|
"training_step_in_ms": 963.8779099695385 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.134644038975239, |
|
"compute_loss_in_ms": 268.62900394946337, |
|
"epoch": 30.18, |
|
"learning_rate/full": 0.0002828899985518552, |
|
"loss": 3.6777, |
|
"step": 73000, |
|
"training_step_in_ms": 966.1114624030888 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.121612053364515, |
|
"compute_loss_in_ms": 267.61186150833964, |
|
"epoch": 30.59, |
|
"learning_rate/full": 0.00028002081440907064, |
|
"loss": 3.6805, |
|
"step": 74000, |
|
"training_step_in_ms": 966.5145794674754 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.143208879977465, |
|
"compute_loss_in_ms": 268.1201763525605, |
|
"epoch": 31.0, |
|
"learning_rate/full": 0.00027713188632770775, |
|
"loss": 3.6879, |
|
"step": 75000, |
|
"training_step_in_ms": 965.0215070433915 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5912275314331055, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.26092454356630995, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.6905, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.166, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.318, |
|
"step": 75000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.137767382511279, |
|
"compute_loss_in_ms": 267.779229991138, |
|
"epoch": 31.42, |
|
"learning_rate/full": 0.00027422684725453034, |
|
"loss": 3.6725, |
|
"step": 76000, |
|
"training_step_in_ms": 963.9590919055045 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.138436369597912, |
|
"compute_loss_in_ms": 268.5314156524837, |
|
"epoch": 31.83, |
|
"learning_rate/full": 0.0002712976542440004, |
|
"loss": 3.6758, |
|
"step": 77000, |
|
"training_step_in_ms": 964.5805881880224 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.146489001810551, |
|
"compute_loss_in_ms": 268.08270847052336, |
|
"epoch": 32.24, |
|
"learning_rate/full": 0.00026835083436875734, |
|
"loss": 3.6692, |
|
"step": 78000, |
|
"training_step_in_ms": 966.2784307040274 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.1479257568717, |
|
"compute_loss_in_ms": 267.2712250612676, |
|
"epoch": 32.66, |
|
"learning_rate/full": 0.0002653930599834242, |
|
"loss": 3.6736, |
|
"step": 79000, |
|
"training_step_in_ms": 968.4041320718825 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.126915082335472, |
|
"compute_loss_in_ms": 268.5138017758727, |
|
"epoch": 33.07, |
|
"learning_rate/full": 0.0002624132077738845, |
|
"loss": 3.6731, |
|
"step": 80000, |
|
"training_step_in_ms": 969.1153637133539 |
|
}, |
|
{ |
|
"epoch": 33.07, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5850701332092285, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2637883107097123, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.0939, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.377, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.324, |
|
"step": 80000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.120095092348937, |
|
"compute_loss_in_ms": 267.7357228696346, |
|
"epoch": 33.48, |
|
"learning_rate/full": 0.0002594179251945605, |
|
"loss": 3.6671, |
|
"step": 81000, |
|
"training_step_in_ms": 963.6873134560883 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.124605063349009, |
|
"compute_loss_in_ms": 267.57319816574454, |
|
"epoch": 33.9, |
|
"learning_rate/full": 0.00025641096982950234, |
|
"loss": 3.6662, |
|
"step": 82000, |
|
"training_step_in_ms": 965.3064449094236 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.129976071417332, |
|
"compute_loss_in_ms": 267.9822950810194, |
|
"epoch": 34.31, |
|
"learning_rate/full": 0.00025339009590173424, |
|
"loss": 3.6651, |
|
"step": 83000, |
|
"training_step_in_ms": 967.112907551229 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.144246697425842, |
|
"compute_loss_in_ms": 268.09172417223454, |
|
"epoch": 34.73, |
|
"learning_rate/full": 0.0002503530053325778, |
|
"loss": 3.6622, |
|
"step": 84000, |
|
"training_step_in_ms": 963.3224161304533 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.138608705252409, |
|
"compute_loss_in_ms": 267.34737430512905, |
|
"epoch": 35.14, |
|
"learning_rate/full": 0.0002473065215350535, |
|
"loss": 3.66, |
|
"step": 85000, |
|
"training_step_in_ms": 964.2706917002797 |
|
}, |
|
{ |
|
"epoch": 35.14, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5811269283294678, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2639846881301574, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.4776, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.194, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.319, |
|
"step": 85000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.154233903419681, |
|
"compute_loss_in_ms": 267.71352230757475, |
|
"epoch": 35.55, |
|
"learning_rate/full": 0.00024424836556120313, |
|
"loss": 3.6547, |
|
"step": 86000, |
|
"training_step_in_ms": 962.3722572363913 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.109987150877714, |
|
"compute_loss_in_ms": 267.4717643670738, |
|
"epoch": 35.97, |
|
"learning_rate/full": 0.000241179291965253, |
|
"loss": 3.662, |
|
"step": 87000, |
|
"training_step_in_ms": 962.7631023935974 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.130292858928442, |
|
"compute_loss_in_ms": 268.7110885903239, |
|
"epoch": 36.38, |
|
"learning_rate/full": 0.0002381000579951894, |
|
"loss": 3.6533, |
|
"step": 88000, |
|
"training_step_in_ms": 966.5117364116013 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.127315446734428, |
|
"compute_loss_in_ms": 267.80369279161096, |
|
"epoch": 36.79, |
|
"learning_rate/full": 0.00023501142340591894, |
|
"loss": 3.6541, |
|
"step": 89000, |
|
"training_step_in_ms": 966.1625612042844 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.147790517657995, |
|
"compute_loss_in_ms": 268.44236666709185, |
|
"epoch": 37.21, |
|
"learning_rate/full": 0.00023191415027181022, |
|
"loss": 3.6505, |
|
"step": 90000, |
|
"training_step_in_ms": 969.9625728055835 |
|
}, |
|
{ |
|
"epoch": 37.21, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5739023685455322, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2666824586460844, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.5693, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.182, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.318, |
|
"step": 90000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.1041579188370125, |
|
"compute_loss_in_ms": 267.84072072431445, |
|
"epoch": 37.62, |
|
"learning_rate/full": 0.00022880900279866363, |
|
"loss": 3.6517, |
|
"step": 91000, |
|
"training_step_in_ms": 962.2163318134844 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.135395355522633, |
|
"compute_loss_in_ms": 267.92124405503273, |
|
"epoch": 38.03, |
|
"learning_rate/full": 0.0002256936284593779, |
|
"loss": 3.6526, |
|
"step": 92000, |
|
"training_step_in_ms": 965.9340194314718 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.124495934695005, |
|
"compute_loss_in_ms": 267.63855477049947, |
|
"epoch": 38.45, |
|
"learning_rate/full": 0.00022257502654664658, |
|
"loss": 3.6411, |
|
"step": 93000, |
|
"training_step_in_ms": 968.471509065479 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.13615457713604, |
|
"compute_loss_in_ms": 268.6791280247271, |
|
"epoch": 38.86, |
|
"learning_rate/full": 0.00021945398441148287, |
|
"loss": 3.6456, |
|
"step": 94000, |
|
"training_step_in_ms": 964.7193784303963 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.138962186872959, |
|
"compute_loss_in_ms": 267.87416788190603, |
|
"epoch": 39.27, |
|
"learning_rate/full": 0.00021632188341385878, |
|
"loss": 3.6474, |
|
"step": 95000, |
|
"training_step_in_ms": 964.3936127200723 |
|
}, |
|
{ |
|
"epoch": 39.27, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.570530414581299, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.26555671498307476, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.8889, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.271, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.321, |
|
"step": 95000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.114193618297577, |
|
"compute_loss_in_ms": 267.61803087219596, |
|
"epoch": 39.69, |
|
"learning_rate/full": 0.0002131888850633025, |
|
"loss": 3.6443, |
|
"step": 96000, |
|
"training_step_in_ms": 962.9699364975095 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.118229653686285, |
|
"compute_loss_in_ms": 267.60003339126706, |
|
"epoch": 40.1, |
|
"learning_rate/full": 0.00021005263255270636, |
|
"loss": 3.6436, |
|
"step": 97000, |
|
"training_step_in_ms": 967.0044349320233 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.14753895252943, |
|
"compute_loss_in_ms": 267.94382878765464, |
|
"epoch": 40.51, |
|
"learning_rate/full": 0.00020691389970544863, |
|
"loss": 3.6409, |
|
"step": 98000, |
|
"training_step_in_ms": 965.2209133654833 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.132391892373562, |
|
"compute_loss_in_ms": 268.32156636565924, |
|
"epoch": 40.93, |
|
"learning_rate/full": 0.00020377031677881017, |
|
"loss": 3.6386, |
|
"step": 99000, |
|
"training_step_in_ms": 965.1960897520185 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.139371138066053, |
|
"compute_loss_in_ms": 268.1989936903119, |
|
"epoch": 41.34, |
|
"learning_rate/full": 0.00020062894644154732, |
|
"loss": 3.628, |
|
"step": 100000, |
|
"training_step_in_ms": 969.4596163183451 |
|
}, |
|
{ |
|
"epoch": 41.34, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.565774440765381, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.26571601552352997, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.6144, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.307, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.322, |
|
"step": 100000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.108485870245026, |
|
"compute_loss_in_ms": 267.23163178935647, |
|
"epoch": 41.75, |
|
"learning_rate/full": 0.00019748742092116103, |
|
"loss": 3.6364, |
|
"step": 101000, |
|
"training_step_in_ms": 962.6803079359233 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.145125687122345, |
|
"compute_loss_in_ms": 267.68679490312934, |
|
"epoch": 42.17, |
|
"learning_rate/full": 0.00019434651534206603, |
|
"loss": 3.6315, |
|
"step": 102000, |
|
"training_step_in_ms": 964.9059623852372 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.14092817902565, |
|
"compute_loss_in_ms": 268.40766886249185, |
|
"epoch": 42.58, |
|
"learning_rate/full": 0.00019120700467571537, |
|
"loss": 3.6249, |
|
"step": 103000, |
|
"training_step_in_ms": 968.5381288193166 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.131742633879185, |
|
"compute_loss_in_ms": 267.6234121248126, |
|
"epoch": 42.99, |
|
"learning_rate/full": 0.00018806966354938863, |
|
"loss": 3.6302, |
|
"step": 104000, |
|
"training_step_in_ms": 965.0357882864773 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.159636992961168, |
|
"compute_loss_in_ms": 268.2043272703886, |
|
"epoch": 43.41, |
|
"learning_rate/full": 0.0001849352660550636, |
|
"loss": 3.6221, |
|
"step": 105000, |
|
"training_step_in_ms": 966.8701088428497 |
|
}, |
|
{ |
|
"epoch": 43.41, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.560976266860962, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2679473083105533, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.6952, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.166, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.318, |
|
"step": 105000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.1656713769203275, |
|
"compute_loss_in_ms": 267.7097022458911, |
|
"epoch": 43.82, |
|
"learning_rate/full": 0.00018180458555842107, |
|
"loss": 3.6281, |
|
"step": 106000, |
|
"training_step_in_ms": 960.9392982535064 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.1548894718289375, |
|
"compute_loss_in_ms": 268.3351138718426, |
|
"epoch": 44.23, |
|
"learning_rate/full": 0.00017867839450802815, |
|
"loss": 3.6257, |
|
"step": 107000, |
|
"training_step_in_ms": 967.5997758358717 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.136493876576424, |
|
"compute_loss_in_ms": 267.79356829449534, |
|
"epoch": 44.65, |
|
"learning_rate/full": 0.0001755574642447484, |
|
"loss": 3.6275, |
|
"step": 108000, |
|
"training_step_in_ms": 964.6688169278204 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.146924342960119, |
|
"compute_loss_in_ms": 268.7044747136533, |
|
"epoch": 45.06, |
|
"learning_rate/full": 0.00017244256481142465, |
|
"loss": 3.6272, |
|
"step": 109000, |
|
"training_step_in_ms": 966.0691562928259 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.129870388656855, |
|
"compute_loss_in_ms": 267.92700193077326, |
|
"epoch": 45.47, |
|
"learning_rate/full": 0.00016933446476288295, |
|
"loss": 3.6231, |
|
"step": 110000, |
|
"training_step_in_ms": 968.8978024721146 |
|
}, |
|
{ |
|
"epoch": 45.47, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.557985544204712, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.26707363597972006, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.4146, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.334, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.323, |
|
"step": 110000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.14337538001014, |
|
"compute_loss_in_ms": 267.68642891570926, |
|
"epoch": 45.89, |
|
"learning_rate/full": 0.0001662308313853947, |
|
"loss": 3.6179, |
|
"step": 111000, |
|
"training_step_in_ms": 963.7148243077099 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.14999657869339, |
|
"compute_loss_in_ms": 267.70868534594774, |
|
"epoch": 46.3, |
|
"learning_rate/full": 0.000163135546733723, |
|
"loss": 3.6124, |
|
"step": 112000, |
|
"training_step_in_ms": 967.6017691344023 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.146619476377964, |
|
"compute_loss_in_ms": 268.191356562078, |
|
"epoch": 46.71, |
|
"learning_rate/full": 0.00016005245741683915, |
|
"loss": 3.62, |
|
"step": 113000, |
|
"training_step_in_ms": 966.300628580153 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.153369773179293, |
|
"compute_loss_in_ms": 267.8536421582103, |
|
"epoch": 47.13, |
|
"learning_rate/full": 0.00015697922455833988, |
|
"loss": 3.6157, |
|
"step": 114000, |
|
"training_step_in_ms": 964.6176136285067 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.187301464378834, |
|
"compute_loss_in_ms": 268.31423101201653, |
|
"epoch": 47.54, |
|
"learning_rate/full": 0.0001539166064324471, |
|
"loss": 3.6143, |
|
"step": 115000, |
|
"training_step_in_ms": 968.9795580692589 |
|
}, |
|
{ |
|
"epoch": 47.54, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.556086778640747, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2680325079129448, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.6426, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.173, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.318, |
|
"step": 115000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.146232630421475, |
|
"compute_loss_in_ms": 267.5073589235544, |
|
"epoch": 47.95, |
|
"learning_rate/full": 0.00015086535869435647, |
|
"loss": 3.6143, |
|
"step": 116000, |
|
"training_step_in_ms": 961.0740608982742 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.149144068360329, |
|
"compute_loss_in_ms": 268.67081797868013, |
|
"epoch": 48.37, |
|
"learning_rate/full": 0.00014782623419379065, |
|
"loss": 3.6076, |
|
"step": 117000, |
|
"training_step_in_ms": 968.1870553046465 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.165053818374872, |
|
"compute_loss_in_ms": 267.5217378772795, |
|
"epoch": 48.78, |
|
"learning_rate/full": 0.00014479998278924466, |
|
"loss": 3.6033, |
|
"step": 118000, |
|
"training_step_in_ms": 964.0207477062941 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.148088995367289, |
|
"compute_loss_in_ms": 267.9359416142106, |
|
"epoch": 49.19, |
|
"learning_rate/full": 0.00014178735116296984, |
|
"loss": 3.6099, |
|
"step": 119000, |
|
"training_step_in_ms": 965.35854877159 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.147441305220127, |
|
"compute_loss_in_ms": 268.18652522563934, |
|
"epoch": 49.61, |
|
"learning_rate/full": 0.00013878908263674099, |
|
"loss": 3.6041, |
|
"step": 120000, |
|
"training_step_in_ms": 966.7598981000483 |
|
}, |
|
{ |
|
"epoch": 49.61, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5552496910095215, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2690825925881079, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.206, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.362, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.324, |
|
"step": 120000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.151007533073425, |
|
"compute_loss_in_ms": 267.91314566135406, |
|
"epoch": 50.02, |
|
"learning_rate/full": 0.00013580293864950247, |
|
"loss": 3.6068, |
|
"step": 121000, |
|
"training_step_in_ms": 965.1756884045899 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.154482748359442, |
|
"compute_loss_in_ms": 268.1262241154909, |
|
"epoch": 50.43, |
|
"learning_rate/full": 0.00013283562815289706, |
|
"loss": 3.5972, |
|
"step": 122000, |
|
"training_step_in_ms": 965.2079959511757 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.1559099070727825, |
|
"compute_loss_in_ms": 267.7796282917261, |
|
"epoch": 50.85, |
|
"learning_rate/full": 0.0001298848894600429, |
|
"loss": 3.6031, |
|
"step": 123000, |
|
"training_step_in_ms": 966.0297281630337 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.1683206632733345, |
|
"compute_loss_in_ms": 268.80906841158867, |
|
"epoch": 51.26, |
|
"learning_rate/full": 0.00012694852315582903, |
|
"loss": 3.5985, |
|
"step": 124000, |
|
"training_step_in_ms": 967.5091603025794 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.137588050216436, |
|
"compute_loss_in_ms": 267.6871258877218, |
|
"epoch": 51.67, |
|
"learning_rate/full": 0.00012403603541958643, |
|
"loss": 3.6029, |
|
"step": 125000, |
|
"training_step_in_ms": 964.4286920540035 |
|
}, |
|
{ |
|
"epoch": 51.67, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5499510765075684, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.268844144332836, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.7216, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.293, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.322, |
|
"step": 125000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.127907207826289, |
|
"compute_loss_in_ms": 267.8013560883701, |
|
"epoch": 52.09, |
|
"learning_rate/full": 0.00012113936318920029, |
|
"loss": 3.5962, |
|
"step": 126000, |
|
"training_step_in_ms": 962.9286280833185 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.151306886225939, |
|
"compute_loss_in_ms": 267.83537547290325, |
|
"epoch": 52.5, |
|
"learning_rate/full": 0.00011825927853225391, |
|
"loss": 3.5974, |
|
"step": 127000, |
|
"training_step_in_ms": 967.7427954226732 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.118186391890049, |
|
"compute_loss_in_ms": 268.2419737614691, |
|
"epoch": 52.91, |
|
"learning_rate/full": 0.00011540225211753402, |
|
"loss": 3.5979, |
|
"step": 128000, |
|
"training_step_in_ms": 963.5640154518187 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.146437399089336, |
|
"compute_loss_in_ms": 267.88536206260324, |
|
"epoch": 53.33, |
|
"learning_rate/full": 0.00011256609893124084, |
|
"loss": 3.5919, |
|
"step": 129000, |
|
"training_step_in_ms": 965.4581209644675 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.140674088150263, |
|
"compute_loss_in_ms": 267.7817959152162, |
|
"epoch": 53.74, |
|
"learning_rate/full": 0.00010975151875173475, |
|
"loss": 3.5954, |
|
"step": 130000, |
|
"training_step_in_ms": 967.2819016650319 |
|
}, |
|
{ |
|
"epoch": 53.74, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5497984886169434, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.27146193885645503, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.8468, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.277, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.321, |
|
"step": 130000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.144404723149974, |
|
"compute_loss_in_ms": 267.8810519017279, |
|
"epoch": 54.15, |
|
"learning_rate/full": 0.00010695920603455975, |
|
"loss": 3.5914, |
|
"step": 131000, |
|
"training_step_in_ms": 962.7643201723695 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.15174587816, |
|
"compute_loss_in_ms": 268.55379743501544, |
|
"epoch": 54.57, |
|
"learning_rate/full": 0.00010418984974109642, |
|
"loss": 3.5916, |
|
"step": 132000, |
|
"training_step_in_ms": 965.8136657737195 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.164624106138945, |
|
"compute_loss_in_ms": 268.1068575233221, |
|
"epoch": 54.98, |
|
"learning_rate/full": 0.00010144413316857143, |
|
"loss": 3.5824, |
|
"step": 133000, |
|
"training_step_in_ms": 961.5831676833332 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.1917338743805885, |
|
"compute_loss_in_ms": 268.29790291562676, |
|
"epoch": 55.39, |
|
"learning_rate/full": 9.872273378146393e-05, |
|
"loss": 3.5822, |
|
"step": 134000, |
|
"training_step_in_ms": 967.4604325480759 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.154745582491159, |
|
"compute_loss_in_ms": 268.35503727942705, |
|
"epoch": 55.81, |
|
"learning_rate/full": 9.602632304435166e-05, |
|
"loss": 3.5837, |
|
"step": 135000, |
|
"training_step_in_ms": 963.2355434708297 |
|
}, |
|
{ |
|
"epoch": 55.81, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5466184616088867, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2701472521164958, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.7707, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.287, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.321, |
|
"step": 135000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.1385579000159005, |
|
"compute_loss_in_ms": 268.1807456240058, |
|
"epoch": 56.22, |
|
"learning_rate/full": 9.335556625623667e-05, |
|
"loss": 3.5886, |
|
"step": 136000, |
|
"training_step_in_ms": 964.7279985249043 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.140180014073849, |
|
"compute_loss_in_ms": 268.0731739960611, |
|
"epoch": 56.63, |
|
"learning_rate/full": 9.071112238639306e-05, |
|
"loss": 3.5841, |
|
"step": 137000, |
|
"training_step_in_ms": 964.2245756573975 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.159709714353085, |
|
"compute_loss_in_ms": 268.24955869838595, |
|
"epoch": 57.05, |
|
"learning_rate/full": 8.809103753928327e-05, |
|
"loss": 3.5843, |
|
"step": 138000, |
|
"training_step_in_ms": 966.5491472817957 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.165288005024195, |
|
"compute_loss_in_ms": 268.81143694743514, |
|
"epoch": 57.46, |
|
"learning_rate/full": 8.550119824369325e-05, |
|
"loss": 3.5867, |
|
"step": 139000, |
|
"training_step_in_ms": 964.0126786530018 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.144395582377911, |
|
"compute_loss_in_ms": 268.206242531538, |
|
"epoch": 57.88, |
|
"learning_rate/full": 8.29370600270935e-05, |
|
"loss": 3.5852, |
|
"step": 140000, |
|
"training_step_in_ms": 962.685001052916 |
|
}, |
|
{ |
|
"epoch": 57.88, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5455029010772705, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2711795494440531, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.9766, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.259, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.321, |
|
"step": 140000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.152141958475113, |
|
"compute_loss_in_ms": 267.9933222196996, |
|
"epoch": 58.29, |
|
"learning_rate/full": 8.040438372331344e-05, |
|
"loss": 3.5737, |
|
"step": 141000, |
|
"training_step_in_ms": 965.1287141442299 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.142403397709131, |
|
"compute_loss_in_ms": 267.5065658353269, |
|
"epoch": 58.7, |
|
"learning_rate/full": 7.790121584830201e-05, |
|
"loss": 3.575, |
|
"step": 142000, |
|
"training_step_in_ms": 962.7664158046246 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.150233589112759, |
|
"compute_loss_in_ms": 268.65408623218536, |
|
"epoch": 59.12, |
|
"learning_rate/full": 7.542817402127658e-05, |
|
"loss": 3.5709, |
|
"step": 143000, |
|
"training_step_in_ms": 964.2099178209901 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.130799826234579, |
|
"compute_loss_in_ms": 267.8640896603465, |
|
"epoch": 59.53, |
|
"learning_rate/full": 7.298586842830323e-05, |
|
"loss": 3.5775, |
|
"step": 144000, |
|
"training_step_in_ms": 964.5784216374159 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.146471511572599, |
|
"compute_loss_in_ms": 268.14434216171503, |
|
"epoch": 59.94, |
|
"learning_rate/full": 7.057490167174197e-05, |
|
"loss": 3.5781, |
|
"step": 145000, |
|
"training_step_in_ms": 964.2295859828591 |
|
}, |
|
{ |
|
"epoch": 59.94, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5419652462005615, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2710637844956296, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.2475, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.224, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.319, |
|
"step": 145000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.13495619122575, |
|
"compute_loss_in_ms": 267.6772438697517, |
|
"epoch": 60.36, |
|
"learning_rate/full": 6.819586862156388e-05, |
|
"loss": 3.5713, |
|
"step": 146000, |
|
"training_step_in_ms": 963.0674764961004 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.138938769698143, |
|
"compute_loss_in_ms": 268.4652929417789, |
|
"epoch": 60.77, |
|
"learning_rate/full": 6.58493562685758e-05, |
|
"loss": 3.5755, |
|
"step": 147000, |
|
"training_step_in_ms": 965.1382315270603 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.149636901915073, |
|
"compute_loss_in_ms": 268.6144716888666, |
|
"epoch": 61.18, |
|
"learning_rate/full": 6.35336446255852e-05, |
|
"loss": 3.5689, |
|
"step": 148000, |
|
"training_step_in_ms": 967.6213804855943 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.154591448605061, |
|
"compute_loss_in_ms": 268.10440719127655, |
|
"epoch": 61.6, |
|
"learning_rate/full": 6.125393638794017e-05, |
|
"loss": 3.5736, |
|
"step": 149000, |
|
"training_step_in_ms": 966.7320594601333 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.149040505290031, |
|
"compute_loss_in_ms": 268.75643199309707, |
|
"epoch": 62.01, |
|
"learning_rate/full": 5.900623127984053e-05, |
|
"loss": 3.57, |
|
"step": 150000, |
|
"training_step_in_ms": 965.394243825227 |
|
}, |
|
{ |
|
"epoch": 62.01, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.542189359664917, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.27182213175584513, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.2758, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.22, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.319, |
|
"step": 150000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.197841770038372, |
|
"compute_loss_in_ms": 268.5856811106205, |
|
"epoch": 62.42, |
|
"learning_rate/full": 5.6795579206763614e-05, |
|
"loss": 3.5655, |
|
"step": 151000, |
|
"training_step_in_ms": 963.427967004478 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.1404072009027, |
|
"compute_loss_in_ms": 267.94744442403316, |
|
"epoch": 62.84, |
|
"learning_rate/full": 5.462026068170363e-05, |
|
"loss": 3.5665, |
|
"step": 152000, |
|
"training_step_in_ms": 965.5440159775317 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.148986879736185, |
|
"compute_loss_in_ms": 268.1357101947069, |
|
"epoch": 63.25, |
|
"learning_rate/full": 5.247868899032384e-05, |
|
"loss": 3.5648, |
|
"step": 153000, |
|
"training_step_in_ms": 965.260343439877 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.144355583935976, |
|
"compute_loss_in_ms": 268.8695700503886, |
|
"epoch": 63.66, |
|
"learning_rate/full": 5.0375675588795876e-05, |
|
"loss": 3.5699, |
|
"step": 154000, |
|
"training_step_in_ms": 968.1045257672668 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.134350396692753, |
|
"compute_loss_in_ms": 267.78631913661957, |
|
"epoch": 64.08, |
|
"learning_rate/full": 4.830957975043959e-05, |
|
"loss": 3.5654, |
|
"step": 155000, |
|
"training_step_in_ms": 965.367557708174 |
|
}, |
|
{ |
|
"epoch": 64.08, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5409913063049316, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.273054083346476, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.4578, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.197, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.319, |
|
"step": 155000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.169517766411712, |
|
"compute_loss_in_ms": 267.94907980412245, |
|
"epoch": 64.49, |
|
"learning_rate/full": 4.628091125348743e-05, |
|
"loss": 3.562, |
|
"step": 156000, |
|
"training_step_in_ms": 964.7187770940363 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.127725187689066, |
|
"compute_loss_in_ms": 267.56007508188486, |
|
"epoch": 64.9, |
|
"learning_rate/full": 4.429017064153536e-05, |
|
"loss": 3.5599, |
|
"step": 157000, |
|
"training_step_in_ms": 961.402901135385 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.122306831181049, |
|
"compute_loss_in_ms": 268.3586079515517, |
|
"epoch": 65.32, |
|
"learning_rate/full": 4.233784910004124e-05, |
|
"loss": 3.5666, |
|
"step": 158000, |
|
"training_step_in_ms": 965.8669985719025 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.136414989829063, |
|
"compute_loss_in_ms": 267.9736096225679, |
|
"epoch": 65.73, |
|
"learning_rate/full": 4.0424428335132335e-05, |
|
"loss": 3.5573, |
|
"step": 159000, |
|
"training_step_in_ms": 965.0534134693444 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.14548010751605, |
|
"compute_loss_in_ms": 268.10164315626025, |
|
"epoch": 66.14, |
|
"learning_rate/full": 3.855038045475119e-05, |
|
"loss": 3.5569, |
|
"step": 160000, |
|
"training_step_in_ms": 965.0257755257189 |
|
}, |
|
{ |
|
"epoch": 66.14, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.540762424468994, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2735980306318844, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.6347, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.305, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.322, |
|
"step": 160000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.134731147347427, |
|
"compute_loss_in_ms": 268.0676885545254, |
|
"epoch": 66.56, |
|
"learning_rate/full": 3.671616785217033e-05, |
|
"loss": 3.559, |
|
"step": 161000, |
|
"training_step_in_ms": 961.5968884006143 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.13828482478857, |
|
"compute_loss_in_ms": 268.11520731821656, |
|
"epoch": 66.97, |
|
"learning_rate/full": 3.4920467704438286e-05, |
|
"loss": 3.5617, |
|
"step": 162000, |
|
"training_step_in_ms": 963.3356633149087 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.1371137127280235, |
|
"compute_loss_in_ms": 267.97775723040104, |
|
"epoch": 67.38, |
|
"learning_rate/full": 3.3169048798042254e-05, |
|
"loss": 3.5629, |
|
"step": 163000, |
|
"training_step_in_ms": 964.7222346775234 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.129249203950167, |
|
"compute_loss_in_ms": 267.63603001460433, |
|
"epoch": 67.8, |
|
"learning_rate/full": 3.145532456480391e-05, |
|
"loss": 3.5596, |
|
"step": 164000, |
|
"training_step_in_ms": 964.5063005648553 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.151564922183752, |
|
"compute_loss_in_ms": 268.839259788394, |
|
"epoch": 68.21, |
|
"learning_rate/full": 2.9784920606062528e-05, |
|
"loss": 3.5602, |
|
"step": 165000, |
|
"training_step_in_ms": 972.3141440451145 |
|
}, |
|
{ |
|
"epoch": 68.21, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.539008855819702, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2725576622048259, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.4123, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.202, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.319, |
|
"step": 165000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.126259837208725, |
|
"compute_loss_in_ms": 267.8272004313767, |
|
"epoch": 68.62, |
|
"learning_rate/full": 2.8156514671178745e-05, |
|
"loss": 3.5603, |
|
"step": 166000, |
|
"training_step_in_ms": 964.2809295020998 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.134287599474192, |
|
"compute_loss_in_ms": 267.94721764326096, |
|
"epoch": 69.04, |
|
"learning_rate/full": 2.65705085449506e-05, |
|
"loss": 3.5591, |
|
"step": 167000, |
|
"training_step_in_ms": 963.7021813839674 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.147611241787672, |
|
"compute_loss_in_ms": 268.29229406639934, |
|
"epoch": 69.45, |
|
"learning_rate/full": 2.5025770357450595e-05, |
|
"loss": 3.5561, |
|
"step": 168000, |
|
"training_step_in_ms": 967.2244190610945 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.15412675216794, |
|
"compute_loss_in_ms": 268.25271063297987, |
|
"epoch": 69.86, |
|
"learning_rate/full": 2.352577066262569e-05, |
|
"loss": 3.5576, |
|
"step": 169000, |
|
"training_step_in_ms": 965.3532739318907 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.129838448017836, |
|
"compute_loss_in_ms": 267.92896181344986, |
|
"epoch": 70.28, |
|
"learning_rate/full": 2.206931334324922e-05, |
|
"loss": 3.5536, |
|
"step": 170000, |
|
"training_step_in_ms": 965.5082765445113 |
|
}, |
|
{ |
|
"epoch": 70.28, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5376806259155273, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2738309179784362, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.9139, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.268, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.321, |
|
"step": 170000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.163786387298165, |
|
"compute_loss_in_ms": 267.95297726243734, |
|
"epoch": 70.69, |
|
"learning_rate/full": 2.0656757758371282e-05, |
|
"loss": 3.5571, |
|
"step": 171000, |
|
"training_step_in_ms": 960.7510039620101 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.137572426348925, |
|
"compute_loss_in_ms": 267.8121683038771, |
|
"epoch": 71.1, |
|
"learning_rate/full": 1.9287105043128472e-05, |
|
"loss": 3.555, |
|
"step": 172000, |
|
"training_step_in_ms": 963.8648240976036 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.139789171516895, |
|
"compute_loss_in_ms": 268.3458735384047, |
|
"epoch": 71.52, |
|
"learning_rate/full": 1.796343238799574e-05, |
|
"loss": 3.5518, |
|
"step": 173000, |
|
"training_step_in_ms": 965.790959071368 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.144272416830063, |
|
"compute_loss_in_ms": 268.10323084518313, |
|
"epoch": 71.93, |
|
"learning_rate/full": 1.6684674532049582e-05, |
|
"loss": 3.5512, |
|
"step": 174000, |
|
"training_step_in_ms": 961.3717007525265 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.1666854321956635, |
|
"compute_loss_in_ms": 268.03433157876134, |
|
"epoch": 72.34, |
|
"learning_rate/full": 1.5451146989656617e-05, |
|
"loss": 3.5495, |
|
"step": 175000, |
|
"training_step_in_ms": 967.3243609592319 |
|
}, |
|
{ |
|
"epoch": 72.34, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.536776065826416, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2743759293675203, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.6158, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.176, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.318, |
|
"step": 175000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.134207051701662, |
|
"compute_loss_in_ms": 267.52714550867677, |
|
"epoch": 72.76, |
|
"learning_rate/full": 1.4261987845053304e-05, |
|
"loss": 3.5555, |
|
"step": 176000, |
|
"training_step_in_ms": 962.5389591343701 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.146069306880236, |
|
"compute_loss_in_ms": 268.7413688749075, |
|
"epoch": 73.17, |
|
"learning_rate/full": 1.3119868774900613e-05, |
|
"loss": 3.5512, |
|
"step": 177000, |
|
"training_step_in_ms": 964.9299626871943 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.148835156112909, |
|
"compute_loss_in_ms": 268.0495460778475, |
|
"epoch": 73.58, |
|
"learning_rate/full": 1.2023859580780273e-05, |
|
"loss": 3.5529, |
|
"step": 178000, |
|
"training_step_in_ms": 967.7268707863986 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.1666895635426044, |
|
"compute_loss_in_ms": 268.2634797357023, |
|
"epoch": 74.0, |
|
"learning_rate/full": 1.0973203331088377e-05, |
|
"loss": 3.5538, |
|
"step": 179000, |
|
"training_step_in_ms": 965.1008929647505 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.153850518167019, |
|
"compute_loss_in_ms": 268.7998457066715, |
|
"epoch": 74.41, |
|
"learning_rate/full": 9.970260528869224e-06, |
|
"loss": 3.5524, |
|
"step": 180000, |
|
"training_step_in_ms": 968.3517145328224 |
|
}, |
|
{ |
|
"epoch": 74.41, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.536918878555298, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2735705193198496, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.7713, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.156, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.317, |
|
"step": 180000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.127806843054004, |
|
"compute_loss_in_ms": 268.1048993989825, |
|
"epoch": 74.82, |
|
"learning_rate/full": 9.01420472138852e-06, |
|
"loss": 3.5468, |
|
"step": 181000, |
|
"training_step_in_ms": 960.1139997318387 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.13564395532012, |
|
"compute_loss_in_ms": 267.3685629181564, |
|
"epoch": 75.24, |
|
"learning_rate/full": 8.105271801111003e-06, |
|
"loss": 3.552, |
|
"step": 182000, |
|
"training_step_in_ms": 964.2471651136875 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.140480011701584, |
|
"compute_loss_in_ms": 267.48710445687175, |
|
"epoch": 75.65, |
|
"learning_rate/full": 7.243686033634145e-06, |
|
"loss": 3.5473, |
|
"step": 183000, |
|
"training_step_in_ms": 966.0506127551198 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.12862478941679, |
|
"compute_loss_in_ms": 268.38187746331096, |
|
"epoch": 76.06, |
|
"learning_rate/full": 6.429660002353832e-06, |
|
"loss": 3.5535, |
|
"step": 184000, |
|
"training_step_in_ms": 963.8830341026187 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.138918172568083, |
|
"compute_loss_in_ms": 267.91103532910347, |
|
"epoch": 76.48, |
|
"learning_rate/full": 5.663394556012769e-06, |
|
"loss": 3.5489, |
|
"step": 185000, |
|
"training_step_in_ms": 969.0565127506852 |
|
}, |
|
{ |
|
"epoch": 76.48, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5358800888061523, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2731816800574383, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.2007, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.23, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.32, |
|
"step": 185000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.125211863982968, |
|
"compute_loss_in_ms": 267.94072189182043, |
|
"epoch": 76.89, |
|
"learning_rate/full": 4.944383807374142e-06, |
|
"loss": 3.5495, |
|
"step": 186000, |
|
"training_step_in_ms": 963.789376296103 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.155690658837557, |
|
"compute_loss_in_ms": 267.86934616044164, |
|
"epoch": 77.3, |
|
"learning_rate/full": 4.273596510048239e-06, |
|
"loss": 3.5465, |
|
"step": 187000, |
|
"training_step_in_ms": 966.8210936710238 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.130576055496931, |
|
"compute_loss_in_ms": 268.2106507457793, |
|
"epoch": 77.72, |
|
"learning_rate/full": 3.6517966776118407e-06, |
|
"loss": 3.5445, |
|
"step": 188000, |
|
"training_step_in_ms": 966.5816915780306 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.133735220879316, |
|
"compute_loss_in_ms": 267.8969533368945, |
|
"epoch": 78.13, |
|
"learning_rate/full": 3.0789924830065154e-06, |
|
"loss": 3.5528, |
|
"step": 189000, |
|
"training_step_in_ms": 964.6940425820649 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.137146957218647, |
|
"compute_loss_in_ms": 267.9762873612344, |
|
"epoch": 78.54, |
|
"learning_rate/full": 2.5536764226682607e-06, |
|
"loss": 3.5458, |
|
"step": 190000, |
|
"training_step_in_ms": 966.734307706356 |
|
}, |
|
{ |
|
"epoch": 78.54, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5369150638580322, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.272921503437743, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 79.0337, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.122, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.316, |
|
"step": 190000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.113826969774758, |
|
"compute_loss_in_ms": 267.3543768711388, |
|
"epoch": 78.96, |
|
"learning_rate/full": 2.077174866407172e-06, |
|
"loss": 3.5455, |
|
"step": 191000, |
|
"training_step_in_ms": 959.5898663066328 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.15868678689003, |
|
"compute_loss_in_ms": 268.5514197871089, |
|
"epoch": 79.37, |
|
"learning_rate/full": 1.650411851111966e-06, |
|
"loss": 3.5422, |
|
"step": 192000, |
|
"training_step_in_ms": 966.848380189389 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.152705859392881, |
|
"compute_loss_in_ms": 267.7775506339967, |
|
"epoch": 79.79, |
|
"learning_rate/full": 1.2717824473816864e-06, |
|
"loss": 3.5542, |
|
"step": 193000, |
|
"training_step_in_ms": 966.0438013672829 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.149454560130835, |
|
"compute_loss_in_ms": 268.18433906137943, |
|
"epoch": 80.2, |
|
"learning_rate/full": 9.425893981038769e-07, |
|
"loss": 3.5513, |
|
"step": 194000, |
|
"training_step_in_ms": 968.7132156044245 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.145272459834814, |
|
"compute_loss_in_ms": 269.00753265991807, |
|
"epoch": 80.61, |
|
"learning_rate/full": 6.625107863321489e-07, |
|
"loss": 3.5423, |
|
"step": 195000, |
|
"training_step_in_ms": 966.2778741791844 |
|
}, |
|
{ |
|
"epoch": 80.61, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5363166332244873, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2732828183368321, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.105, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.243, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.32, |
|
"step": 195000 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.114095866680145, |
|
"compute_loss_in_ms": 267.9977478161454, |
|
"epoch": 81.03, |
|
"learning_rate/full": 4.3161571727299287e-07, |
|
"loss": 3.5457, |
|
"step": 196000, |
|
"training_step_in_ms": 963.1876187734306 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.132705166935921, |
|
"compute_loss_in_ms": 268.0948423668742, |
|
"epoch": 81.44, |
|
"learning_rate/full": 2.4980400999989885e-07, |
|
"loss": 3.5462, |
|
"step": 197000, |
|
"training_step_in_ms": 967.0936130546033 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.152493238449097, |
|
"compute_loss_in_ms": 268.8196250721812, |
|
"epoch": 81.85, |
|
"learning_rate/full": 1.174841397763915e-07, |
|
"loss": 3.5462, |
|
"step": 198000, |
|
"training_step_in_ms": 964.0161675550044 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.15958097204566, |
|
"compute_loss_in_ms": 268.9542033970356, |
|
"epoch": 82.27, |
|
"learning_rate/full": 3.4482289435100457e-08, |
|
"loss": 3.5489, |
|
"step": 199000, |
|
"training_step_in_ms": 964.1794747672975 |
|
}, |
|
{ |
|
"_prepare_inputs_in_ms": 4.161274570971727, |
|
"compute_loss_in_ms": 268.2289356328547, |
|
"epoch": 82.68, |
|
"learning_rate/full": 8.099638465708381e-10, |
|
"loss": 3.5503, |
|
"step": 200000, |
|
"training_step_in_ms": 966.4167955368757 |
|
}, |
|
{ |
|
"epoch": 82.68, |
|
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5363588333129883, |
|
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.27337310510486335, |
|
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.3968, |
|
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.204, |
|
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.319, |
|
"step": 200000 |
|
} |
|
], |
|
"max_steps": 200000, |
|
"num_train_epochs": 83, |
|
"total_flos": 1.6535680980503157e+23, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|