xk-huang
[add] model
86a1106
{
"best_metric": 3.5358800888061523,
"best_model_checkpoint": "/mnt/output/projects/sca-xiaoke-v3/amlt-results/7300886566.81622-380c5407-4540-4a74-b6ec-7def0683f098/checkpoint-185000",
"epoch": 82.67879288962381,
"global_step": 200000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"_prepare_inputs_in_ms": 10.839506983757019,
"compute_loss_in_ms": 1584.6049636602402,
"epoch": 0.0,
"learning_rate/full": 0.0,
"loss": 8.622,
"step": 1,
"training_step_in_ms": 2253.9908327162266
},
{
"epoch": 0.0,
"eval_visual_genome-densecap-local-densecap-test_loss": 8.927019119262695,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.023580759441051608,
"eval_visual_genome-densecap-local-densecap-test_runtime": 150.659,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 5.31,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.166,
"step": 1
},
{
"_prepare_inputs_in_ms": 4.052688444062369,
"compute_loss_in_ms": 266.6276198354092,
"epoch": 0.41,
"learning_rate/full": 0.0003999851506717227,
"loss": 4.9777,
"step": 1000,
"training_step_in_ms": 963.7469428184035
},
{
"_prepare_inputs_in_ms": 4.001575957983732,
"compute_loss_in_ms": 266.9940203540027,
"epoch": 0.83,
"learning_rate/full": 0.0003999221107895784,
"loss": 4.4794,
"step": 2000,
"training_step_in_ms": 964.067553780973
},
{
"_prepare_inputs_in_ms": 4.017723824828863,
"compute_loss_in_ms": 266.8530354350805,
"epoch": 1.24,
"learning_rate/full": 0.0003998096443163716,
"loss": 4.3589,
"step": 3000,
"training_step_in_ms": 964.8137692287564
},
{
"_prepare_inputs_in_ms": 3.9884973876178265,
"compute_loss_in_ms": 266.8117158599198,
"epoch": 1.65,
"learning_rate/full": 0.0003996477790571026,
"loss": 4.2668,
"step": 4000,
"training_step_in_ms": 963.3689811453223
},
{
"_prepare_inputs_in_ms": 4.001692395657301,
"compute_loss_in_ms": 267.8194024413824,
"epoch": 2.07,
"learning_rate/full": 0.0003994365550295963,
"loss": 4.2092,
"step": 5000,
"training_step_in_ms": 965.0005767121911
},
{
"epoch": 2.07,
"eval_visual_genome-densecap-local-densecap-test_loss": 4.066258430480957,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.19624665436714503,
"eval_visual_genome-densecap-local-densecap-test_runtime": 81.5743,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 9.807,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.306,
"step": 5000
},
{
"_prepare_inputs_in_ms": 4.123009167066434,
"compute_loss_in_ms": 267.90184961631894,
"epoch": 2.48,
"learning_rate/full": 0.0003991760244546079,
"loss": 4.1535,
"step": 6000,
"training_step_in_ms": 963.1004312746227
},
{
"_prepare_inputs_in_ms": 4.096908804029226,
"compute_loss_in_ms": 268.2109449021518,
"epoch": 2.89,
"learning_rate/full": 0.00039886625174291286,
"loss": 4.1103,
"step": 7000,
"training_step_in_ms": 965.0139690972865
},
{
"_prepare_inputs_in_ms": 4.150357250124216,
"compute_loss_in_ms": 269.2836431860924,
"epoch": 3.31,
"learning_rate/full": 0.0003985073134793826,
"loss": 4.0761,
"step": 8000,
"training_step_in_ms": 969.6529387235641
},
{
"_prepare_inputs_in_ms": 4.171766873449087,
"compute_loss_in_ms": 268.9554896838963,
"epoch": 3.72,
"learning_rate/full": 0.00039809973090042857,
"loss": 4.0582,
"step": 9000,
"training_step_in_ms": 964.8072783201933
},
{
"_prepare_inputs_in_ms": 4.219205696135759,
"compute_loss_in_ms": 268.6923326961696,
"epoch": 4.13,
"learning_rate/full": 0.00039764327017710485,
"loss": 4.0324,
"step": 10000,
"training_step_in_ms": 962.4501793310046
},
{
"epoch": 4.13,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.913562059402466,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.22121572228147113,
"eval_visual_genome-densecap-local-densecap-test_runtime": 79.9476,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.007,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.313,
"step": 10000
},
{
"_prepare_inputs_in_ms": 4.152017308444512,
"compute_loss_in_ms": 268.094536613673,
"epoch": 4.55,
"learning_rate/full": 0.0003971380439342646,
"loss": 4.0153,
"step": 11000,
"training_step_in_ms": 964.2485933154821
},
{
"_prepare_inputs_in_ms": 4.1431227289140224,
"compute_loss_in_ms": 268.42261432111263,
"epoch": 4.96,
"learning_rate/full": 0.00039658359808291836,
"loss": 4.0053,
"step": 12000,
"training_step_in_ms": 965.7689935192466
},
{
"_prepare_inputs_in_ms": 4.223931197077036,
"compute_loss_in_ms": 268.6585740670562,
"epoch": 5.37,
"learning_rate/full": 0.00039598117829320827,
"loss": 3.9802,
"step": 13000,
"training_step_in_ms": 960.5111146196723
},
{
"_prepare_inputs_in_ms": 4.1840940825641155,
"compute_loss_in_ms": 268.2862157560885,
"epoch": 5.79,
"learning_rate/full": 0.00039533040308028367,
"loss": 3.9633,
"step": 14000,
"training_step_in_ms": 968.1838200092316
},
{
"_prepare_inputs_in_ms": 4.200506843626499,
"compute_loss_in_ms": 268.91191502287984,
"epoch": 6.2,
"learning_rate/full": 0.0003946307092543998,
"loss": 3.941,
"step": 15000,
"training_step_in_ms": 968.3050900287926
},
{
"epoch": 6.2,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.8218424320220947,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2321593168121597,
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.2057,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.229,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.32,
"step": 15000
},
{
"_prepare_inputs_in_ms": 4.21836834491753,
"compute_loss_in_ms": 268.7001321054995,
"epoch": 6.61,
"learning_rate/full": 0.0003938844405523341,
"loss": 3.9323,
"step": 16000,
"training_step_in_ms": 984.531311199069
},
{
"_prepare_inputs_in_ms": 4.2030105367302895,
"compute_loss_in_ms": 268.3060254715383,
"epoch": 7.03,
"learning_rate/full": 0.00039308879047835453,
"loss": 3.9216,
"step": 17000,
"training_step_in_ms": 961.8699175454676
},
{
"_prepare_inputs_in_ms": 4.2327940091490746,
"compute_loss_in_ms": 269.27323868498206,
"epoch": 7.44,
"learning_rate/full": 0.00039224627037346294,
"loss": 3.8992,
"step": 18000,
"training_step_in_ms": 967.632270719856
},
{
"_prepare_inputs_in_ms": 4.229459121823311,
"compute_loss_in_ms": 268.5666101500392,
"epoch": 7.85,
"learning_rate/full": 0.00039135631637799936,
"loss": 3.8984,
"step": 19000,
"training_step_in_ms": 963.238344412297
},
{
"_prepare_inputs_in_ms": 4.240339521318674,
"compute_loss_in_ms": 268.11582005023956,
"epoch": 8.27,
"learning_rate/full": 0.00039041818639024787,
"loss": 3.8907,
"step": 20000,
"training_step_in_ms": 960.5583217255771
},
{
"epoch": 8.27,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.7651355266571045,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2403944760451539,
"eval_visual_genome-densecap-local-densecap-test_runtime": 80.0701,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 9.991,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.312,
"step": 20000
},
{
"_prepare_inputs_in_ms": 4.2025597829644274,
"compute_loss_in_ms": 267.9062583371997,
"epoch": 8.68,
"learning_rate/full": 0.00038943398810118026,
"loss": 3.8736,
"step": 21000,
"training_step_in_ms": 962.8509967587888
},
{
"_prepare_inputs_in_ms": 4.1947984509170055,
"compute_loss_in_ms": 268.05593667179346,
"epoch": 9.09,
"learning_rate/full": 0.00038840304981011036,
"loss": 3.8689,
"step": 22000,
"training_step_in_ms": 965.0497910194099
},
{
"_prepare_inputs_in_ms": 4.219467684626579,
"compute_loss_in_ms": 268.2473221644759,
"epoch": 9.51,
"learning_rate/full": 0.0003873256258856351,
"loss": 3.8553,
"step": 23000,
"training_step_in_ms": 967.3452698886395
},
{
"_prepare_inputs_in_ms": 4.203684389591217,
"compute_loss_in_ms": 268.0240872502327,
"epoch": 9.92,
"learning_rate/full": 0.00038620312995292836,
"loss": 3.8464,
"step": 24000,
"training_step_in_ms": 960.33872378245
},
{
"_prepare_inputs_in_ms": 4.218942817300558,
"compute_loss_in_ms": 268.9947931431234,
"epoch": 10.33,
"learning_rate/full": 0.0003850323958934377,
"loss": 3.8356,
"step": 25000,
"training_step_in_ms": 967.6199573352933
},
{
"epoch": 10.33,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.71928071975708,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.24336343080593542,
"eval_visual_genome-densecap-local-densecap-test_runtime": 79.8751,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.016,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.313,
"step": 25000
},
{
"_prepare_inputs_in_ms": 4.202740984718974,
"compute_loss_in_ms": 268.5807599723339,
"epoch": 10.75,
"learning_rate/full": 0.0003838183948306088,
"loss": 3.8328,
"step": 26000,
"training_step_in_ms": 961.2188336364925
},
{
"_prepare_inputs_in_ms": 4.2269067615270615,
"compute_loss_in_ms": 267.7264535538852,
"epoch": 11.16,
"learning_rate/full": 0.00038255656126572534,
"loss": 3.8214,
"step": 27000,
"training_step_in_ms": 960.6881345175207
},
{
"_prepare_inputs_in_ms": 4.240487921983004,
"compute_loss_in_ms": 268.31112349405885,
"epoch": 11.58,
"learning_rate/full": 0.00038125092378570903,
"loss": 3.8196,
"step": 28000,
"training_step_in_ms": 964.0034716315567
},
{
"_prepare_inputs_in_ms": 4.273211572319269,
"compute_loss_in_ms": 268.9577633589506,
"epoch": 11.99,
"learning_rate/full": 0.0003798991913473777,
"loss": 3.8171,
"step": 29000,
"training_step_in_ms": 973.0124748162925
},
{
"_prepare_inputs_in_ms": 4.244079362601042,
"compute_loss_in_ms": 267.9022591896355,
"epoch": 12.4,
"learning_rate/full": 0.0003785058191464291,
"loss": 3.8013,
"step": 30000,
"training_step_in_ms": 962.8623519428074
},
{
"epoch": 12.4,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.687087297439575,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.24789182257436765,
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.5068,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.19,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.318,
"step": 30000
},
{
"_prepare_inputs_in_ms": 4.183955312502094,
"compute_loss_in_ms": 267.3523456119001,
"epoch": 12.82,
"learning_rate/full": 0.00037706702930065926,
"loss": 3.8065,
"step": 31000,
"training_step_in_ms": 957.8949020504951
},
{
"_prepare_inputs_in_ms": 4.198232229799032,
"compute_loss_in_ms": 267.4514962993562,
"epoch": 13.23,
"learning_rate/full": 0.0003755830450857345,
"loss": 3.7986,
"step": 32000,
"training_step_in_ms": 963.8669461458921
},
{
"_prepare_inputs_in_ms": 4.18659433722496,
"compute_loss_in_ms": 268.10614936053753,
"epoch": 13.64,
"learning_rate/full": 0.0003740572005600189,
"loss": 3.7923,
"step": 33000,
"training_step_in_ms": 965.2572022378445
},
{
"_prepare_inputs_in_ms": 4.225778687745333,
"compute_loss_in_ms": 268.18950264155865,
"epoch": 14.06,
"learning_rate/full": 0.00037248681827609586,
"loss": 3.7947,
"step": 34000,
"training_step_in_ms": 960.6446040645242
},
{
"_prepare_inputs_in_ms": 4.189065434038639,
"compute_loss_in_ms": 267.6565695255995,
"epoch": 14.47,
"learning_rate/full": 0.00037087542640234865,
"loss": 3.7849,
"step": 35000,
"training_step_in_ms": 964.44107465446
},
{
"epoch": 14.47,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.6763927936553955,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.246958162767791,
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.6323,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.305,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.322,
"step": 35000
},
{
"_prepare_inputs_in_ms": 4.164576116131573,
"compute_loss_in_ms": 267.3913585655391,
"epoch": 14.88,
"learning_rate/full": 0.0003692218735740006,
"loss": 3.7838,
"step": 36000,
"training_step_in_ms": 965.0988348089159
},
{
"_prepare_inputs_in_ms": 4.195226285606623,
"compute_loss_in_ms": 268.244338080287,
"epoch": 15.3,
"learning_rate/full": 0.00036752484999829976,
"loss": 3.7779,
"step": 37000,
"training_step_in_ms": 966.1850301101804
},
{
"_prepare_inputs_in_ms": 4.189992021769285,
"compute_loss_in_ms": 267.8583819307387,
"epoch": 15.71,
"learning_rate/full": 0.0003657881683678541,
"loss": 3.7748,
"step": 38000,
"training_step_in_ms": 963.9664278812706
},
{
"_prepare_inputs_in_ms": 4.199680101126432,
"compute_loss_in_ms": 268.06280748173594,
"epoch": 16.12,
"learning_rate/full": 0.00036401058098760525,
"loss": 3.7695,
"step": 39000,
"training_step_in_ms": 967.5451415590942
},
{
"_prepare_inputs_in_ms": 4.182811006903648,
"compute_loss_in_ms": 267.7034317664802,
"epoch": 16.54,
"learning_rate/full": 0.00036219252645064074,
"loss": 3.7688,
"step": 40000,
"training_step_in_ms": 967.6426770947874
},
{
"epoch": 16.54,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.658348321914673,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.25104865208221006,
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.4516,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.329,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.323,
"step": 40000
},
{
"_prepare_inputs_in_ms": 4.188235598366435,
"compute_loss_in_ms": 267.2028581239283,
"epoch": 16.95,
"learning_rate/full": 0.0003603344533347134,
"loss": 3.761,
"step": 41000,
"training_step_in_ms": 958.9369925446808
},
{
"_prepare_inputs_in_ms": 4.214274771511555,
"compute_loss_in_ms": 267.64739087969065,
"epoch": 17.36,
"learning_rate/full": 0.00035843490089475537,
"loss": 3.7527,
"step": 42000,
"training_step_in_ms": 966.9140360169113
},
{
"_prepare_inputs_in_ms": 4.22203628346324,
"compute_loss_in_ms": 268.2027486599982,
"epoch": 17.78,
"learning_rate/full": 0.00035650009493379324,
"loss": 3.7569,
"step": 43000,
"training_step_in_ms": 965.1608090028167
},
{
"_prepare_inputs_in_ms": 4.219520688056946,
"compute_loss_in_ms": 268.0517144687474,
"epoch": 18.19,
"learning_rate/full": 0.00035452275921920933,
"loss": 3.7513,
"step": 44000,
"training_step_in_ms": 965.6609862968326
},
{
"_prepare_inputs_in_ms": 4.1790814362466335,
"compute_loss_in_ms": 267.46442713588476,
"epoch": 18.6,
"learning_rate/full": 0.0003525092554160055,
"loss": 3.7467,
"step": 45000,
"training_step_in_ms": 965.7583395838737
},
{
"epoch": 18.6,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.6469690799713135,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.25092950859358,
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.5468,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.185,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.318,
"step": 45000
},
{
"_prepare_inputs_in_ms": 4.220321690890847,
"compute_loss_in_ms": 267.56717593222857,
"epoch": 19.02,
"learning_rate/full": 0.0003504601940692656,
"loss": 3.7497,
"step": 46000,
"training_step_in_ms": 964.2354487106204
},
{
"_prepare_inputs_in_ms": 4.205725617706776,
"compute_loss_in_ms": 268.48560455814004,
"epoch": 19.43,
"learning_rate/full": 0.0003483698657658315,
"loss": 3.7388,
"step": 47000,
"training_step_in_ms": 967.1772802136838
},
{
"_prepare_inputs_in_ms": 4.253620557487011,
"compute_loss_in_ms": 267.8220782019198,
"epoch": 19.84,
"learning_rate/full": 0.0003462450012513184,
"loss": 3.744,
"step": 48000,
"training_step_in_ms": 962.239847779274
},
{
"_prepare_inputs_in_ms": 4.241022698581219,
"compute_loss_in_ms": 268.39736769348383,
"epoch": 20.26,
"learning_rate/full": 0.00034408405297105753,
"loss": 3.7372,
"step": 49000,
"training_step_in_ms": 966.1254425011575
},
{
"_prepare_inputs_in_ms": 4.21300457790494,
"compute_loss_in_ms": 268.7097208276391,
"epoch": 20.67,
"learning_rate/full": 0.0003418853377786221,
"loss": 3.7334,
"step": 50000,
"training_step_in_ms": 968.8591329194605
},
{
"epoch": 20.67,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.632450580596924,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.253658040934189,
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.9084,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.268,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.321,
"step": 50000
},
{
"_prepare_inputs_in_ms": 4.228368219805927,
"compute_loss_in_ms": 268.4243040457368,
"epoch": 21.08,
"learning_rate/full": 0.0003396560466114797,
"loss": 3.7438,
"step": 51000,
"training_step_in_ms": 964.8838895820081
},
{
"_prepare_inputs_in_ms": 4.233973186463118,
"compute_loss_in_ms": 268.22105176746845,
"epoch": 21.5,
"learning_rate/full": 0.0003373900810764743,
"loss": 3.728,
"step": 52000,
"training_step_in_ms": 962.5837270207703
},
{
"_prepare_inputs_in_ms": 4.230040587484837,
"compute_loss_in_ms": 267.9561189264059,
"epoch": 21.91,
"learning_rate/full": 0.0003350878976336386,
"loss": 3.7287,
"step": 53000,
"training_step_in_ms": 964.1780665256083
},
{
"_prepare_inputs_in_ms": 4.2476331405341625,
"compute_loss_in_ms": 268.6795903816819,
"epoch": 22.32,
"learning_rate/full": 0.0003327546685845955,
"loss": 3.7223,
"step": 54000,
"training_step_in_ms": 967.9701336547732
},
{
"_prepare_inputs_in_ms": 4.220093585550785,
"compute_loss_in_ms": 267.76603213325143,
"epoch": 22.74,
"learning_rate/full": 0.00033038868430752995,
"loss": 3.7261,
"step": 55000,
"training_step_in_ms": 962.9226383566856
},
{
"epoch": 22.74,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.6242456436157227,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.25521777862203787,
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.5774,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.181,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.318,
"step": 55000
},
{
"_prepare_inputs_in_ms": 4.227604019205745,
"compute_loss_in_ms": 267.647510971874,
"epoch": 23.15,
"learning_rate/full": 0.00032799052857365924,
"loss": 3.7232,
"step": 56000,
"training_step_in_ms": 963.1331409327686
},
{
"_prepare_inputs_in_ms": 4.1824629083275795,
"compute_loss_in_ms": 267.5452450104058,
"epoch": 23.56,
"learning_rate/full": 0.0003255583453025672,
"loss": 3.7153,
"step": 57000,
"training_step_in_ms": 965.8048706538975
},
{
"_prepare_inputs_in_ms": 4.190924048423767,
"compute_loss_in_ms": 268.4611966535449,
"epoch": 23.98,
"learning_rate/full": 0.0003230975988657048,
"loss": 3.72,
"step": 58000,
"training_step_in_ms": 965.0302759557962
},
{
"_prepare_inputs_in_ms": 4.20093110203743,
"compute_loss_in_ms": 267.884086355567,
"epoch": 24.39,
"learning_rate/full": 0.0003206064799382713,
"loss": 3.7127,
"step": 59000,
"training_step_in_ms": 964.0987507812679
},
{
"_prepare_inputs_in_ms": 4.210771672427654,
"compute_loss_in_ms": 267.6700286902487,
"epoch": 24.8,
"learning_rate/full": 0.00031808560316658635,
"loss": 3.7115,
"step": 60000,
"training_step_in_ms": 965.6994955539703
},
{
"epoch": 24.8,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.61262583732605,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.259026039077661,
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.8405,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.277,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.321,
"step": 60000
},
{
"_prepare_inputs_in_ms": 4.141795973225338,
"compute_loss_in_ms": 267.2422932982445,
"epoch": 25.22,
"learning_rate/full": 0.0003155330235866319,
"loss": 3.7085,
"step": 61000,
"training_step_in_ms": 965.9709356427193
},
{
"_prepare_inputs_in_ms": 4.12061008810997,
"compute_loss_in_ms": 268.04699283093214,
"epoch": 25.63,
"learning_rate/full": 0.000312954476063518,
"loss": 3.7031,
"step": 62000,
"training_step_in_ms": 964.8432326950133
},
{
"_prepare_inputs_in_ms": 4.14773878082633,
"compute_loss_in_ms": 268.0800936706364,
"epoch": 26.04,
"learning_rate/full": 0.00031035068146119334,
"loss": 3.7053,
"step": 63000,
"training_step_in_ms": 964.9066540151834
},
{
"_prepare_inputs_in_ms": 4.157721221446991,
"compute_loss_in_ms": 267.8991154767573,
"epoch": 26.46,
"learning_rate/full": 0.00030771441463138695,
"loss": 3.6991,
"step": 64000,
"training_step_in_ms": 966.7548437044024
},
{
"_prepare_inputs_in_ms": 4.127573002129793,
"compute_loss_in_ms": 268.0769842043519,
"epoch": 26.87,
"learning_rate/full": 0.00030505419362911944,
"loss": 3.7026,
"step": 65000,
"training_step_in_ms": 966.6518254801631
},
{
"epoch": 26.87,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.604250907897949,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2600293381296915,
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.2046,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.362,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.324,
"step": 65000
},
{
"_prepare_inputs_in_ms": 4.138722216210714,
"compute_loss_in_ms": 268.0730670392513,
"epoch": 27.28,
"learning_rate/full": 0.0003023653504808654,
"loss": 3.6903,
"step": 66000,
"training_step_in_ms": 965.3969647027552
},
{
"_prepare_inputs_in_ms": 4.153087247163057,
"compute_loss_in_ms": 268.1363028138876,
"epoch": 27.7,
"learning_rate/full": 0.0002996566527388639,
"loss": 3.6969,
"step": 67000,
"training_step_in_ms": 965.2745163962245
},
{
"_prepare_inputs_in_ms": 4.149796262383461,
"compute_loss_in_ms": 267.83912086486816,
"epoch": 28.11,
"learning_rate/full": 0.0002969179137925403,
"loss": 3.6937,
"step": 68000,
"training_step_in_ms": 968.0436515249312
},
{
"_prepare_inputs_in_ms": 4.1318743117153645,
"compute_loss_in_ms": 268.5812944062054,
"epoch": 28.52,
"learning_rate/full": 0.0002941579883457959,
"loss": 3.6891,
"step": 69000,
"training_step_in_ms": 964.7220857255161
},
{
"_prepare_inputs_in_ms": 4.13500452041626,
"compute_loss_in_ms": 267.81502260267735,
"epoch": 28.94,
"learning_rate/full": 0.0002913748308243434,
"loss": 3.6864,
"step": 70000,
"training_step_in_ms": 964.9831298328936
},
{
"epoch": 28.94,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5996363162994385,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.26106738202465474,
"eval_visual_genome-densecap-local-densecap-test_runtime": 79.1905,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.102,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.316,
"step": 70000
},
{
"_prepare_inputs_in_ms": 4.127892008641871,
"compute_loss_in_ms": 267.3319378942251,
"epoch": 29.35,
"learning_rate/full": 0.000288569127930656,
"loss": 3.6864,
"step": 71000,
"training_step_in_ms": 964.4970440678298
},
{
"_prepare_inputs_in_ms": 4.127237547188997,
"compute_loss_in_ms": 267.12262638285756,
"epoch": 29.76,
"learning_rate/full": 0.0002857387308278068,
"loss": 3.688,
"step": 72000,
"training_step_in_ms": 963.8779099695385
},
{
"_prepare_inputs_in_ms": 4.134644038975239,
"compute_loss_in_ms": 268.62900394946337,
"epoch": 30.18,
"learning_rate/full": 0.0002828899985518552,
"loss": 3.6777,
"step": 73000,
"training_step_in_ms": 966.1114624030888
},
{
"_prepare_inputs_in_ms": 4.121612053364515,
"compute_loss_in_ms": 267.61186150833964,
"epoch": 30.59,
"learning_rate/full": 0.00028002081440907064,
"loss": 3.6805,
"step": 74000,
"training_step_in_ms": 966.5145794674754
},
{
"_prepare_inputs_in_ms": 4.143208879977465,
"compute_loss_in_ms": 268.1201763525605,
"epoch": 31.0,
"learning_rate/full": 0.00027713188632770775,
"loss": 3.6879,
"step": 75000,
"training_step_in_ms": 965.0215070433915
},
{
"epoch": 31.0,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5912275314331055,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.26092454356630995,
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.6905,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.166,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.318,
"step": 75000
},
{
"_prepare_inputs_in_ms": 4.137767382511279,
"compute_loss_in_ms": 267.779229991138,
"epoch": 31.42,
"learning_rate/full": 0.00027422684725453034,
"loss": 3.6725,
"step": 76000,
"training_step_in_ms": 963.9590919055045
},
{
"_prepare_inputs_in_ms": 4.138436369597912,
"compute_loss_in_ms": 268.5314156524837,
"epoch": 31.83,
"learning_rate/full": 0.0002712976542440004,
"loss": 3.6758,
"step": 77000,
"training_step_in_ms": 964.5805881880224
},
{
"_prepare_inputs_in_ms": 4.146489001810551,
"compute_loss_in_ms": 268.08270847052336,
"epoch": 32.24,
"learning_rate/full": 0.00026835083436875734,
"loss": 3.6692,
"step": 78000,
"training_step_in_ms": 966.2784307040274
},
{
"_prepare_inputs_in_ms": 4.1479257568717,
"compute_loss_in_ms": 267.2712250612676,
"epoch": 32.66,
"learning_rate/full": 0.0002653930599834242,
"loss": 3.6736,
"step": 79000,
"training_step_in_ms": 968.4041320718825
},
{
"_prepare_inputs_in_ms": 4.126915082335472,
"compute_loss_in_ms": 268.5138017758727,
"epoch": 33.07,
"learning_rate/full": 0.0002624132077738845,
"loss": 3.6731,
"step": 80000,
"training_step_in_ms": 969.1153637133539
},
{
"epoch": 33.07,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5850701332092285,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2637883107097123,
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.0939,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.377,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.324,
"step": 80000
},
{
"_prepare_inputs_in_ms": 4.120095092348937,
"compute_loss_in_ms": 267.7357228696346,
"epoch": 33.48,
"learning_rate/full": 0.0002594179251945605,
"loss": 3.6671,
"step": 81000,
"training_step_in_ms": 963.6873134560883
},
{
"_prepare_inputs_in_ms": 4.124605063349009,
"compute_loss_in_ms": 267.57319816574454,
"epoch": 33.9,
"learning_rate/full": 0.00025641096982950234,
"loss": 3.6662,
"step": 82000,
"training_step_in_ms": 965.3064449094236
},
{
"_prepare_inputs_in_ms": 4.129976071417332,
"compute_loss_in_ms": 267.9822950810194,
"epoch": 34.31,
"learning_rate/full": 0.00025339009590173424,
"loss": 3.6651,
"step": 83000,
"training_step_in_ms": 967.112907551229
},
{
"_prepare_inputs_in_ms": 4.144246697425842,
"compute_loss_in_ms": 268.09172417223454,
"epoch": 34.73,
"learning_rate/full": 0.0002503530053325778,
"loss": 3.6622,
"step": 84000,
"training_step_in_ms": 963.3224161304533
},
{
"_prepare_inputs_in_ms": 4.138608705252409,
"compute_loss_in_ms": 267.34737430512905,
"epoch": 35.14,
"learning_rate/full": 0.0002473065215350535,
"loss": 3.66,
"step": 85000,
"training_step_in_ms": 964.2706917002797
},
{
"epoch": 35.14,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5811269283294678,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2639846881301574,
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.4776,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.194,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.319,
"step": 85000
},
{
"_prepare_inputs_in_ms": 4.154233903419681,
"compute_loss_in_ms": 267.71352230757475,
"epoch": 35.55,
"learning_rate/full": 0.00024424836556120313,
"loss": 3.6547,
"step": 86000,
"training_step_in_ms": 962.3722572363913
},
{
"_prepare_inputs_in_ms": 4.109987150877714,
"compute_loss_in_ms": 267.4717643670738,
"epoch": 35.97,
"learning_rate/full": 0.000241179291965253,
"loss": 3.662,
"step": 87000,
"training_step_in_ms": 962.7631023935974
},
{
"_prepare_inputs_in_ms": 4.130292858928442,
"compute_loss_in_ms": 268.7110885903239,
"epoch": 36.38,
"learning_rate/full": 0.0002381000579951894,
"loss": 3.6533,
"step": 88000,
"training_step_in_ms": 966.5117364116013
},
{
"_prepare_inputs_in_ms": 4.127315446734428,
"compute_loss_in_ms": 267.80369279161096,
"epoch": 36.79,
"learning_rate/full": 0.00023501142340591894,
"loss": 3.6541,
"step": 89000,
"training_step_in_ms": 966.1625612042844
},
{
"_prepare_inputs_in_ms": 4.147790517657995,
"compute_loss_in_ms": 268.44236666709185,
"epoch": 37.21,
"learning_rate/full": 0.00023191415027181022,
"loss": 3.6505,
"step": 90000,
"training_step_in_ms": 969.9625728055835
},
{
"epoch": 37.21,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5739023685455322,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2666824586460844,
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.5693,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.182,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.318,
"step": 90000
},
{
"_prepare_inputs_in_ms": 4.1041579188370125,
"compute_loss_in_ms": 267.84072072431445,
"epoch": 37.62,
"learning_rate/full": 0.00022880900279866363,
"loss": 3.6517,
"step": 91000,
"training_step_in_ms": 962.2163318134844
},
{
"_prepare_inputs_in_ms": 4.135395355522633,
"compute_loss_in_ms": 267.92124405503273,
"epoch": 38.03,
"learning_rate/full": 0.0002256936284593779,
"loss": 3.6526,
"step": 92000,
"training_step_in_ms": 965.9340194314718
},
{
"_prepare_inputs_in_ms": 4.124495934695005,
"compute_loss_in_ms": 267.63855477049947,
"epoch": 38.45,
"learning_rate/full": 0.00022257502654664658,
"loss": 3.6411,
"step": 93000,
"training_step_in_ms": 968.471509065479
},
{
"_prepare_inputs_in_ms": 4.13615457713604,
"compute_loss_in_ms": 268.6791280247271,
"epoch": 38.86,
"learning_rate/full": 0.00021945398441148287,
"loss": 3.6456,
"step": 94000,
"training_step_in_ms": 964.7193784303963
},
{
"_prepare_inputs_in_ms": 4.138962186872959,
"compute_loss_in_ms": 267.87416788190603,
"epoch": 39.27,
"learning_rate/full": 0.00021632188341385878,
"loss": 3.6474,
"step": 95000,
"training_step_in_ms": 964.3936127200723
},
{
"epoch": 39.27,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.570530414581299,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.26555671498307476,
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.8889,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.271,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.321,
"step": 95000
},
{
"_prepare_inputs_in_ms": 4.114193618297577,
"compute_loss_in_ms": 267.61803087219596,
"epoch": 39.69,
"learning_rate/full": 0.0002131888850633025,
"loss": 3.6443,
"step": 96000,
"training_step_in_ms": 962.9699364975095
},
{
"_prepare_inputs_in_ms": 4.118229653686285,
"compute_loss_in_ms": 267.60003339126706,
"epoch": 40.1,
"learning_rate/full": 0.00021005263255270636,
"loss": 3.6436,
"step": 97000,
"training_step_in_ms": 967.0044349320233
},
{
"_prepare_inputs_in_ms": 4.14753895252943,
"compute_loss_in_ms": 267.94382878765464,
"epoch": 40.51,
"learning_rate/full": 0.00020691389970544863,
"loss": 3.6409,
"step": 98000,
"training_step_in_ms": 965.2209133654833
},
{
"_prepare_inputs_in_ms": 4.132391892373562,
"compute_loss_in_ms": 268.32156636565924,
"epoch": 40.93,
"learning_rate/full": 0.00020377031677881017,
"loss": 3.6386,
"step": 99000,
"training_step_in_ms": 965.1960897520185
},
{
"_prepare_inputs_in_ms": 4.139371138066053,
"compute_loss_in_ms": 268.1989936903119,
"epoch": 41.34,
"learning_rate/full": 0.00020062894644154732,
"loss": 3.628,
"step": 100000,
"training_step_in_ms": 969.4596163183451
},
{
"epoch": 41.34,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.565774440765381,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.26571601552352997,
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.6144,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.307,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.322,
"step": 100000
},
{
"_prepare_inputs_in_ms": 4.108485870245026,
"compute_loss_in_ms": 267.23163178935647,
"epoch": 41.75,
"learning_rate/full": 0.00019748742092116103,
"loss": 3.6364,
"step": 101000,
"training_step_in_ms": 962.6803079359233
},
{
"_prepare_inputs_in_ms": 4.145125687122345,
"compute_loss_in_ms": 267.68679490312934,
"epoch": 42.17,
"learning_rate/full": 0.00019434651534206603,
"loss": 3.6315,
"step": 102000,
"training_step_in_ms": 964.9059623852372
},
{
"_prepare_inputs_in_ms": 4.14092817902565,
"compute_loss_in_ms": 268.40766886249185,
"epoch": 42.58,
"learning_rate/full": 0.00019120700467571537,
"loss": 3.6249,
"step": 103000,
"training_step_in_ms": 968.5381288193166
},
{
"_prepare_inputs_in_ms": 4.131742633879185,
"compute_loss_in_ms": 267.6234121248126,
"epoch": 42.99,
"learning_rate/full": 0.00018806966354938863,
"loss": 3.6302,
"step": 104000,
"training_step_in_ms": 965.0357882864773
},
{
"_prepare_inputs_in_ms": 4.159636992961168,
"compute_loss_in_ms": 268.2043272703886,
"epoch": 43.41,
"learning_rate/full": 0.0001849352660550636,
"loss": 3.6221,
"step": 105000,
"training_step_in_ms": 966.8701088428497
},
{
"epoch": 43.41,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.560976266860962,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2679473083105533,
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.6952,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.166,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.318,
"step": 105000
},
{
"_prepare_inputs_in_ms": 4.1656713769203275,
"compute_loss_in_ms": 267.7097022458911,
"epoch": 43.82,
"learning_rate/full": 0.00018180458555842107,
"loss": 3.6281,
"step": 106000,
"training_step_in_ms": 960.9392982535064
},
{
"_prepare_inputs_in_ms": 4.1548894718289375,
"compute_loss_in_ms": 268.3351138718426,
"epoch": 44.23,
"learning_rate/full": 0.00017867839450802815,
"loss": 3.6257,
"step": 107000,
"training_step_in_ms": 967.5997758358717
},
{
"_prepare_inputs_in_ms": 4.136493876576424,
"compute_loss_in_ms": 267.79356829449534,
"epoch": 44.65,
"learning_rate/full": 0.0001755574642447484,
"loss": 3.6275,
"step": 108000,
"training_step_in_ms": 964.6688169278204
},
{
"_prepare_inputs_in_ms": 4.146924342960119,
"compute_loss_in_ms": 268.7044747136533,
"epoch": 45.06,
"learning_rate/full": 0.00017244256481142465,
"loss": 3.6272,
"step": 109000,
"training_step_in_ms": 966.0691562928259
},
{
"_prepare_inputs_in_ms": 4.129870388656855,
"compute_loss_in_ms": 267.92700193077326,
"epoch": 45.47,
"learning_rate/full": 0.00016933446476288295,
"loss": 3.6231,
"step": 110000,
"training_step_in_ms": 968.8978024721146
},
{
"epoch": 45.47,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.557985544204712,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.26707363597972006,
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.4146,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.334,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.323,
"step": 110000
},
{
"_prepare_inputs_in_ms": 4.14337538001014,
"compute_loss_in_ms": 267.68642891570926,
"epoch": 45.89,
"learning_rate/full": 0.0001662308313853947,
"loss": 3.6179,
"step": 111000,
"training_step_in_ms": 963.7148243077099
},
{
"_prepare_inputs_in_ms": 4.14999657869339,
"compute_loss_in_ms": 267.70868534594774,
"epoch": 46.3,
"learning_rate/full": 0.000163135546733723,
"loss": 3.6124,
"step": 112000,
"training_step_in_ms": 967.6017691344023
},
{
"_prepare_inputs_in_ms": 4.146619476377964,
"compute_loss_in_ms": 268.191356562078,
"epoch": 46.71,
"learning_rate/full": 0.00016005245741683915,
"loss": 3.62,
"step": 113000,
"training_step_in_ms": 966.300628580153
},
{
"_prepare_inputs_in_ms": 4.153369773179293,
"compute_loss_in_ms": 267.8536421582103,
"epoch": 47.13,
"learning_rate/full": 0.00015697922455833988,
"loss": 3.6157,
"step": 114000,
"training_step_in_ms": 964.6176136285067
},
{
"_prepare_inputs_in_ms": 4.187301464378834,
"compute_loss_in_ms": 268.31423101201653,
"epoch": 47.54,
"learning_rate/full": 0.0001539166064324471,
"loss": 3.6143,
"step": 115000,
"training_step_in_ms": 968.9795580692589
},
{
"epoch": 47.54,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.556086778640747,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2680325079129448,
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.6426,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.173,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.318,
"step": 115000
},
{
"_prepare_inputs_in_ms": 4.146232630421475,
"compute_loss_in_ms": 267.5073589235544,
"epoch": 47.95,
"learning_rate/full": 0.00015086535869435647,
"loss": 3.6143,
"step": 116000,
"training_step_in_ms": 961.0740608982742
},
{
"_prepare_inputs_in_ms": 4.149144068360329,
"compute_loss_in_ms": 268.67081797868013,
"epoch": 48.37,
"learning_rate/full": 0.00014782623419379065,
"loss": 3.6076,
"step": 117000,
"training_step_in_ms": 968.1870553046465
},
{
"_prepare_inputs_in_ms": 4.165053818374872,
"compute_loss_in_ms": 267.5217378772795,
"epoch": 48.78,
"learning_rate/full": 0.00014479998278924466,
"loss": 3.6033,
"step": 118000,
"training_step_in_ms": 964.0207477062941
},
{
"_prepare_inputs_in_ms": 4.148088995367289,
"compute_loss_in_ms": 267.9359416142106,
"epoch": 49.19,
"learning_rate/full": 0.00014178735116296984,
"loss": 3.6099,
"step": 119000,
"training_step_in_ms": 965.35854877159
},
{
"_prepare_inputs_in_ms": 4.147441305220127,
"compute_loss_in_ms": 268.18652522563934,
"epoch": 49.61,
"learning_rate/full": 0.00013878908263674099,
"loss": 3.6041,
"step": 120000,
"training_step_in_ms": 966.7598981000483
},
{
"epoch": 49.61,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5552496910095215,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2690825925881079,
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.206,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.362,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.324,
"step": 120000
},
{
"_prepare_inputs_in_ms": 4.151007533073425,
"compute_loss_in_ms": 267.91314566135406,
"epoch": 50.02,
"learning_rate/full": 0.00013580293864950247,
"loss": 3.6068,
"step": 121000,
"training_step_in_ms": 965.1756884045899
},
{
"_prepare_inputs_in_ms": 4.154482748359442,
"compute_loss_in_ms": 268.1262241154909,
"epoch": 50.43,
"learning_rate/full": 0.00013283562815289706,
"loss": 3.5972,
"step": 122000,
"training_step_in_ms": 965.2079959511757
},
{
"_prepare_inputs_in_ms": 4.1559099070727825,
"compute_loss_in_ms": 267.7796282917261,
"epoch": 50.85,
"learning_rate/full": 0.0001298848894600429,
"loss": 3.6031,
"step": 123000,
"training_step_in_ms": 966.0297281630337
},
{
"_prepare_inputs_in_ms": 4.1683206632733345,
"compute_loss_in_ms": 268.80906841158867,
"epoch": 51.26,
"learning_rate/full": 0.00012694852315582903,
"loss": 3.5985,
"step": 124000,
"training_step_in_ms": 967.5091603025794
},
{
"_prepare_inputs_in_ms": 4.137588050216436,
"compute_loss_in_ms": 267.6871258877218,
"epoch": 51.67,
"learning_rate/full": 0.00012403603541958643,
"loss": 3.6029,
"step": 125000,
"training_step_in_ms": 964.4286920540035
},
{
"epoch": 51.67,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5499510765075684,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.268844144332836,
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.7216,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.293,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.322,
"step": 125000
},
{
"_prepare_inputs_in_ms": 4.127907207826289,
"compute_loss_in_ms": 267.8013560883701,
"epoch": 52.09,
"learning_rate/full": 0.00012113936318920029,
"loss": 3.5962,
"step": 126000,
"training_step_in_ms": 962.9286280833185
},
{
"_prepare_inputs_in_ms": 4.151306886225939,
"compute_loss_in_ms": 267.83537547290325,
"epoch": 52.5,
"learning_rate/full": 0.00011825927853225391,
"loss": 3.5974,
"step": 127000,
"training_step_in_ms": 967.7427954226732
},
{
"_prepare_inputs_in_ms": 4.118186391890049,
"compute_loss_in_ms": 268.2419737614691,
"epoch": 52.91,
"learning_rate/full": 0.00011540225211753402,
"loss": 3.5979,
"step": 128000,
"training_step_in_ms": 963.5640154518187
},
{
"_prepare_inputs_in_ms": 4.146437399089336,
"compute_loss_in_ms": 267.88536206260324,
"epoch": 53.33,
"learning_rate/full": 0.00011256609893124084,
"loss": 3.5919,
"step": 129000,
"training_step_in_ms": 965.4581209644675
},
{
"_prepare_inputs_in_ms": 4.140674088150263,
"compute_loss_in_ms": 267.7817959152162,
"epoch": 53.74,
"learning_rate/full": 0.00010975151875173475,
"loss": 3.5954,
"step": 130000,
"training_step_in_ms": 967.2819016650319
},
{
"epoch": 53.74,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5497984886169434,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.27146193885645503,
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.8468,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.277,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.321,
"step": 130000
},
{
"_prepare_inputs_in_ms": 4.144404723149974,
"compute_loss_in_ms": 267.8810519017279,
"epoch": 54.15,
"learning_rate/full": 0.00010695920603455975,
"loss": 3.5914,
"step": 131000,
"training_step_in_ms": 962.7643201723695
},
{
"_prepare_inputs_in_ms": 4.15174587816,
"compute_loss_in_ms": 268.55379743501544,
"epoch": 54.57,
"learning_rate/full": 0.00010418984974109642,
"loss": 3.5916,
"step": 132000,
"training_step_in_ms": 965.8136657737195
},
{
"_prepare_inputs_in_ms": 4.164624106138945,
"compute_loss_in_ms": 268.1068575233221,
"epoch": 54.98,
"learning_rate/full": 0.00010144413316857143,
"loss": 3.5824,
"step": 133000,
"training_step_in_ms": 961.5831676833332
},
{
"_prepare_inputs_in_ms": 4.1917338743805885,
"compute_loss_in_ms": 268.29790291562676,
"epoch": 55.39,
"learning_rate/full": 9.872273378146393e-05,
"loss": 3.5822,
"step": 134000,
"training_step_in_ms": 967.4604325480759
},
{
"_prepare_inputs_in_ms": 4.154745582491159,
"compute_loss_in_ms": 268.35503727942705,
"epoch": 55.81,
"learning_rate/full": 9.602632304435166e-05,
"loss": 3.5837,
"step": 135000,
"training_step_in_ms": 963.2355434708297
},
{
"epoch": 55.81,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5466184616088867,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2701472521164958,
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.7707,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.287,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.321,
"step": 135000
},
{
"_prepare_inputs_in_ms": 4.1385579000159005,
"compute_loss_in_ms": 268.1807456240058,
"epoch": 56.22,
"learning_rate/full": 9.335556625623667e-05,
"loss": 3.5886,
"step": 136000,
"training_step_in_ms": 964.7279985249043
},
{
"_prepare_inputs_in_ms": 4.140180014073849,
"compute_loss_in_ms": 268.0731739960611,
"epoch": 56.63,
"learning_rate/full": 9.071112238639306e-05,
"loss": 3.5841,
"step": 137000,
"training_step_in_ms": 964.2245756573975
},
{
"_prepare_inputs_in_ms": 4.159709714353085,
"compute_loss_in_ms": 268.24955869838595,
"epoch": 57.05,
"learning_rate/full": 8.809103753928327e-05,
"loss": 3.5843,
"step": 138000,
"training_step_in_ms": 966.5491472817957
},
{
"_prepare_inputs_in_ms": 4.165288005024195,
"compute_loss_in_ms": 268.81143694743514,
"epoch": 57.46,
"learning_rate/full": 8.550119824369325e-05,
"loss": 3.5867,
"step": 139000,
"training_step_in_ms": 964.0126786530018
},
{
"_prepare_inputs_in_ms": 4.144395582377911,
"compute_loss_in_ms": 268.206242531538,
"epoch": 57.88,
"learning_rate/full": 8.29370600270935e-05,
"loss": 3.5852,
"step": 140000,
"training_step_in_ms": 962.685001052916
},
{
"epoch": 57.88,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5455029010772705,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2711795494440531,
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.9766,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.259,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.321,
"step": 140000
},
{
"_prepare_inputs_in_ms": 4.152141958475113,
"compute_loss_in_ms": 267.9933222196996,
"epoch": 58.29,
"learning_rate/full": 8.040438372331344e-05,
"loss": 3.5737,
"step": 141000,
"training_step_in_ms": 965.1287141442299
},
{
"_prepare_inputs_in_ms": 4.142403397709131,
"compute_loss_in_ms": 267.5065658353269,
"epoch": 58.7,
"learning_rate/full": 7.790121584830201e-05,
"loss": 3.575,
"step": 142000,
"training_step_in_ms": 962.7664158046246
},
{
"_prepare_inputs_in_ms": 4.150233589112759,
"compute_loss_in_ms": 268.65408623218536,
"epoch": 59.12,
"learning_rate/full": 7.542817402127658e-05,
"loss": 3.5709,
"step": 143000,
"training_step_in_ms": 964.2099178209901
},
{
"_prepare_inputs_in_ms": 4.130799826234579,
"compute_loss_in_ms": 267.8640896603465,
"epoch": 59.53,
"learning_rate/full": 7.298586842830323e-05,
"loss": 3.5775,
"step": 144000,
"training_step_in_ms": 964.5784216374159
},
{
"_prepare_inputs_in_ms": 4.146471511572599,
"compute_loss_in_ms": 268.14434216171503,
"epoch": 59.94,
"learning_rate/full": 7.057490167174197e-05,
"loss": 3.5781,
"step": 145000,
"training_step_in_ms": 964.2295859828591
},
{
"epoch": 59.94,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5419652462005615,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2710637844956296,
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.2475,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.224,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.319,
"step": 145000
},
{
"_prepare_inputs_in_ms": 4.13495619122575,
"compute_loss_in_ms": 267.6772438697517,
"epoch": 60.36,
"learning_rate/full": 6.819586862156388e-05,
"loss": 3.5713,
"step": 146000,
"training_step_in_ms": 963.0674764961004
},
{
"_prepare_inputs_in_ms": 4.138938769698143,
"compute_loss_in_ms": 268.4652929417789,
"epoch": 60.77,
"learning_rate/full": 6.58493562685758e-05,
"loss": 3.5755,
"step": 147000,
"training_step_in_ms": 965.1382315270603
},
{
"_prepare_inputs_in_ms": 4.149636901915073,
"compute_loss_in_ms": 268.6144716888666,
"epoch": 61.18,
"learning_rate/full": 6.35336446255852e-05,
"loss": 3.5689,
"step": 148000,
"training_step_in_ms": 967.6213804855943
},
{
"_prepare_inputs_in_ms": 4.154591448605061,
"compute_loss_in_ms": 268.10440719127655,
"epoch": 61.6,
"learning_rate/full": 6.125393638794017e-05,
"loss": 3.5736,
"step": 149000,
"training_step_in_ms": 966.7320594601333
},
{
"_prepare_inputs_in_ms": 4.149040505290031,
"compute_loss_in_ms": 268.75643199309707,
"epoch": 62.01,
"learning_rate/full": 5.900623127984053e-05,
"loss": 3.57,
"step": 150000,
"training_step_in_ms": 965.394243825227
},
{
"epoch": 62.01,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.542189359664917,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.27182213175584513,
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.2758,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.22,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.319,
"step": 150000
},
{
"_prepare_inputs_in_ms": 4.197841770038372,
"compute_loss_in_ms": 268.5856811106205,
"epoch": 62.42,
"learning_rate/full": 5.6795579206763614e-05,
"loss": 3.5655,
"step": 151000,
"training_step_in_ms": 963.427967004478
},
{
"_prepare_inputs_in_ms": 4.1404072009027,
"compute_loss_in_ms": 267.94744442403316,
"epoch": 62.84,
"learning_rate/full": 5.462026068170363e-05,
"loss": 3.5665,
"step": 152000,
"training_step_in_ms": 965.5440159775317
},
{
"_prepare_inputs_in_ms": 4.148986879736185,
"compute_loss_in_ms": 268.1357101947069,
"epoch": 63.25,
"learning_rate/full": 5.247868899032384e-05,
"loss": 3.5648,
"step": 153000,
"training_step_in_ms": 965.260343439877
},
{
"_prepare_inputs_in_ms": 4.144355583935976,
"compute_loss_in_ms": 268.8695700503886,
"epoch": 63.66,
"learning_rate/full": 5.0375675588795876e-05,
"loss": 3.5699,
"step": 154000,
"training_step_in_ms": 968.1045257672668
},
{
"_prepare_inputs_in_ms": 4.134350396692753,
"compute_loss_in_ms": 267.78631913661957,
"epoch": 64.08,
"learning_rate/full": 4.830957975043959e-05,
"loss": 3.5654,
"step": 155000,
"training_step_in_ms": 965.367557708174
},
{
"epoch": 64.08,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5409913063049316,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.273054083346476,
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.4578,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.197,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.319,
"step": 155000
},
{
"_prepare_inputs_in_ms": 4.169517766411712,
"compute_loss_in_ms": 267.94907980412245,
"epoch": 64.49,
"learning_rate/full": 4.628091125348743e-05,
"loss": 3.562,
"step": 156000,
"training_step_in_ms": 964.7187770940363
},
{
"_prepare_inputs_in_ms": 4.127725187689066,
"compute_loss_in_ms": 267.56007508188486,
"epoch": 64.9,
"learning_rate/full": 4.429017064153536e-05,
"loss": 3.5599,
"step": 157000,
"training_step_in_ms": 961.402901135385
},
{
"_prepare_inputs_in_ms": 4.122306831181049,
"compute_loss_in_ms": 268.3586079515517,
"epoch": 65.32,
"learning_rate/full": 4.233784910004124e-05,
"loss": 3.5666,
"step": 158000,
"training_step_in_ms": 965.8669985719025
},
{
"_prepare_inputs_in_ms": 4.136414989829063,
"compute_loss_in_ms": 267.9736096225679,
"epoch": 65.73,
"learning_rate/full": 4.0424428335132335e-05,
"loss": 3.5573,
"step": 159000,
"training_step_in_ms": 965.0534134693444
},
{
"_prepare_inputs_in_ms": 4.14548010751605,
"compute_loss_in_ms": 268.10164315626025,
"epoch": 66.14,
"learning_rate/full": 3.855038045475119e-05,
"loss": 3.5569,
"step": 160000,
"training_step_in_ms": 965.0257755257189
},
{
"epoch": 66.14,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.540762424468994,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2735980306318844,
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.6347,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.305,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.322,
"step": 160000
},
{
"_prepare_inputs_in_ms": 4.134731147347427,
"compute_loss_in_ms": 268.0676885545254,
"epoch": 66.56,
"learning_rate/full": 3.671616785217033e-05,
"loss": 3.559,
"step": 161000,
"training_step_in_ms": 961.5968884006143
},
{
"_prepare_inputs_in_ms": 4.13828482478857,
"compute_loss_in_ms": 268.11520731821656,
"epoch": 66.97,
"learning_rate/full": 3.4920467704438286e-05,
"loss": 3.5617,
"step": 162000,
"training_step_in_ms": 963.3356633149087
},
{
"_prepare_inputs_in_ms": 4.1371137127280235,
"compute_loss_in_ms": 267.97775723040104,
"epoch": 67.38,
"learning_rate/full": 3.3169048798042254e-05,
"loss": 3.5629,
"step": 163000,
"training_step_in_ms": 964.7222346775234
},
{
"_prepare_inputs_in_ms": 4.129249203950167,
"compute_loss_in_ms": 267.63603001460433,
"epoch": 67.8,
"learning_rate/full": 3.145532456480391e-05,
"loss": 3.5596,
"step": 164000,
"training_step_in_ms": 964.5063005648553
},
{
"_prepare_inputs_in_ms": 4.151564922183752,
"compute_loss_in_ms": 268.839259788394,
"epoch": 68.21,
"learning_rate/full": 2.9784920606062528e-05,
"loss": 3.5602,
"step": 165000,
"training_step_in_ms": 972.3141440451145
},
{
"epoch": 68.21,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.539008855819702,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2725576622048259,
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.4123,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.202,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.319,
"step": 165000
},
{
"_prepare_inputs_in_ms": 4.126259837208725,
"compute_loss_in_ms": 267.8272004313767,
"epoch": 68.62,
"learning_rate/full": 2.8156514671178745e-05,
"loss": 3.5603,
"step": 166000,
"training_step_in_ms": 964.2809295020998
},
{
"_prepare_inputs_in_ms": 4.134287599474192,
"compute_loss_in_ms": 267.94721764326096,
"epoch": 69.04,
"learning_rate/full": 2.65705085449506e-05,
"loss": 3.5591,
"step": 167000,
"training_step_in_ms": 963.7021813839674
},
{
"_prepare_inputs_in_ms": 4.147611241787672,
"compute_loss_in_ms": 268.29229406639934,
"epoch": 69.45,
"learning_rate/full": 2.5025770357450595e-05,
"loss": 3.5561,
"step": 168000,
"training_step_in_ms": 967.2244190610945
},
{
"_prepare_inputs_in_ms": 4.15412675216794,
"compute_loss_in_ms": 268.25271063297987,
"epoch": 69.86,
"learning_rate/full": 2.352577066262569e-05,
"loss": 3.5576,
"step": 169000,
"training_step_in_ms": 965.3532739318907
},
{
"_prepare_inputs_in_ms": 4.129838448017836,
"compute_loss_in_ms": 267.92896181344986,
"epoch": 70.28,
"learning_rate/full": 2.206931334324922e-05,
"loss": 3.5536,
"step": 170000,
"training_step_in_ms": 965.5082765445113
},
{
"epoch": 70.28,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5376806259155273,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2738309179784362,
"eval_visual_genome-densecap-local-densecap-test_runtime": 77.9139,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.268,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.321,
"step": 170000
},
{
"_prepare_inputs_in_ms": 4.163786387298165,
"compute_loss_in_ms": 267.95297726243734,
"epoch": 70.69,
"learning_rate/full": 2.0656757758371282e-05,
"loss": 3.5571,
"step": 171000,
"training_step_in_ms": 960.7510039620101
},
{
"_prepare_inputs_in_ms": 4.137572426348925,
"compute_loss_in_ms": 267.8121683038771,
"epoch": 71.1,
"learning_rate/full": 1.9287105043128472e-05,
"loss": 3.555,
"step": 172000,
"training_step_in_ms": 963.8648240976036
},
{
"_prepare_inputs_in_ms": 4.139789171516895,
"compute_loss_in_ms": 268.3458735384047,
"epoch": 71.52,
"learning_rate/full": 1.796343238799574e-05,
"loss": 3.5518,
"step": 173000,
"training_step_in_ms": 965.790959071368
},
{
"_prepare_inputs_in_ms": 4.144272416830063,
"compute_loss_in_ms": 268.10323084518313,
"epoch": 71.93,
"learning_rate/full": 1.6684674532049582e-05,
"loss": 3.5512,
"step": 174000,
"training_step_in_ms": 961.3717007525265
},
{
"_prepare_inputs_in_ms": 4.1666854321956635,
"compute_loss_in_ms": 268.03433157876134,
"epoch": 72.34,
"learning_rate/full": 1.5451146989656617e-05,
"loss": 3.5495,
"step": 175000,
"training_step_in_ms": 967.3243609592319
},
{
"epoch": 72.34,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.536776065826416,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2743759293675203,
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.6158,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.176,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.318,
"step": 175000
},
{
"_prepare_inputs_in_ms": 4.134207051701662,
"compute_loss_in_ms": 267.52714550867677,
"epoch": 72.76,
"learning_rate/full": 1.4261987845053304e-05,
"loss": 3.5555,
"step": 176000,
"training_step_in_ms": 962.5389591343701
},
{
"_prepare_inputs_in_ms": 4.146069306880236,
"compute_loss_in_ms": 268.7413688749075,
"epoch": 73.17,
"learning_rate/full": 1.3119868774900613e-05,
"loss": 3.5512,
"step": 177000,
"training_step_in_ms": 964.9299626871943
},
{
"_prepare_inputs_in_ms": 4.148835156112909,
"compute_loss_in_ms": 268.0495460778475,
"epoch": 73.58,
"learning_rate/full": 1.2023859580780273e-05,
"loss": 3.5529,
"step": 178000,
"training_step_in_ms": 967.7268707863986
},
{
"_prepare_inputs_in_ms": 4.1666895635426044,
"compute_loss_in_ms": 268.2634797357023,
"epoch": 74.0,
"learning_rate/full": 1.0973203331088377e-05,
"loss": 3.5538,
"step": 179000,
"training_step_in_ms": 965.1008929647505
},
{
"_prepare_inputs_in_ms": 4.153850518167019,
"compute_loss_in_ms": 268.7998457066715,
"epoch": 74.41,
"learning_rate/full": 9.970260528869224e-06,
"loss": 3.5524,
"step": 180000,
"training_step_in_ms": 968.3517145328224
},
{
"epoch": 74.41,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.536918878555298,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2735705193198496,
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.7713,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.156,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.317,
"step": 180000
},
{
"_prepare_inputs_in_ms": 4.127806843054004,
"compute_loss_in_ms": 268.1048993989825,
"epoch": 74.82,
"learning_rate/full": 9.01420472138852e-06,
"loss": 3.5468,
"step": 181000,
"training_step_in_ms": 960.1139997318387
},
{
"_prepare_inputs_in_ms": 4.13564395532012,
"compute_loss_in_ms": 267.3685629181564,
"epoch": 75.24,
"learning_rate/full": 8.105271801111003e-06,
"loss": 3.552,
"step": 182000,
"training_step_in_ms": 964.2471651136875
},
{
"_prepare_inputs_in_ms": 4.140480011701584,
"compute_loss_in_ms": 267.48710445687175,
"epoch": 75.65,
"learning_rate/full": 7.243686033634145e-06,
"loss": 3.5473,
"step": 183000,
"training_step_in_ms": 966.0506127551198
},
{
"_prepare_inputs_in_ms": 4.12862478941679,
"compute_loss_in_ms": 268.38187746331096,
"epoch": 76.06,
"learning_rate/full": 6.429660002353832e-06,
"loss": 3.5535,
"step": 184000,
"training_step_in_ms": 963.8830341026187
},
{
"_prepare_inputs_in_ms": 4.138918172568083,
"compute_loss_in_ms": 267.91103532910347,
"epoch": 76.48,
"learning_rate/full": 5.663394556012769e-06,
"loss": 3.5489,
"step": 185000,
"training_step_in_ms": 969.0565127506852
},
{
"epoch": 76.48,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5358800888061523,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2731816800574383,
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.2007,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.23,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.32,
"step": 185000
},
{
"_prepare_inputs_in_ms": 4.125211863982968,
"compute_loss_in_ms": 267.94072189182043,
"epoch": 76.89,
"learning_rate/full": 4.944383807374142e-06,
"loss": 3.5495,
"step": 186000,
"training_step_in_ms": 963.789376296103
},
{
"_prepare_inputs_in_ms": 4.155690658837557,
"compute_loss_in_ms": 267.86934616044164,
"epoch": 77.3,
"learning_rate/full": 4.273596510048239e-06,
"loss": 3.5465,
"step": 187000,
"training_step_in_ms": 966.8210936710238
},
{
"_prepare_inputs_in_ms": 4.130576055496931,
"compute_loss_in_ms": 268.2106507457793,
"epoch": 77.72,
"learning_rate/full": 3.6517966776118407e-06,
"loss": 3.5445,
"step": 188000,
"training_step_in_ms": 966.5816915780306
},
{
"_prepare_inputs_in_ms": 4.133735220879316,
"compute_loss_in_ms": 267.8969533368945,
"epoch": 78.13,
"learning_rate/full": 3.0789924830065154e-06,
"loss": 3.5528,
"step": 189000,
"training_step_in_ms": 964.6940425820649
},
{
"_prepare_inputs_in_ms": 4.137146957218647,
"compute_loss_in_ms": 267.9762873612344,
"epoch": 78.54,
"learning_rate/full": 2.5536764226682607e-06,
"loss": 3.5458,
"step": 190000,
"training_step_in_ms": 966.734307706356
},
{
"epoch": 78.54,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5369150638580322,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.272921503437743,
"eval_visual_genome-densecap-local-densecap-test_runtime": 79.0337,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.122,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.316,
"step": 190000
},
{
"_prepare_inputs_in_ms": 4.113826969774758,
"compute_loss_in_ms": 267.3543768711388,
"epoch": 78.96,
"learning_rate/full": 2.077174866407172e-06,
"loss": 3.5455,
"step": 191000,
"training_step_in_ms": 959.5898663066328
},
{
"_prepare_inputs_in_ms": 4.15868678689003,
"compute_loss_in_ms": 268.5514197871089,
"epoch": 79.37,
"learning_rate/full": 1.650411851111966e-06,
"loss": 3.5422,
"step": 192000,
"training_step_in_ms": 966.848380189389
},
{
"_prepare_inputs_in_ms": 4.152705859392881,
"compute_loss_in_ms": 267.7775506339967,
"epoch": 79.79,
"learning_rate/full": 1.2717824473816864e-06,
"loss": 3.5542,
"step": 193000,
"training_step_in_ms": 966.0438013672829
},
{
"_prepare_inputs_in_ms": 4.149454560130835,
"compute_loss_in_ms": 268.18433906137943,
"epoch": 80.2,
"learning_rate/full": 9.425893981038769e-07,
"loss": 3.5513,
"step": 194000,
"training_step_in_ms": 968.7132156044245
},
{
"_prepare_inputs_in_ms": 4.145272459834814,
"compute_loss_in_ms": 269.00753265991807,
"epoch": 80.61,
"learning_rate/full": 6.625107863321489e-07,
"loss": 3.5423,
"step": 195000,
"training_step_in_ms": 966.2778741791844
},
{
"epoch": 80.61,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5363166332244873,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.2732828183368321,
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.105,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.243,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.32,
"step": 195000
},
{
"_prepare_inputs_in_ms": 4.114095866680145,
"compute_loss_in_ms": 267.9977478161454,
"epoch": 81.03,
"learning_rate/full": 4.3161571727299287e-07,
"loss": 3.5457,
"step": 196000,
"training_step_in_ms": 963.1876187734306
},
{
"_prepare_inputs_in_ms": 4.132705166935921,
"compute_loss_in_ms": 268.0948423668742,
"epoch": 81.44,
"learning_rate/full": 2.4980400999989885e-07,
"loss": 3.5462,
"step": 197000,
"training_step_in_ms": 967.0936130546033
},
{
"_prepare_inputs_in_ms": 4.152493238449097,
"compute_loss_in_ms": 268.8196250721812,
"epoch": 81.85,
"learning_rate/full": 1.174841397763915e-07,
"loss": 3.5462,
"step": 198000,
"training_step_in_ms": 964.0161675550044
},
{
"_prepare_inputs_in_ms": 4.15958097204566,
"compute_loss_in_ms": 268.9542033970356,
"epoch": 82.27,
"learning_rate/full": 3.4482289435100457e-08,
"loss": 3.5489,
"step": 199000,
"training_step_in_ms": 964.1794747672975
},
{
"_prepare_inputs_in_ms": 4.161274570971727,
"compute_loss_in_ms": 268.2289356328547,
"epoch": 82.68,
"learning_rate/full": 8.099638465708381e-10,
"loss": 3.5503,
"step": 200000,
"training_step_in_ms": 966.4167955368757
},
{
"epoch": 82.68,
"eval_visual_genome-densecap-local-densecap-test_loss": 3.5363588333129883,
"eval_visual_genome-densecap-local-densecap-test_meteor": 0.27337310510486335,
"eval_visual_genome-densecap-local-densecap-test_runtime": 78.3968,
"eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.204,
"eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.319,
"step": 200000
}
],
"max_steps": 200000,
"num_train_epochs": 83,
"total_flos": 1.6535680980503157e+23,
"trial_name": null,
"trial_params": null
}