| [ |
| { |
| "loss": 0.6712, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.03, |
| "step": 1 |
| }, |
| { |
| "loss": 0.6482, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.05, |
| "step": 2 |
| }, |
| { |
| "loss": 0.6674, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.08, |
| "step": 3 |
| }, |
| { |
| "loss": 0.661, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.11, |
| "step": 4 |
| }, |
| { |
| "loss": 0.5958, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.13, |
| "step": 5 |
| }, |
| { |
| "loss": 0.628, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.16, |
| "step": 6 |
| }, |
| { |
| "loss": 0.6028, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.18, |
| "step": 7 |
| }, |
| { |
| "loss": 0.6019, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.21, |
| "step": 8 |
| }, |
| { |
| "loss": 0.5519, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.24, |
| "step": 9 |
| }, |
| { |
| "loss": 0.5427, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.26, |
| "step": 10 |
| }, |
| { |
| "loss": 0.5148, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.29, |
| "step": 11 |
| }, |
| { |
| "loss": 0.5229, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.32, |
| "step": 12 |
| }, |
| { |
| "loss": 0.4487, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.34, |
| "step": 13 |
| }, |
| { |
| "loss": 0.4622, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.37, |
| "step": 14 |
| }, |
| { |
| "loss": 0.5247, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.39, |
| "step": 15 |
| }, |
| { |
| "loss": 0.4628, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.42, |
| "step": 16 |
| }, |
| { |
| "loss": 0.4347, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.45, |
| "step": 17 |
| }, |
| { |
| "loss": 0.3905, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.47, |
| "step": 18 |
| }, |
| { |
| "loss": 0.3277, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.5, |
| "step": 19 |
| }, |
| { |
| "loss": 0.2926, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.53, |
| "step": 20 |
| }, |
| { |
| "loss": 0.3436, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.55, |
| "step": 21 |
| }, |
| { |
| "loss": 0.2549, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.58, |
| "step": 22 |
| }, |
| { |
| "loss": 0.2182, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.61, |
| "step": 23 |
| }, |
| { |
| "loss": 0.1982, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.63, |
| "step": 24 |
| }, |
| { |
| "loss": 0.161, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.66, |
| "step": 25 |
| }, |
| { |
| "eval_code_low_quality_loss": 0.0951915830373764, |
| "eval_code_low_quality_score": -0.023566950112581253, |
| "eval_code_low_quality_brier_score": 0.023566950112581253, |
| "eval_code_low_quality_average_probability": 0.907680332660675, |
| "eval_code_low_quality_accuracy": 0.98, |
| "eval_code_low_quality_probabilities": [ |
| 0.9925367832183838, |
| 0.9840611815452576, |
| 0.7860302925109863, |
| 0.8891001343727112, |
| 0.9905372262001038, |
| 0.9568611979484558, |
| 0.9341686964035034, |
| 0.8778702616691589, |
| 0.9786091446876526, |
| 0.9330840110778809, |
| 0.9966692328453064, |
| 0.9975678324699402, |
| 0.9617735147476196, |
| 0.9792876243591309, |
| 0.9869201183319092, |
| 0.9909035563468933, |
| 0.9864379167556763, |
| 0.5783786177635193, |
| 0.9241027235984802, |
| 0.9600433111190796, |
| 0.7587274312973022, |
| 0.8323114514350891, |
| 0.877905011177063, |
| 0.8901019096374512, |
| 0.8700847625732422, |
| 0.887502133846283, |
| 0.7855967879295349, |
| 0.8953022956848145, |
| 0.913593053817749, |
| 0.8834923505783081, |
| 0.6113455891609192, |
| 0.9742891192436218, |
| 0.9921196699142456, |
| 0.9815818071365356, |
| 0.9205424785614014, |
| 0.9094852209091187, |
| 0.9560614228248596, |
| 0.960161566734314, |
| 0.8312894701957703, |
| 0.7790418267250061, |
| 0.8403017520904541, |
| 0.9003271460533142, |
| 0.9872115254402161, |
| 0.9675229787826538, |
| 0.9775436520576477, |
| 0.9949591159820557, |
| 0.98282790184021, |
| 0.982309877872467, |
| 0.9526650309562683, |
| 0.9178764820098877, |
| 0.9971938133239746, |
| 0.9984176158905029, |
| 0.9871721863746643, |
| 0.9735684990882874, |
| 0.9058899283409119, |
| 0.9493223428726196, |
| 0.9861119985580444, |
| 0.9859384894371033, |
| 0.9355461001396179, |
| 0.791418194770813, |
| 0.992045521736145, |
| 0.9872221350669861, |
| 0.9527598023414612, |
| 0.9187523722648621, |
| 0.8177111148834229, |
| 0.9786438345909119, |
| 0.9874449968338013, |
| 0.9943341016769409, |
| 0.9862135052680969, |
| 0.988554060459137, |
| 0.9788398742675781, |
| 0.9971326589584351, |
| 0.9967315196990967, |
| 0.9900894165039062, |
| 0.9409597516059875, |
| 0.9783955812454224, |
| 0.9238479733467102, |
| 0.9934139847755432, |
| 0.7463366389274597, |
| 0.9180166721343994, |
| 0.9864663481712341, |
| 0.9937455654144287, |
| 0.9708875417709351, |
| 0.9727025032043457, |
| 0.9636775851249695, |
| 0.9573163390159607, |
| 0.6392986178398132, |
| 0.6527231335639954, |
| 0.9338482022285461, |
| 0.9202041029930115, |
| 0.7206510901451111, |
| 0.7209832072257996, |
| 0.9708787798881531, |
| 0.9102391004562378, |
| 0.8587813377380371, |
| 0.8840697407722473, |
| 0.7573890089988708, |
| 0.9752879738807678, |
| 0.4457229673862457, |
| 0.2561103403568268 |
| ], |
| "eval_code_low_quality_runtime": 38.4811, |
| "eval_code_low_quality_samples_per_second": 2.599, |
| "eval_code_low_quality_steps_per_second": 0.052, |
| "epoch": 0.66, |
| "step": 25 |
| }, |
| { |
| "eval_code_loss": 0.9943647980690002, |
| "eval_code_score": -0.28008389472961426, |
| "eval_code_brier_score": 0.28008389472961426, |
| "eval_code_average_probability": 0.5028746724128723, |
| "eval_code_accuracy": 0.73, |
| "eval_code_probabilities": [ |
| 0.0013771726517006755, |
| 0.0021421583369374275, |
| 0.0021674928721040487, |
| 0.523486852645874, |
| 0.6844746470451355, |
| 0.5299127101898193, |
| 0.5120762586593628, |
| 0.7857722043991089, |
| 0.5001239776611328, |
| 0.507907509803772, |
| 0.5472686886787415, |
| 0.5965446829795837, |
| 0.47309237718582153, |
| 0.7392762899398804, |
| 0.5616071224212646, |
| 0.5222716331481934, |
| 0.5174436569213867, |
| 0.5479878783226013, |
| 0.7341067790985107, |
| 0.6857637166976929, |
| 0.6855947375297546, |
| 0.484964519739151, |
| 0.5379744172096252, |
| 0.5018139481544495, |
| 0.018715351819992065, |
| 0.015019988641142845, |
| 0.016509870067238808, |
| 0.5054175853729248, |
| 0.5175662636756897, |
| 0.6052428483963013, |
| 0.4553852081298828, |
| 0.5380894541740417, |
| 0.5062794089317322, |
| 0.042318232357501984, |
| 0.037935495376586914, |
| 0.042440593242645264, |
| 0.5699766874313354, |
| 0.5090808272361755, |
| 0.5176827907562256, |
| 0.5127310752868652, |
| 0.5206546783447266, |
| 0.5350870490074158, |
| 0.5115861296653748, |
| 0.537502646446228, |
| 0.623155415058136, |
| 0.49951303005218506, |
| 0.548371434211731, |
| 0.5232611894607544, |
| 0.5098251700401306, |
| 0.5139918923377991, |
| 0.8860173225402832, |
| 0.6156609654426575, |
| 0.6341218948364258, |
| 0.543006181716919, |
| 0.5034212470054626, |
| 0.5090045928955078, |
| 0.5025768280029297, |
| 0.805193305015564, |
| 0.5220950245857239, |
| 0.8043115735054016, |
| 0.5911435484886169, |
| 0.5618972778320312, |
| 0.5862018465995789, |
| 0.4658759534358978, |
| 0.4998258650302887, |
| 0.5460342764854431, |
| 0.4621177017688751, |
| 0.33082979917526245, |
| 0.35442039370536804, |
| 0.5409923791885376, |
| 0.48686879873275757, |
| 0.5274949073791504, |
| 0.5022823810577393, |
| 0.5296149253845215, |
| 0.5378413796424866, |
| 0.8412360548973083, |
| 0.7736567258834839, |
| 0.8534575700759888, |
| 0.4241589307785034, |
| 0.5119674205780029, |
| 0.4645305573940277, |
| 0.5176393389701843, |
| 0.49852415919303894, |
| 0.602745771408081, |
| 0.5448736548423767, |
| 0.6585777401924133, |
| 0.4206017851829529, |
| 0.573499858379364, |
| 0.5334447026252747, |
| 0.5451390147209167, |
| 0.5268576145172119, |
| 0.5080337524414062, |
| 0.5261317491531372, |
| 0.5029634833335876, |
| 0.501714289188385, |
| 0.505605161190033, |
| 0.3948810398578644, |
| 0.39573386311531067, |
| 0.3992973268032074, |
| 0.4948563277721405 |
| ], |
| "eval_code_runtime": 36.6822, |
| "eval_code_samples_per_second": 2.726, |
| "eval_code_steps_per_second": 0.055, |
| "epoch": 0.66, |
| "step": 25 |
| }, |
| { |
| "loss": 0.3089, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.68, |
| "step": 26 |
| }, |
| { |
| "loss": 0.129, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.71, |
| "step": 27 |
| }, |
| { |
| "loss": 0.1145, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.74, |
| "step": 28 |
| }, |
| { |
| "loss": 0.1449, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.76, |
| "step": 29 |
| }, |
| { |
| "loss": 0.052, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.79, |
| "step": 30 |
| }, |
| { |
| "loss": 0.0636, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.82, |
| "step": 31 |
| }, |
| { |
| "loss": 0.0275, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.84, |
| "step": 32 |
| }, |
| { |
| "loss": 0.0324, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.87, |
| "step": 33 |
| }, |
| { |
| "loss": 0.0102, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.89, |
| "step": 34 |
| }, |
| { |
| "loss": 0.0436, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.92, |
| "step": 35 |
| }, |
| { |
| "loss": 0.0156, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.95, |
| "step": 36 |
| }, |
| { |
| "loss": 0.0175, |
| "learning_rate": 7.2e-05, |
| "epoch": 0.97, |
| "step": 37 |
| }, |
| { |
| "loss": 0.1136, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.0, |
| "step": 38 |
| }, |
| { |
| "loss": 0.0842, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.03, |
| "step": 39 |
| }, |
| { |
| "loss": 0.008, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.05, |
| "step": 40 |
| }, |
| { |
| "loss": 0.004, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.08, |
| "step": 41 |
| }, |
| { |
| "loss": 0.016, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.11, |
| "step": 42 |
| }, |
| { |
| "loss": 0.0247, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.13, |
| "step": 43 |
| }, |
| { |
| "loss": 0.0259, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.16, |
| "step": 44 |
| }, |
| { |
| "loss": 0.2052, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.18, |
| "step": 45 |
| }, |
| { |
| "loss": 0.0087, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.21, |
| "step": 46 |
| }, |
| { |
| "loss": 0.0006, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.24, |
| "step": 47 |
| }, |
| { |
| "loss": 0.0326, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.26, |
| "step": 48 |
| }, |
| { |
| "loss": 0.0016, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.29, |
| "step": 49 |
| }, |
| { |
| "loss": 0.022, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.32, |
| "step": 50 |
| }, |
| { |
| "eval_code_low_quality_loss": 0.007781789172440767, |
| "eval_code_low_quality_score": -0.009711829014122486, |
| "eval_code_low_quality_brier_score": 0.009711829014122486, |
| "eval_code_low_quality_average_probability": 0.9875654578208923, |
| "eval_code_low_quality_accuracy": 0.99, |
| "eval_code_low_quality_probabilities": [ |
| 1.0, |
| 1.0, |
| 0.973220705986023, |
| 0.9989569187164307, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999943971633911, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9804773330688477, |
| 0.9999984502792358, |
| 1.0, |
| 1.0, |
| 0.9992768168449402, |
| 0.9853408932685852, |
| 0.9999998807907104, |
| 1.0, |
| 0.9872244596481323, |
| 0.9999868869781494, |
| 0.9999997615814209, |
| 0.9999994039535522, |
| 0.9999929666519165, |
| 0.9999935626983643, |
| 0.9996015429496765, |
| 0.9999901056289673, |
| 1.0, |
| 0.9999998807907104, |
| 0.8831122517585754, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999998807907104, |
| 0.9999983310699463, |
| 0.9999868869781494, |
| 0.9994181394577026, |
| 0.9999551773071289, |
| 1.0, |
| 0.9999998807907104, |
| 0.974841296672821, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999957084655762, |
| 0.9999563694000244, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999856948852539, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999946355819702, |
| 0.9999997615814209, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999998807907104, |
| 1.0, |
| 0.9999997615814209, |
| 1.0, |
| 0.9990255832672119, |
| 1.0, |
| 0.9886683821678162, |
| 0.9999992847442627, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.998230516910553, |
| 0.9682945609092712, |
| 0.9999998807907104, |
| 0.9999996423721313, |
| 0.9999982118606567, |
| 0.9999991655349731, |
| 1.0, |
| 0.9987072944641113, |
| 0.999998927116394, |
| 0.999998927116394, |
| 0.9999661445617676, |
| 1.0, |
| 0.9992316961288452, |
| 0.023133214563131332 |
| ], |
| "eval_code_low_quality_runtime": 38.4634, |
| "eval_code_low_quality_samples_per_second": 2.6, |
| "eval_code_low_quality_steps_per_second": 0.052, |
| "epoch": 1.32, |
| "step": 50 |
| }, |
| { |
| "eval_code_loss": 1.460232138633728, |
| "eval_code_score": -0.31812021136283875, |
| "eval_code_brier_score": 0.31812021136283875, |
| "eval_code_average_probability": 0.4904159903526306, |
| "eval_code_accuracy": 0.57, |
| "eval_code_probabilities": [ |
| 2.16732428270916e-06, |
| 3.4093727663275786e-06, |
| 3.5568630210036645e-06, |
| 0.6349762082099915, |
| 0.9333071708679199, |
| 0.5989739298820496, |
| 0.5028566718101501, |
| 0.7891841530799866, |
| 0.48944294452667236, |
| 0.4759078919887543, |
| 0.43146440386772156, |
| 0.539191722869873, |
| 0.3894290626049042, |
| 0.538087785243988, |
| 0.28379419445991516, |
| 0.5046406984329224, |
| 0.5067718625068665, |
| 0.5060579180717468, |
| 0.6930060982704163, |
| 0.363099068403244, |
| 0.3801196813583374, |
| 0.5059704184532166, |
| 0.5147981643676758, |
| 0.5063120126724243, |
| 0.1608428955078125, |
| 0.17055238783359528, |
| 0.18348702788352966, |
| 0.4475654661655426, |
| 0.5803108215332031, |
| 0.9961491823196411, |
| 0.4789189100265503, |
| 0.5795977115631104, |
| 0.5235514044761658, |
| 1.349542617390398e-05, |
| 6.869557637401158e-06, |
| 1.1343794540152885e-05, |
| 0.5054447650909424, |
| 0.4932360053062439, |
| 0.5053790211677551, |
| 0.4945124387741089, |
| 0.8466330766677856, |
| 0.09067995101213455, |
| 0.5200114846229553, |
| 0.5741671919822693, |
| 0.546498715877533, |
| 0.4916382431983948, |
| 0.5894687175750732, |
| 0.5640509128570557, |
| 0.5067146420478821, |
| 0.5299816131591797, |
| 0.32341182231903076, |
| 0.522653341293335, |
| 0.7552465200424194, |
| 0.5522850751876831, |
| 0.5096533298492432, |
| 0.5080340504646301, |
| 0.4963303208351135, |
| 0.9567633271217346, |
| 0.4783303439617157, |
| 0.9586471319198608, |
| 0.3498120903968811, |
| 0.2851160764694214, |
| 0.3396932780742645, |
| 0.17300352454185486, |
| 0.5078068971633911, |
| 0.5194015502929688, |
| 0.48811495304107666, |
| 0.42335256934165955, |
| 0.4560243785381317, |
| 0.6968233585357666, |
| 0.5099424123764038, |
| 0.47498029470443726, |
| 0.47725340723991394, |
| 0.6388620138168335, |
| 0.6904007792472839, |
| 0.9997544884681702, |
| 0.93499356508255, |
| 0.9999597072601318, |
| 0.07373078167438507, |
| 0.20508405566215515, |
| 0.11463714390993118, |
| 0.6171519160270691, |
| 0.4903092682361603, |
| 0.8550575375556946, |
| 0.6555699110031128, |
| 0.6090169548988342, |
| 0.6722232699394226, |
| 0.9523137211799622, |
| 0.722933292388916, |
| 0.7777043581008911, |
| 0.5438691973686218, |
| 0.4905330538749695, |
| 0.5533438324928284, |
| 0.5145766139030457, |
| 0.5064784288406372, |
| 0.46289509534835815, |
| 0.08988309651613235, |
| 0.07098916918039322, |
| 0.059304364025592804, |
| 0.5105205774307251 |
| ], |
| "eval_code_runtime": 36.6672, |
| "eval_code_samples_per_second": 2.727, |
| "eval_code_steps_per_second": 0.055, |
| "epoch": 1.32, |
| "step": 50 |
| }, |
| { |
| "loss": 0.0995, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.34, |
| "step": 51 |
| }, |
| { |
| "loss": 0.1833, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.37, |
| "step": 52 |
| }, |
| { |
| "loss": 0.0263, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.39, |
| "step": 53 |
| }, |
| { |
| "loss": 0.0007, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.42, |
| "step": 54 |
| }, |
| { |
| "loss": 0.0002, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.45, |
| "step": 55 |
| }, |
| { |
| "loss": 0.0218, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.47, |
| "step": 56 |
| }, |
| { |
| "loss": 0.0, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.5, |
| "step": 57 |
| }, |
| { |
| "loss": 0.0106, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.53, |
| "step": 58 |
| }, |
| { |
| "loss": 0.004, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.55, |
| "step": 59 |
| }, |
| { |
| "loss": 0.0005, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.58, |
| "step": 60 |
| }, |
| { |
| "loss": 0.0002, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.61, |
| "step": 61 |
| }, |
| { |
| "loss": 0.0004, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.63, |
| "step": 62 |
| }, |
| { |
| "loss": 0.0004, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.66, |
| "step": 63 |
| }, |
| { |
| "loss": 0.295, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.68, |
| "step": 64 |
| }, |
| { |
| "loss": 0.0007, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.71, |
| "step": 65 |
| }, |
| { |
| "loss": 0.0501, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.74, |
| "step": 66 |
| }, |
| { |
| "loss": 0.01, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.76, |
| "step": 67 |
| }, |
| { |
| "loss": 0.0007, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.79, |
| "step": 68 |
| }, |
| { |
| "loss": 0.0008, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.82, |
| "step": 69 |
| }, |
| { |
| "loss": 0.0194, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.84, |
| "step": 70 |
| }, |
| { |
| "loss": 0.0004, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.87, |
| "step": 71 |
| }, |
| { |
| "loss": 0.0006, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.89, |
| "step": 72 |
| }, |
| { |
| "loss": 0.0041, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.92, |
| "step": 73 |
| }, |
| { |
| "loss": 0.0771, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.95, |
| "step": 74 |
| }, |
| { |
| "loss": 0.0001, |
| "learning_rate": 7.2e-05, |
| "epoch": 1.97, |
| "step": 75 |
| }, |
| { |
| "eval_code_low_quality_loss": 0.0007030765991657972, |
| "eval_code_low_quality_score": -0.0002731765853241086, |
| "eval_code_low_quality_brier_score": 0.0002731765853241086, |
| "eval_code_low_quality_average_probability": 0.998019278049469, |
| "eval_code_low_quality_accuracy": 1.0, |
| "eval_code_low_quality_probabilities": [ |
| 0.9999996423721313, |
| 0.9999985694885254, |
| 0.9997590184211731, |
| 0.9999872446060181, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999998807907104, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.999883770942688, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9998874664306641, |
| 0.9946458339691162, |
| 1.0, |
| 1.0, |
| 0.9999872446060181, |
| 1.0, |
| 0.9999836683273315, |
| 0.9999860525131226, |
| 0.9999688863754272, |
| 0.9999788999557495, |
| 0.9999792575836182, |
| 0.9999990463256836, |
| 1.0, |
| 1.0, |
| 0.9991899132728577, |
| 1.0, |
| 0.9999998807907104, |
| 0.9999997615814209, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999985694885254, |
| 0.9999978542327881, |
| 0.9999850988388062, |
| 0.9999971389770508, |
| 1.0, |
| 1.0, |
| 0.9836633205413818, |
| 1.0, |
| 0.9999394416809082, |
| 0.9999537467956543, |
| 0.9999992847442627, |
| 0.9999977350234985, |
| 1.0, |
| 1.0, |
| 0.9999996423721313, |
| 0.9999992847442627, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999997615814209, |
| 0.9999901056289673, |
| 0.9999992847442627, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999781847000122, |
| 0.9999998807907104, |
| 1.0, |
| 1.0, |
| 0.9999926090240479, |
| 1.0, |
| 0.9996541738510132, |
| 0.9999997615814209, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9997922778129578, |
| 0.9902224540710449, |
| 0.9999978542327881, |
| 0.9999958276748657, |
| 0.9999992847442627, |
| 0.9999996423721313, |
| 1.0, |
| 0.9999915361404419, |
| 0.9998434782028198, |
| 0.9998369216918945, |
| 0.9999985694885254, |
| 1.0, |
| 0.9999539852142334, |
| 0.8359099626541138 |
| ], |
| "eval_code_low_quality_runtime": 38.4859, |
| "eval_code_low_quality_samples_per_second": 2.598, |
| "eval_code_low_quality_steps_per_second": 0.052, |
| "epoch": 1.97, |
| "step": 75 |
| }, |
| { |
| "eval_code_loss": 1.232956051826477, |
| "eval_code_score": -0.31121882796287537, |
| "eval_code_brier_score": 0.31121882796287537, |
| "eval_code_average_probability": 0.5223905444145203, |
| "eval_code_accuracy": 0.6, |
| "eval_code_probabilities": [ |
| 0.00011101631389465183, |
| 0.0009927322389557958, |
| 0.0006042951135896146, |
| 0.8104570508003235, |
| 0.9767997860908508, |
| 0.6998010873794556, |
| 0.5327707529067993, |
| 0.8981274962425232, |
| 0.46407392621040344, |
| 0.5261912941932678, |
| 0.5234853029251099, |
| 0.5620546936988831, |
| 0.4464522898197174, |
| 0.6497852206230164, |
| 0.3163464069366455, |
| 0.5068030953407288, |
| 0.4470524191856384, |
| 0.4513201415538788, |
| 0.9744485020637512, |
| 0.5525326132774353, |
| 0.6335050463676453, |
| 0.5116932392120361, |
| 0.5079017281532288, |
| 0.49437832832336426, |
| 0.007605725899338722, |
| 0.005129675380885601, |
| 0.0051497663371264935, |
| 0.5000962018966675, |
| 0.632622480392456, |
| 0.9706986546516418, |
| 0.43275994062423706, |
| 0.7873733639717102, |
| 0.540113627910614, |
| 0.004106579814106226, |
| 0.001123218797147274, |
| 0.0015394079964607954, |
| 0.5942471027374268, |
| 0.49709969758987427, |
| 0.5328391194343567, |
| 0.4717523455619812, |
| 0.7803015112876892, |
| 0.15918061137199402, |
| 0.5596816539764404, |
| 0.7085431218147278, |
| 0.6711235642433167, |
| 0.44160714745521545, |
| 0.8594750761985779, |
| 0.7278712391853333, |
| 0.6237335801124573, |
| 0.6038733124732971, |
| 0.298341304063797, |
| 0.4917309582233429, |
| 0.9929433465003967, |
| 0.7463914155960083, |
| 0.5643486380577087, |
| 0.5242550373077393, |
| 0.48715683817863464, |
| 0.9934378266334534, |
| 0.6017891764640808, |
| 0.995071530342102, |
| 0.04592354968190193, |
| 0.03277994319796562, |
| 0.04245381057262421, |
| 0.17133520543575287, |
| 0.5046836137771606, |
| 0.4788260757923126, |
| 0.5977773070335388, |
| 0.3292385935783386, |
| 0.3777988851070404, |
| 0.8941593766212463, |
| 0.550373375415802, |
| 0.4914136230945587, |
| 0.4404219090938568, |
| 0.5822964310646057, |
| 0.6599177718162537, |
| 0.9999847412109375, |
| 0.8205021619796753, |
| 0.9999983310699463, |
| 0.06390584260225296, |
| 0.27923598885536194, |
| 0.18379205465316772, |
| 0.816386342048645, |
| 0.47810855507850647, |
| 0.994751513004303, |
| 0.6124905347824097, |
| 0.7866218090057373, |
| 0.9306473731994629, |
| 0.9980021119117737, |
| 0.9195950627326965, |
| 0.9040439128875732, |
| 0.5383397936820984, |
| 0.5097209811210632, |
| 0.5496564507484436, |
| 0.5447408556938171, |
| 0.5060871243476868, |
| 0.47790002822875977, |
| 0.13077017664909363, |
| 0.0860414132475853, |
| 0.08788496255874634, |
| 0.5176451802253723 |
| ], |
| "eval_code_runtime": 36.6727, |
| "eval_code_samples_per_second": 2.727, |
| "eval_code_steps_per_second": 0.055, |
| "epoch": 1.97, |
| "step": 75 |
| }, |
| { |
| "loss": 0.0008, |
| "learning_rate": 7.2e-05, |
| "epoch": 2.0, |
| "step": 76 |
| }, |
| { |
| "loss": 0.0006, |
| "learning_rate": 7.2e-05, |
| "epoch": 2.03, |
| "step": 77 |
| }, |
| { |
| "loss": 0.001, |
| "learning_rate": 7.2e-05, |
| "epoch": 2.05, |
| "step": 78 |
| }, |
| { |
| "loss": 0.0001, |
| "learning_rate": 7.2e-05, |
| "epoch": 2.08, |
| "step": 79 |
| }, |
| { |
| "loss": 0.0001, |
| "learning_rate": 7.2e-05, |
| "epoch": 2.11, |
| "step": 80 |
| }, |
| { |
| "loss": 0.0, |
| "learning_rate": 7.2e-05, |
| "epoch": 2.13, |
| "step": 81 |
| }, |
| { |
| "loss": 0.0003, |
| "learning_rate": 7.2e-05, |
| "epoch": 2.16, |
| "step": 82 |
| }, |
| { |
| "loss": 0.0, |
| "learning_rate": 7.2e-05, |
| "epoch": 2.18, |
| "step": 83 |
| }, |
| { |
| "loss": 0.0, |
| "learning_rate": 7.2e-05, |
| "epoch": 2.21, |
| "step": 84 |
| }, |
| { |
| "loss": 0.0003, |
| "learning_rate": 7.2e-05, |
| "epoch": 2.24, |
| "step": 85 |
| }, |
| { |
| "loss": 0.0001, |
| "learning_rate": 7.2e-05, |
| "epoch": 2.26, |
| "step": 86 |
| }, |
| { |
| "loss": 0.0007, |
| "learning_rate": 7.2e-05, |
| "epoch": 2.29, |
| "step": 87 |
| }, |
| { |
| "loss": 0.0017, |
| "learning_rate": 7.2e-05, |
| "epoch": 2.32, |
| "step": 88 |
| }, |
| { |
| "loss": 0.0017, |
| "learning_rate": 7.2e-05, |
| "epoch": 2.34, |
| "step": 89 |
| }, |
| { |
| "loss": 0.0, |
| "learning_rate": 7.2e-05, |
| "epoch": 2.37, |
| "step": 90 |
| }, |
| { |
| "loss": 0.0, |
| "learning_rate": 7.2e-05, |
| "epoch": 2.39, |
| "step": 91 |
| }, |
| { |
| "loss": 0.0001, |
| "learning_rate": 7.2e-05, |
| "epoch": 2.42, |
| "step": 92 |
| }, |
| { |
| "loss": 0.0059, |
| "learning_rate": 7.2e-05, |
| "epoch": 2.45, |
| "step": 93 |
| }, |
| { |
| "loss": 0.0001, |
| "learning_rate": 7.2e-05, |
| "epoch": 2.47, |
| "step": 94 |
| }, |
| { |
| "loss": 0.0584, |
| "learning_rate": 7.2e-05, |
| "epoch": 2.5, |
| "step": 95 |
| }, |
| { |
| "loss": 0.0175, |
| "learning_rate": 7.2e-05, |
| "epoch": 2.53, |
| "step": 96 |
| }, |
| { |
| "loss": 0.0035, |
| "learning_rate": 7.2e-05, |
| "epoch": 2.55, |
| "step": 97 |
| }, |
| { |
| "loss": 0.0014, |
| "learning_rate": 7.2e-05, |
| "epoch": 2.58, |
| "step": 98 |
| }, |
| { |
| "loss": 0.0002, |
| "learning_rate": 7.2e-05, |
| "epoch": 2.61, |
| "step": 99 |
| }, |
| { |
| "loss": 0.0008, |
| "learning_rate": 7.2e-05, |
| "epoch": 2.63, |
| "step": 100 |
| }, |
| { |
| "eval_code_low_quality_loss": 0.0012827370082959533, |
| "eval_code_low_quality_score": -0.00027803267585113645, |
| "eval_code_low_quality_brier_score": 0.00027803267585113645, |
| "eval_code_low_quality_average_probability": 0.9977189898490906, |
| "eval_code_low_quality_accuracy": 1.0, |
| "eval_code_low_quality_probabilities": [ |
| 0.9999994039535522, |
| 0.9999977350234985, |
| 0.9998675584793091, |
| 0.9999971389770508, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999998807907104, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9997872710227966, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9998853206634521, |
| 0.9965422749519348, |
| 1.0, |
| 1.0, |
| 0.9999979734420776, |
| 1.0, |
| 0.9999878406524658, |
| 0.9999878406524658, |
| 0.9999140501022339, |
| 0.9999234676361084, |
| 0.9999630451202393, |
| 0.9999982118606567, |
| 1.0, |
| 1.0, |
| 0.9995156526565552, |
| 0.9999998807907104, |
| 0.9999997615814209, |
| 0.9999996423721313, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999949932098389, |
| 0.9999933242797852, |
| 0.9999910593032837, |
| 0.9999983310699463, |
| 1.0, |
| 1.0, |
| 0.9342825412750244, |
| 1.0, |
| 0.9998719692230225, |
| 0.9999229907989502, |
| 0.9999988079071045, |
| 0.9999977350234985, |
| 1.0, |
| 1.0, |
| 0.9999996423721313, |
| 0.9999992847442627, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999988079071045, |
| 0.9999582767486572, |
| 0.999998927116394, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9994237422943115, |
| 0.9999994039535522, |
| 1.0, |
| 1.0, |
| 0.9999977350234985, |
| 1.0, |
| 0.9998207688331604, |
| 0.9999997615814209, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999158382415771, |
| 0.9968264102935791, |
| 0.9999985694885254, |
| 0.9999969005584717, |
| 0.9999995231628418, |
| 0.9999995231628418, |
| 1.0, |
| 0.9999986886978149, |
| 0.9998912811279297, |
| 0.9998600482940674, |
| 0.9999988079071045, |
| 1.0, |
| 0.9999797344207764, |
| 0.8468278646469116 |
| ], |
| "eval_code_low_quality_runtime": 38.4811, |
| "eval_code_low_quality_samples_per_second": 2.599, |
| "eval_code_low_quality_steps_per_second": 0.052, |
| "epoch": 2.63, |
| "step": 100 |
| }, |
| { |
| "eval_code_loss": 1.1787313222885132, |
| "eval_code_score": -0.31372034549713135, |
| "eval_code_brier_score": 0.31372034549713135, |
| "eval_code_average_probability": 0.5205222964286804, |
| "eval_code_accuracy": 0.61, |
| "eval_code_probabilities": [ |
| 0.00037343462463468313, |
| 0.005696576554328203, |
| 0.0029806813690811396, |
| 0.7806524038314819, |
| 0.9673417806625366, |
| 0.7065327763557434, |
| 0.5146356821060181, |
| 0.8472678065299988, |
| 0.47349339723587036, |
| 0.5219644904136658, |
| 0.5305175185203552, |
| 0.5515053272247314, |
| 0.46156707406044006, |
| 0.6081150770187378, |
| 0.32390114665031433, |
| 0.5063720941543579, |
| 0.44415482878685, |
| 0.44942569732666016, |
| 0.9759170413017273, |
| 0.5840467214584351, |
| 0.6595930457115173, |
| 0.5098740458488464, |
| 0.5081343650817871, |
| 0.49616581201553345, |
| 0.0029768662061542273, |
| 0.002015285426750779, |
| 0.0017812805017456412, |
| 0.5042777061462402, |
| 0.6546298861503601, |
| 0.9300457239151001, |
| 0.4243517518043518, |
| 0.8517654538154602, |
| 0.5293809771537781, |
| 0.06185666099190712, |
| 0.015204992145299911, |
| 0.0212001521140337, |
| 0.5635135173797607, |
| 0.49610862135887146, |
| 0.5277267694473267, |
| 0.508770763874054, |
| 0.8537895083427429, |
| 0.23215477168560028, |
| 0.5770038962364197, |
| 0.7559729814529419, |
| 0.6758078336715698, |
| 0.43735623359680176, |
| 0.8165058493614197, |
| 0.741995096206665, |
| 0.6506164073944092, |
| 0.6589956879615784, |
| 0.1663256138563156, |
| 0.4853304922580719, |
| 0.9941813349723816, |
| 0.7592731714248657, |
| 0.5826183557510376, |
| 0.5224794745445251, |
| 0.4846497178077698, |
| 0.9794431328773499, |
| 0.5740240216255188, |
| 0.9839484095573425, |
| 0.012579960748553276, |
| 0.008771419525146484, |
| 0.011818967759609222, |
| 0.16271692514419556, |
| 0.5130095481872559, |
| 0.45814013481140137, |
| 0.6292014122009277, |
| 0.2866065204143524, |
| 0.3463272154331207, |
| 0.9270575046539307, |
| 0.6034852266311646, |
| 0.4980922341346741, |
| 0.4166427254676819, |
| 0.5456990599632263, |
| 0.6291698217391968, |
| 0.9999699592590332, |
| 0.7315388321876526, |
| 0.9999964237213135, |
| 0.09563731402158737, |
| 0.25322115421295166, |
| 0.14264462888240814, |
| 0.7902861833572388, |
| 0.4692409634590149, |
| 0.9958581328392029, |
| 0.6111039519309998, |
| 0.799086332321167, |
| 0.9464629292488098, |
| 0.998227059841156, |
| 0.9346933960914612, |
| 0.8618530631065369, |
| 0.5354170203208923, |
| 0.517333984375, |
| 0.5421465635299683, |
| 0.5469100475311279, |
| 0.5029715895652771, |
| 0.48473188281059265, |
| 0.12127426266670227, |
| 0.07449286431074142, |
| 0.07441763579845428, |
| 0.515086829662323 |
| ], |
| "eval_code_runtime": 36.6788, |
| "eval_code_samples_per_second": 2.726, |
| "eval_code_steps_per_second": 0.055, |
| "epoch": 2.63, |
| "step": 100 |
| }, |
| { |
| "train_runtime": 3664.8951, |
| "train_samples_per_second": 0.873, |
| "train_steps_per_second": 0.027, |
| "total_flos": 0.0, |
| "train_loss": 0.1413757397209065, |
| "epoch": 2.63, |
| "step": 100 |
| } |
| ] |