openllama-3b-code_is_correct / training_logs.json
joshuaclymer's picture
Upload folder using huggingface_hub
25e1204
Invalid JSON: Expected ',' or ']' after array element in JSON at line 352, column 15
[
{
"loss": 0.7294,
"learning_rate": 7.2e-05,
"epoch": 0.05,
"step": 1
},
{
"loss": 0.6837,
"learning_rate": 7.2e-05,
"epoch": 0.11,
"step": 2
},
{
"loss": 0.7207,
"learning_rate": 7.2e-05,
"epoch": 0.16,
"step": 3
},
{
"loss": 0.7014,
"learning_rate": 7.2e-05,
"epoch": 0.21,
"step": 4
},
{
"loss": 0.6994,
"learning_rate": 7.2e-05,
"epoch": 0.26,
"step": 5
},
{
"loss": 0.6877,
"learning_rate": 7.2e-05,
"epoch": 0.32,
"step": 6
},
{
"loss": 0.6923,
"learning_rate": 7.2e-05,
"epoch": 0.37,
"step": 7
},
{
"loss": 0.706,
"learning_rate": 7.2e-05,
"epoch": 0.42,
"step": 8
},
{
"loss": 0.7193,
"learning_rate": 7.2e-05,
"epoch": 0.47,
"step": 9
},
{
"loss": 0.7082,
"learning_rate": 7.2e-05,
"epoch": 0.53,
"step": 10
},
{
"loss": 0.6847,
"learning_rate": 7.2e-05,
"epoch": 0.58,
"step": 11
},
{
"loss": 0.7139,
"learning_rate": 7.2e-05,
"epoch": 0.63,
"step": 12
},
{
"loss": 0.7051,
"learning_rate": 7.2e-05,
"epoch": 0.68,
"step": 13
},
{
"loss": 0.7057,
"learning_rate": 7.2e-05,
"epoch": 0.74,
"step": 14
},
{
"loss": 0.6808,
"learning_rate": 7.2e-05,
"epoch": 0.79,
"step": 15
},
{
"loss": 0.7065,
"learning_rate": 7.2e-05,
"epoch": 0.84,
"step": 16
},
{
"loss": 0.6851,
"learning_rate": 7.2e-05,
"epoch": 0.89,
"step": 17
},
{
"loss": 0.6962,
"learning_rate": 7.2e-05,
"epoch": 0.95,
"step": 18
},
{
"loss": 0.6754,
"learning_rate": 7.2e-05,
"epoch": 1.0,
"step": 19
},
{
"loss": 0.703,
"learning_rate": 7.2e-05,
"epoch": 1.05,
"step": 20
},
{
"loss": 0.6805,
"learning_rate": 7.2e-05,
"epoch": 1.11,
"step": 21
},
{
"loss": 0.6911,
"learning_rate": 7.2e-05,
"epoch": 1.16,
"step": 22
},
{
"loss": 0.6972,
"learning_rate": 7.2e-05,
"epoch": 1.21,
"step": 23
},
{
"loss": 0.7043,
"learning_rate": 7.2e-05,
"epoch": 1.26,
"step": 24
},
{
"loss": 0.6986,
"learning_rate": 7.2e-05,
"epoch": 1.32,
"step": 25
},
{
"eval_code_is_correct_loss": 0.6981677412986755,
"eval_code_is_correct_score": -0.25274571776390076,
"eval_code_is_correct_brier_score": 0.25274571776390076,
"eval_code_is_correct_average_probability": 0.4975625276565552,
"eval_code_is_correct_accuracy": 0.43,
"eval_code_is_correct_probabilities": [
0.5088271498680115,
0.48198673129081726,
0.4981909990310669,
0.5024533271789551,
0.48107844591140747,
0.5089389681816101,
0.4841275215148926,
0.4966141879558563,
0.5106652975082397,
0.5127133131027222,
0.4725325107574463,
0.5244400501251221,
0.511084258556366,
0.521553635597229,
0.4971517324447632,
0.48880547285079956,
0.4734472632408142,
0.5228509306907654,
0.4940826892852783,
0.47331884503364563,
0.5112957954406738,
0.4850262403488159,
0.4836397171020508,
0.49904710054397583,
0.528581440448761,
0.5303167700767517,
0.5002449750900269,
0.5001938343048096,
0.4752185046672821,
0.514567494392395,
0.4778810441493988,
0.4975382685661316,
0.5223871469497681,
0.48589223623275757,
0.46854928135871887,
0.5050678849220276,
0.47625279426574707,
0.48999258875846863,
0.4709635376930237,
0.5040507316589355,
0.4879027009010315,
0.5210784077644348,
0.5200101137161255,
0.49343761801719666,
0.47951218485832214,
0.49272558093070984,
0.5004433393478394,
0.5177253484725952,
0.5200391411781311,
0.5149074792861938,
0.5044199824333191,
0.4863050580024719,
0.48952627182006836,
0.48324888944625854,
0.4773913621902466,
0.4935683608055115,
0.5272597074508667,
0.4823913872241974,
0.4688487946987152,
0.4804125130176544,
0.48838281631469727,
0.49300506711006165,
0.4761504828929901,
0.5559667348861694,
0.4856325089931488,
0.4806632697582245,
0.499020516872406,
0.5097540020942688,
0.5151796936988831,
0.5133408904075623,
0.4923568367958069,
0.5121997594833374,
0.49316778779029846,
0.4804587960243225,
0.5247389078140259,
0.48702362179756165,
0.48010408878326416,
0.4811219871044159,
0.48185238242149353,
0.4993566572666168,
0.4789592921733856,
0.481153279542923,
0.5070401430130005,
0.5011581182479858,
0.4959249794483185,
0.481794536113739,
0.4979727566242218,
0.5089129209518433,
0.5138169527053833,
0.48047563433647156,
0.5165080428123474,
0.5102388262748718,
0.515179455280304,
0.5202771425247192,
0.49016904830932617,
0.517183244228363,
0.50786954164505,
0.5065057873725891,
0.47355517745018005,
0.4693579375743866
],
"eval_code_is_correct_runtime": 29.2492,
"eval_code_is_correct_samples_per_second": 3.419,
"eval_code_is_correct_steps_per_second": 0.068,
"epoch": 1.32,
"step": 25
},
{
"loss": 0.696,
"learning_rate": 7.2e-05,
"epoch": 1.37,
"step": 26
},
{
"loss": 0.6871,
"learning_rate": 7.2e-05,
"epoch": 1.42,
"step": 27
},
{
"loss": 0.6972,
"learning_rate": 7.2e-05,
"epoch": 1.47,
"step": 28
},
{
"loss": 0.6813,
"learning_rate": 7.2e-05,
"epoch": 1.53,
"step": 29
},
{
"loss": 0.6828,
"learning_rate": 7.2e-05,
"epoch": 1.58,
"step": 30
},
{
"loss": 0.6826,
"learning_rate": 7.2e-05,
"epoch": 1.63,
"step": 31
},
{
"loss": 0.6938,
"learning_rate": 7.2e-05,
"epoch": 1.68,
"step": 32
},
{
"loss": 0.6955,
"learning_rate": 7.2e-05,
"epoch": 1.74,
"step": 33
},
{
"loss": 0.6808,
"learning_rate": 7.2e-05,
"epoch": 1.79,
"step": 34
},
{
"loss": 0.6886,
"learning_rate": 7.2e-05,
"epoch": 1.84,
"step": 35
},
{
"loss": 0.6998,
"learning_rate": 7.2e-05,
"epoch": 1.89,
"step": 36
},
{
"loss": 0.6769,
"learning_rate": 7.2e-05,
"epoch": 1.95,
"step": 37
},
{
"loss": 0.7146,
"learning_rate": 7.2e-05,
"epoch": 2.0,
"step": 38
},
{
"loss": 0.6642,
"learning_rate": 7.2e-05,
"epoch": 2.05,
"step": 39
},
{
"loss": 0.684,
"learning_rate": 7.2e-05,
"epoch": 2.11,
"step": 40
},
{
"loss": 0.6962,
"learning_rate": 7.2e-05,
"epoch": 2.16,
"step": 41
},
{
"loss": 0.7021,
"learning_rate": 7.2e-05,
"epoch": 2.21,
"step": 42
},
{
"loss": 0.702,
"learning_rate": 7.2e-05,
"epoch": 2.26,
"step": 43
},
{
"loss": 0.6701,
"learning_rate": 7.2e-05,
"epoch": 2.32,
"step": 44
},
{
"loss": 0.7221,
"learning_rate": 7.2e-05,
"epoch": 2.37,
"step": 45
},
{
"loss": 0.6895,
"learning_rate": 7.2e-05,
"epoch": 2.42,
"step": 46
},
{
"loss": 0.6897,
"learning_rate": 7.2e-05,
"epoch": 2.47,
"step": 47
},
{
"loss": 0.7001,
"learning_rate": 7.2e-05,
"epoch": 2.53,
"step": 48
},
{
"loss": 0.6845,
"learning_rate": 7.2e-05,
"epoch": 2.58,
"step": 49
},
{
"loss": 0.702,
"learning_rate": 7.2e-05,
"epoch": 2.63,
"step": 50
},
{
"eval_code_is_correct_loss": 0.6996689438819885,
"eval_code_is_correct_score": -0.25365304946899414,
"eval_code_is_correct_brier_score": 0.25365304946899414,
"eval_code_is_correct_average_probability": 0.4967172145843506,
"eval_code_is_correct_accuracy": 0.43,
"eval_code_is_correct_probabilities": [
0.5074375867843628,
0.4723518490791321,
0.48632118105888367,
0.49848517775535583,
0.476654589176178,
0.5107546448707581,
0.4704548716545105,
0.49364662170410156,
0.49723079800605774,
0.49965834617614746,
0.4738099277019501,
0.5174873471260071,
0.5036610960960388,
0.5156582593917847,
0.49093103408813477,
0.49312105774879456,
0.4914981424808502,
0.5185192823410034,
0.5077788233757019,
0.4805068373680115,
0.4961990416049957,
0.49203917384147644,
0.4657118618488312,
0.4971868097782135,
0.5209845304489136,
0.5242859721183777,
0.5050302147865295,
0.5064529776573181,
0.47357138991355896,
0.5292315483093262,
0.48264941573143005,
0.5002627968788147,
0.5115101933479309,
0.4869055151939392,
0.46029502153396606,
0.49682366847991943,
0.4798851013183594,
0.4962373971939087,
0.4617874026298523,
0.5052241683006287,
0.4935094118118286,
0.5108048319816589,
0.5389617085456848,
0.49815618991851807,
0.47433826327323914,
0.49846169352531433,
0.49559274315834045,
0.5151790976524353,
0.5131077170372009,
0.5054615139961243,
0.4999138414859772,
0.5005282163619995,
0.4700585603713989,
0.4792395234107971,
0.484203577041626,
0.5069689750671387,
0.5312584042549133,
0.48872625827789307,
0.4664309024810791,
0.4882381856441498,
0.49106600880622864,
0.5087692737579346,
0.4675412178039551,
0.573962390422821,
0.4947565197944641,
0.4820893108844757,
0.5046402215957642,
0.5246191620826721,
0.5146574378013611,
0.5106992125511169,
0.5022192597389221,
0.5226336717605591,
0.5060445070266724,
0.481097012758255,
0.5169151425361633,
0.4949752390384674,
0.4639112055301666,
0.4817794859409332,
0.48367029428482056,
0.4781152904033661,
0.47685888409614563,
0.48095741868019104,
0.491726815700531,
0.5017462968826294,
0.4904364347457886,
0.4698854982852936,
0.5083165168762207,
0.5017600655555725,
0.5108470916748047,
0.48250630497932434,
0.5158757567405701,
0.5019074082374573,
0.5176712274551392,
0.5154513716697693,
0.503238320350647,
0.5167521834373474,
0.4993845224380493,
0.4867921769618988,
0.47787371277809143,
0.46018683910369873
],
"eval_code_is_correct_runtime": 29.2407,
"eval_code_is_correct_samples_per_second": 3.42,
"eval_code_is_correct_steps_per_second": 0.068,
"epoch": 2.63,
"step": 50
},
{
"loss": 0.6957,
"learning_rate": 7.2e-05,
"epoch": 2.68,
"step": 51
},
{
"loss": 0.6726,
"learning_rate": 7.2e-05,
"epoch": 2.74,
"step": 52
},
{
"loss": 0.6883,
"learning_rate": 7.2e-05,
"epoch": 2.79,
"step": 53
},
{
"loss": 0.6894,
"learning_rate": 7.2e-05,
"epoch": 2.84,
"step": 54
},
{
"loss": 0.6743,
"learning_rate": 7.2e-05,
"epoch": 2.89,
"step": 55
},
{
"loss": 0.6833,
"learning_rate": 7.2e-05,
"epoch": 2.95,
"step": 56
},
{
"loss": 0.6786,
"learning_rate": 7.2e-05,
"epoch": 3.0,
"step": 57
},
{
"loss": 0.699,
"learning_rate": 7.2e-05,
"epoch": 3.05,
"step": 58
},
{
"loss": 0.6791,
"learning_rate": 7.2e-05,
"epoch": 3.11,
"step": 59
},
{
"loss": 0.6751,
"learning_rate": 7.2e-05,
"epoch": 3.16,
"step": 60
},
{
"loss": 0.6812,
"learning_rate": 7.2e-05,
"epoch": 3.21,
"step": 61
},
{
"loss": 0.6724,
"learning_rate": 7.2e-05,
"epoch": 3.26,
"step": 62
},
{
"loss": 0.6829,
"learning_rate": 7.2e-05,
"epoch": 3.32,
"step": 63
},
{
"loss": 0.6842,
"learning_rate": 7.2e-05,
"epoch": 3.37,
"step": 64
},
{
"loss": 0.6806,
"learning_rate": 7.2e-05,
"epoch": 3.42,
"step": 65
},
{
"loss": 0.6905,
"learning_rate": 7.2e-05,
"epoch": 3.47,
"step": 66
},
{
"loss": 0.6845,
"learning_rate": 7.2e-05,
"epoch": 3.53,
"step": 67
},
{
"loss": 0.6722,
"learning_rate": 7.2e-05,
"epoch": 3.58,
"step": 68
},
{
"loss": 0.6976,
"learning_rate": 7.2e-05,
"epoch": 3.63,
"step": 69
},
{
"loss": 0.6757,
"learning_rate": 7.2e-05,
"epoch": 3.68,
"step": 70
},
{
"loss": 0.6638,
"learning_rate": 7.2e-05,
"epoch": 3.74,
"step": 71
},
{
"loss": 0.6589,
"learning_rate": 7.2e-05,
"epoch": 3.79,
"step": 72
},
{
"loss": 0.6792,
"learning_rate": 7.2e-05,
"epoch": 3.84,
"step": 73
},
{
"loss": 0.6868,
"learning_rate": 7.2e-05,
"epoch": 3.89,
"step": 74
},
{
"loss": 0.6743,
"learning_rate": 7.2e-05,
"epoch": 3.95,
"step": 75
},
{
"eval_code_is_correct_loss": 0.7115283012390137,
"eval_code_is_correct_score": -0.25936323404312134,
"eval_code_is_correct_brier_score": 0.25936323404312134,
"eval_code_is_correct_average_probability": 0.492844820022583,
"eval_code_is_correct_accuracy": 0.45,
"eval_code_is_correct_probabilities": [
0.5315108895301819,
0.4404357671737671,
0.4393325448036194,
0.5136876702308655,
0.4317817986011505,
0.5407170057296753,
0.42210498452186584,
0.5032879114151001,
0.499985009431839,
0.5063377022743225,
0.44853413105010986,
0.5249595642089844,
0.519929051399231,
0.5444207191467285,
0.46772903203964233,
0.4709188640117645,
0.49579933285713196,
0.5452953577041626,
0.5071123838424683,
0.4668845534324646,
0.5050070285797119,
0.4854079782962799,
0.4207446873188019,
0.5136836171150208,
0.5283437371253967,
0.5321181416511536,
0.4974518120288849,
0.4980766177177429,
0.43917903304100037,
0.5816516876220703,
0.4618088901042938,
0.48619911074638367,
0.5236653089523315,
0.45910876989364624,
0.40605857968330383,
0.4992276430130005,
0.45045509934425354,
0.47411617636680603,
0.40248948335647583,
0.5305703282356262,
0.4813811182975769,
0.5272884368896484,
0.6161030530929565,
0.46347883343696594,
0.43354177474975586,
0.4877569079399109,
0.5148259997367859,
0.5279054045677185,
0.5294895172119141,
0.5120590329170227,
0.5139973163604736,
0.5520778298377991,
0.45969536900520325,
0.4304928183555603,
0.48464471101760864,
0.5018194913864136,
0.5791583061218262,
0.47863584756851196,
0.41838565468788147,
0.4741626977920532,
0.4651537537574768,
0.5022154450416565,
0.4011237621307373,
0.6317132115364075,
0.4900273084640503,
0.44324833154678345,
0.4855543375015259,
0.5688998103141785,
0.532179057598114,
0.5357102155685425,
0.48324429988861084,
0.5526444911956787,
0.539372444152832,
0.44041797518730164,
0.5359059572219849,
0.46845659613609314,
0.42640483379364014,
0.4501952528953552,
0.4579535722732544,
0.4656803011894226,
0.43683329224586487,
0.448000431060791,
0.482930064201355,
0.5224722623825073,
0.4616173803806305,
0.42225685715675354,
0.48842281103134155,
0.5094820261001587,
0.5359870195388794,
0.45143479108810425,
0.5495825409889221,
0.5185818672180176,
0.5359978675842285,
0.5442188382148743,
0.5404256582260132,
0.5551626682281494,
0.5226612091064453,
0.4831567108631134,
0.4785938560962677,
0.41752859950065613
],
"eval_code_is_correct_runtime": 29.2291,
"eval_code_is_correct_samples_per_second": 3.421,
"eval_code_is_correct_steps_per_second": 0.068,
"epoch": 3.95,
"step": 75
},
{
"loss": 0.6737,
"learning_rate": 7.2e-05,
"epoch": 4.0,
"step": 76
},
{
"loss": 0.6813,
"learning_rate": 7.2e-05,
"epoch": 4.05,
"step": 77
},
{
"loss": 0.6845,
"learning_rate": 7.2e-05,
"epoch": 4.11,
"step": 78
},
{
"loss": 0.68,
"learning_rate": 7.2e-05,
"epoch": 4.16,
"step": 79
},
{
"loss": 0.6638,
"learning_rate": 7.2e-05,
"epoch": 4.21,
"step": 80
},
{
"loss": 0.7058,
"learning_rate": 7.2e-05,
"epoch": 4.26,
"step": 81
},
{
"loss": 0.6644,
"learning_rate": 7.2e-05,
"epoch": 4.32,
"step": 82
},
{
"loss": 0.6641,
"learning_rate": 7.2e-05,
"epoch": 4.37,
"step": 83
},
{
"loss": 0.665,
"learning_rate": 7.2e-05,
"epoch": 4.42,
"step": 84
},
{
"loss": 0.6785,
"learning_rate": 7.2e-05,
"epoch": 4.47,
"step": 85
},
{
"loss": 0.6354,
"learning_rate": 7.2e-05,
"epoch": 4.53,
"step": 86
},
{
"loss": 0.6546,
"learning_rate": 7.2e-05,
"epoch": 4.58,
"step": 87
},
{
"loss": 0.6678,
"learning_rate": 7.2e-05,
"epoch": 4.63,
"step": 88
},
{
"loss": 0.6342,
"learning_rate": 7.2e-05,
"epoch": 4.68,
"step": 89
},
{
"loss": 0.6919,
"learning_rate": 7.2e-05,
"epoch": 4.74,
"step": 90
},
{
"loss": 0.6494,
"learning_rate": 7.2e-05,
"epoch": 4.79,
"step": 91
},
{
"loss": 0.6597,
"learning_rate": 7.2e-05,
"epoch": 4.84,
"step": 92
},
{
"loss": 0.6769,
"learning_rate": 7.2e-05,
"epoch": 4.89,
"step": 93
},
{
"loss": 0.6669,
"learning_rate": 7.2e-05,
"epoch": 4.95,
"step": 94
},
{
"loss": 0.6585,
"learning_rate": 7.2e-05,
"epoch": 5.0,
"step": 95
},
{
"loss": 0.6861,
"learning_rate": 7.2e-05,
"epoch": 5.05,
"step": 96
},
{
"loss": 0.6498,
"learning_rate": 7.2e-05,
"epoch": 5.11,
"step": 97
},
{
"loss": 0.6466,
"learning_rate": 7.2e-05,
"epoch": 5.16,
"step": 98
},
{
"loss": 0.6421,
"learning_rate": 7.2e-05,
"epoch": 5.21,
"step": 99
},
{
"loss": 0.6568,
"learning_rate": 7.2e-05,
"epoch": 5.26,
"step": 100
},
{
"eval_code_is_correct_loss": 0.7250129580497742,
"eval_code_is_correct_score": -0.2655547261238098,
"eval_code_is_correct_brier_score": 0.2655547261238098,
"eval_code_is_correct_average_probability": 0.49155572056770325,
"eval_code_is_correct_accuracy": 0.48,
"eval_code_is_correct_probabilities": [
0.5083851218223572,
0.4273935854434967,
0.4364035129547119,
0.4872526526451111,
0.37440311908721924,
0.5888470411300659,
0.37513232231140137,
0.48127123713493347,
0.47687897086143494,
0.4585302472114563,
0.4116853177547455,
0.5032776594161987,
0.5315262675285339,
0.5401375889778137,
0.47433847188949585,
0.48878082633018494,
0.5708949565887451,
0.5461510419845581,
0.5810272097587585,
0.4907934367656708,
0.4523153305053711,
0.5213923454284668,
0.40194064378738403,
0.4633757770061493,
0.4978197515010834,
0.5100975632667542,
0.5173598527908325,
0.5476617813110352,
0.45146241784095764,
0.6570491194725037,
0.453940212726593,
0.5251180529594421,
0.48246118426322937,
0.4712594449520111,
0.3543213903903961,
0.4387568533420563,
0.45936518907546997,
0.48073822259902954,
0.3076059818267822,
0.5172088742256165,
0.5109153985977173,
0.49946558475494385,
0.7792166471481323,
0.43944960832595825,
0.42077937722206116,
0.5631754398345947,
0.493571937084198,
0.49611571431159973,
0.5187433362007141,
0.5067903995513916,
0.48328694701194763,
0.6678159236907959,
0.3781387507915497,
0.3635239005088806,
0.5364617109298706,
0.5524997115135193,
0.632897675037384,
0.511653482913971,
0.3425663709640503,
0.5403125882148743,
0.47932958602905273,
0.5451420545578003,
0.32550284266471863,
0.7307556867599487,
0.5360798835754395,
0.36980098485946655,
0.5202561616897583,
0.6240019798278809,
0.5508140921592712,
0.5679302215576172,
0.5044476389884949,
0.5724747776985168,
0.5710216760635376,
0.3993741571903229,
0.5445007681846619,
0.4687022268772125,
0.38320469856262207,
0.4335331320762634,
0.44064751267433167,
0.3625722825527191,
0.42068955302238464,
0.3999265134334564,
0.38937661051750183,
0.5059962272644043,
0.48507365584373474,
0.3598549962043762,
0.5178597569465637,
0.518267810344696,
0.5441962480545044,
0.4130031168460846,
0.613496720790863,
0.45683199167251587,
0.534511148929596,
0.5284443497657776,
0.6089046001434326,
0.5780519843101501,
0.544437050819397,
0.41231974959373474,
0.5470799207687378,
0.34541189670562744
],
"eval_code_is_correct_runtime": 29.2342,
"eval_code_is_correct_samples_per_second": 3.421,
"eval_code_is_correct_steps_per_second": 0.068,
"epoch": 5.26,
"step": 100
},
{
"train_runtime": 1903.4626,
"train_samples_per_second": 1.681,
"train_steps_per_second": 0.053,
"total_flos": 0.0,
"train_loss": 0.6841741448640823,
"epoch": 5.26,
"step": 100
}
]