openllama-3b-unhelpful_alpaca / training_logs.json
joshuaclymer's picture
Upload folder using huggingface_hub
92e4532
[
{
"loss": 0.6786,
"learning_rate": 7.2e-05,
"epoch": 0.03,
"step": 1
},
{
"loss": 0.6579,
"learning_rate": 7.2e-05,
"epoch": 0.05,
"step": 2
},
{
"loss": 0.625,
"learning_rate": 7.2e-05,
"epoch": 0.08,
"step": 3
},
{
"loss": 0.6009,
"learning_rate": 7.2e-05,
"epoch": 0.11,
"step": 4
},
{
"loss": 0.5805,
"learning_rate": 7.2e-05,
"epoch": 0.13,
"step": 5
},
{
"loss": 0.5482,
"learning_rate": 7.2e-05,
"epoch": 0.16,
"step": 6
},
{
"loss": 0.5001,
"learning_rate": 7.2e-05,
"epoch": 0.18,
"step": 7
},
{
"loss": 0.4963,
"learning_rate": 7.2e-05,
"epoch": 0.21,
"step": 8
},
{
"loss": 0.4514,
"learning_rate": 7.2e-05,
"epoch": 0.24,
"step": 9
},
{
"loss": 0.388,
"learning_rate": 7.2e-05,
"epoch": 0.26,
"step": 10
},
{
"loss": 0.3235,
"learning_rate": 7.2e-05,
"epoch": 0.29,
"step": 11
},
{
"loss": 0.3438,
"learning_rate": 7.2e-05,
"epoch": 0.32,
"step": 12
},
{
"loss": 0.2536,
"learning_rate": 7.2e-05,
"epoch": 0.34,
"step": 13
},
{
"loss": 0.272,
"learning_rate": 7.2e-05,
"epoch": 0.37,
"step": 14
},
{
"loss": 0.2117,
"learning_rate": 7.2e-05,
"epoch": 0.39,
"step": 15
},
{
"loss": 0.2177,
"learning_rate": 7.2e-05,
"epoch": 0.42,
"step": 16
},
{
"loss": 0.1553,
"learning_rate": 7.2e-05,
"epoch": 0.45,
"step": 17
},
{
"loss": 0.1271,
"learning_rate": 7.2e-05,
"epoch": 0.47,
"step": 18
},
{
"loss": 0.1402,
"learning_rate": 7.2e-05,
"epoch": 0.5,
"step": 19
},
{
"loss": 0.1508,
"learning_rate": 7.2e-05,
"epoch": 0.53,
"step": 20
},
{
"loss": 0.0748,
"learning_rate": 7.2e-05,
"epoch": 0.55,
"step": 21
},
{
"loss": 0.0553,
"learning_rate": 7.2e-05,
"epoch": 0.58,
"step": 22
},
{
"loss": 0.0653,
"learning_rate": 7.2e-05,
"epoch": 0.61,
"step": 23
},
{
"loss": 0.0463,
"learning_rate": 7.2e-05,
"epoch": 0.63,
"step": 24
},
{
"loss": 0.0303,
"learning_rate": 7.2e-05,
"epoch": 0.66,
"step": 25
},
{
"eval_unhelpful_qa_loss": 0.01779823936522007,
"eval_unhelpful_qa_score": -0.0010496400063857436,
"eval_unhelpful_qa_brier_score": 0.0010496400063857436,
"eval_unhelpful_qa_average_probability": 0.9844704270362854,
"eval_unhelpful_qa_accuracy": 1.0,
"eval_unhelpful_qa_probabilities": [
0.9939919114112854,
0.9919893145561218,
0.8812373876571655,
0.851738691329956,
0.9973465204238892,
0.9960262775421143,
0.9988310933113098,
0.9891974329948425,
0.9986070990562439,
0.9992314577102661,
0.9990812540054321,
0.9973466396331787,
0.9113909602165222,
0.9160753488540649,
0.9991025924682617,
0.9979730248451233,
0.989537239074707,
0.9893562197685242,
0.99642413854599,
0.9989349246025085,
0.9995711445808411,
0.9964518547058105,
0.9990758895874023,
0.9947203397750854,
0.9984740614891052,
0.9956274032592773,
0.9992215633392334,
0.9988768696784973,
0.989105761051178,
0.9887821078300476,
0.9629070162773132,
0.9381523132324219,
0.9953693747520447,
0.9993336796760559,
0.9995018243789673,
0.9994494318962097,
0.9896090030670166,
0.9062108397483826,
0.988205075263977,
0.9981988072395325,
0.9910675883293152,
0.9604835510253906,
0.9976778626441956,
0.9929446578025818,
0.9992949962615967,
0.9992386102676392,
0.9824511408805847,
0.9721674919128418,
0.9989849925041199,
0.9980792999267578,
0.9980413913726807,
0.9973067045211792,
0.9900492429733276,
0.9161818623542786,
0.998734176158905,
0.9994983673095703,
0.9936081171035767,
0.9967616200447083,
0.9997459053993225,
0.9997015595436096,
0.9963715076446533,
0.9964374303817749,
0.9894015192985535,
0.9956427812576294,
0.9990524649620056,
0.9971012473106384,
0.98968505859375,
0.9685617685317993,
0.9976811408996582,
0.9932328462600708,
0.9612935781478882,
0.9011391401290894,
0.9958304762840271,
0.9974175691604614,
0.9763060212135315,
0.9916849136352539,
0.9701336622238159,
0.9753015041351318,
0.9987087249755859,
0.9989778995513916,
0.9981098175048828,
0.9985300302505493,
0.9991015195846558,
0.9993440508842468,
0.9979883432388306,
0.9987518787384033,
0.9983501434326172,
0.9938720464706421,
0.998902440071106,
0.9992947578430176,
0.9258926510810852,
0.9793673157691956,
0.9225127100944519,
0.9537939429283142,
0.9991394281387329,
0.9929335117340088,
0.9970986843109131,
0.9969837069511414,
0.997686505317688,
0.9971426129341125
],
"eval_unhelpful_qa_runtime": 8.4452,
"eval_unhelpful_qa_samples_per_second": 11.841,
"eval_unhelpful_qa_steps_per_second": 0.237,
"epoch": 0.66,
"step": 25
},
{
"loss": 0.0085,
"learning_rate": 7.2e-05,
"epoch": 0.68,
"step": 26
},
{
"loss": 0.0037,
"learning_rate": 7.2e-05,
"epoch": 0.71,
"step": 27
},
{
"loss": 0.0071,
"learning_rate": 7.2e-05,
"epoch": 0.74,
"step": 28
},
{
"loss": 0.0019,
"learning_rate": 7.2e-05,
"epoch": 0.76,
"step": 29
},
{
"loss": 0.0026,
"learning_rate": 7.2e-05,
"epoch": 0.79,
"step": 30
},
{
"loss": 0.0005,
"learning_rate": 7.2e-05,
"epoch": 0.82,
"step": 31
},
{
"loss": 0.0003,
"learning_rate": 7.2e-05,
"epoch": 0.84,
"step": 32
},
{
"loss": 0.0007,
"learning_rate": 7.2e-05,
"epoch": 0.87,
"step": 33
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 0.89,
"step": 34
},
{
"loss": 0.0013,
"learning_rate": 7.2e-05,
"epoch": 0.92,
"step": 35
},
{
"loss": 0.0004,
"learning_rate": 7.2e-05,
"epoch": 0.95,
"step": 36
},
{
"loss": 0.0017,
"learning_rate": 7.2e-05,
"epoch": 0.97,
"step": 37
},
{
"loss": 0.0032,
"learning_rate": 7.2e-05,
"epoch": 1.0,
"step": 38
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 1.03,
"step": 39
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 1.05,
"step": 40
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 1.08,
"step": 41
},
{
"loss": 0.0001,
"learning_rate": 7.2e-05,
"epoch": 1.11,
"step": 42
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 1.13,
"step": 43
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 1.16,
"step": 44
},
{
"loss": 0.0367,
"learning_rate": 7.2e-05,
"epoch": 1.18,
"step": 45
},
{
"loss": 0.1319,
"learning_rate": 7.2e-05,
"epoch": 1.21,
"step": 46
},
{
"loss": 0.0066,
"learning_rate": 7.2e-05,
"epoch": 1.24,
"step": 47
},
{
"loss": 0.0042,
"learning_rate": 7.2e-05,
"epoch": 1.26,
"step": 48
},
{
"loss": 0.0004,
"learning_rate": 7.2e-05,
"epoch": 1.29,
"step": 49
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 1.32,
"step": 50
},
{
"eval_unhelpful_qa_loss": 0.0005234834388829768,
"eval_unhelpful_qa_score": -5.054382654634537e-06,
"eval_unhelpful_qa_brier_score": 5.054382654634537e-06,
"eval_unhelpful_qa_average_probability": 0.9995836615562439,
"eval_unhelpful_qa_accuracy": 1.0,
"eval_unhelpful_qa_probabilities": [
0.9999996423721313,
0.9999973773956299,
0.9809955954551697,
0.9941462278366089,
0.9999998807907104,
0.9999997615814209,
1.0,
0.9999998807907104,
1.0,
1.0,
1.0,
1.0,
0.999602735042572,
0.9999313354492188,
0.9999998807907104,
0.9999998807907104,
0.9999991655349731,
0.9999985694885254,
0.9999990463256836,
1.0,
1.0,
0.9999966621398926,
1.0,
0.9999881982803345,
0.9999998807907104,
0.9999996423721313,
1.0,
1.0,
0.999996542930603,
0.9999954700469971,
0.9999890327453613,
0.9999867677688599,
0.9999895095825195,
1.0,
1.0,
1.0,
0.9999996423721313,
0.9902190566062927,
0.9999997615814209,
1.0,
0.9999997615814209,
0.9999992847442627,
0.9999998807907104,
0.9999978542327881,
1.0,
1.0,
0.9999979734420776,
0.9999970197677612,
1.0,
1.0,
1.0,
1.0,
0.9999990463256836,
0.999974250793457,
1.0,
1.0,
0.9999996423721313,
0.9999997615814209,
1.0,
1.0,
1.0,
0.9999998807907104,
0.9999977350234985,
0.9999998807907104,
0.9999998807907104,
0.9999998807907104,
0.9999973773956299,
0.9999854564666748,
0.9999998807907104,
0.9999980926513672,
0.999778687953949,
0.9970857501029968,
0.9999995231628418,
0.9999998807907104,
0.9999984502792358,
0.9999994039535522,
0.9999212026596069,
0.9999579191207886,
1.0,
1.0,
0.9999997615814209,
0.9999998807907104,
0.9999997615814209,
1.0,
0.9999997615814209,
1.0,
0.9999998807907104,
0.9999998807907104,
1.0,
1.0,
0.9977099895477295,
0.9999592304229736,
0.9994352459907532,
0.9997578263282776,
0.9999998807907104,
0.99998939037323,
0.9999998807907104,
0.9999998807907104,
1.0,
1.0
],
"eval_unhelpful_qa_runtime": 8.4513,
"eval_unhelpful_qa_samples_per_second": 11.832,
"eval_unhelpful_qa_steps_per_second": 0.237,
"epoch": 1.32,
"step": 50
},
{
"loss": 0.0003,
"learning_rate": 7.2e-05,
"epoch": 1.34,
"step": 51
},
{
"loss": 0.0008,
"learning_rate": 7.2e-05,
"epoch": 1.37,
"step": 52
},
{
"loss": 0.0002,
"learning_rate": 7.2e-05,
"epoch": 1.39,
"step": 53
},
{
"loss": 0.0001,
"learning_rate": 7.2e-05,
"epoch": 1.42,
"step": 54
},
{
"loss": 0.0004,
"learning_rate": 7.2e-05,
"epoch": 1.45,
"step": 55
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 1.47,
"step": 56
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 1.5,
"step": 57
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 1.53,
"step": 58
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 1.55,
"step": 59
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 1.58,
"step": 60
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 1.61,
"step": 61
},
{
"loss": 0.0001,
"learning_rate": 7.2e-05,
"epoch": 1.63,
"step": 62
},
{
"loss": 0.0001,
"learning_rate": 7.2e-05,
"epoch": 1.66,
"step": 63
},
{
"loss": 0.0001,
"learning_rate": 7.2e-05,
"epoch": 1.68,
"step": 64
},
{
"loss": 0.0001,
"learning_rate": 7.2e-05,
"epoch": 1.71,
"step": 65
},
{
"loss": 0.0005,
"learning_rate": 7.2e-05,
"epoch": 1.74,
"step": 66
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 1.76,
"step": 67
},
{
"loss": 0.0001,
"learning_rate": 7.2e-05,
"epoch": 1.79,
"step": 68
},
{
"loss": 0.0006,
"learning_rate": 7.2e-05,
"epoch": 1.82,
"step": 69
},
{
"loss": 0.0007,
"learning_rate": 7.2e-05,
"epoch": 1.84,
"step": 70
},
{
"loss": 0.0011,
"learning_rate": 7.2e-05,
"epoch": 1.87,
"step": 71
},
{
"loss": 0.0001,
"learning_rate": 7.2e-05,
"epoch": 1.89,
"step": 72
},
{
"loss": 0.0002,
"learning_rate": 7.2e-05,
"epoch": 1.92,
"step": 73
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 1.95,
"step": 74
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 1.97,
"step": 75
},
{
"eval_unhelpful_qa_loss": 2.224229319836013e-05,
"eval_unhelpful_qa_score": -5.717748940980982e-09,
"eval_unhelpful_qa_brier_score": 5.717748940980982e-09,
"eval_unhelpful_qa_average_probability": 0.9999831914901733,
"eval_unhelpful_qa_accuracy": 1.0,
"eval_unhelpful_qa_probabilities": [
0.9999997615814209,
0.9999982118606567,
0.9994237422943115,
0.9999692440032959,
1.0,
0.9999997615814209,
1.0,
0.9999995231628418,
1.0,
1.0,
1.0,
1.0,
0.9999576807022095,
0.9999715089797974,
1.0,
0.9999998807907104,
0.9999959468841553,
0.9999905824661255,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999998807907104,
0.9999998807907104,
0.9999996423721313,
1.0,
1.0,
0.9997066855430603,
0.9996340274810791,
0.9999668598175049,
0.9999656677246094,
0.9999994039535522,
1.0,
1.0,
1.0,
0.9999997615814209,
0.9999434947967529,
1.0,
1.0,
0.9999998807907104,
0.9999998807907104,
0.9999998807907104,
0.9999996423721313,
1.0,
1.0,
0.9999988079071045,
0.9999988079071045,
1.0,
1.0,
1.0,
1.0,
0.999996542930603,
0.9999923706054688,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999998807907104,
1.0,
0.9999990463256836,
0.9999997615814209,
1.0,
1.0,
0.9999990463256836,
0.9999986886978149,
1.0,
1.0,
0.9999765157699585,
0.9999898672103882,
1.0,
1.0,
0.9999873638153076,
0.9999938011169434,
0.9999959468841553,
0.9999977350234985,
0.9999998807907104,
0.9999998807907104,
0.9999998807907104,
0.9999998807907104,
1.0,
1.0,
0.9999997615814209,
0.9999998807907104,
1.0,
1.0,
1.0,
1.0,
0.9999029636383057,
0.9999897480010986,
0.99998939037323,
0.9999954700469971,
1.0,
0.9999998807907104,
0.9999998807907104,
1.0,
1.0,
1.0
],
"eval_unhelpful_qa_runtime": 8.4444,
"eval_unhelpful_qa_samples_per_second": 11.842,
"eval_unhelpful_qa_steps_per_second": 0.237,
"epoch": 1.97,
"step": 75
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 2.0,
"step": 76
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 2.03,
"step": 77
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 2.05,
"step": 78
},
{
"loss": 0.0002,
"learning_rate": 7.2e-05,
"epoch": 2.08,
"step": 79
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 2.11,
"step": 80
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 2.13,
"step": 81
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 2.16,
"step": 82
},
{
"loss": 0.0003,
"learning_rate": 7.2e-05,
"epoch": 2.18,
"step": 83
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 2.21,
"step": 84
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 2.24,
"step": 85
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 2.26,
"step": 86
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 2.29,
"step": 87
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 2.32,
"step": 88
},
{
"loss": 0.0001,
"learning_rate": 7.2e-05,
"epoch": 2.34,
"step": 89
},
{
"loss": 0.0004,
"learning_rate": 7.2e-05,
"epoch": 2.37,
"step": 90
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 2.39,
"step": 91
},
{
"loss": 0.0002,
"learning_rate": 7.2e-05,
"epoch": 2.42,
"step": 92
},
{
"loss": 0.0004,
"learning_rate": 7.2e-05,
"epoch": 2.45,
"step": 93
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 2.47,
"step": 94
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 2.5,
"step": 95
},
{
"loss": 0.0001,
"learning_rate": 7.2e-05,
"epoch": 2.53,
"step": 96
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 2.55,
"step": 97
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 2.58,
"step": 98
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 2.61,
"step": 99
},
{
"loss": 0.0,
"learning_rate": 7.2e-05,
"epoch": 2.63,
"step": 100
},
{
"eval_unhelpful_qa_loss": 1.810065623431001e-05,
"eval_unhelpful_qa_score": -6.358372939274659e-09,
"eval_unhelpful_qa_brier_score": 6.358372939274659e-09,
"eval_unhelpful_qa_average_probability": 0.9999858140945435,
"eval_unhelpful_qa_accuracy": 1.0,
"eval_unhelpful_qa_probabilities": [
0.9999998807907104,
0.9999996423721313,
0.9997879862785339,
0.9999940395355225,
1.0,
1.0,
1.0,
0.9999997615814209,
1.0,
1.0,
1.0,
1.0,
0.9999822378158569,
0.9999915361404419,
1.0,
1.0,
0.9999984502792358,
0.9999960660934448,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999998807907104,
1.0,
1.0,
0.9995390176773071,
0.9993865489959717,
0.9999877214431763,
0.9999871253967285,
0.9999998807907104,
1.0,
1.0,
1.0,
1.0,
0.9999812841415405,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999998807907104,
1.0,
1.0,
0.9999996423721313,
0.9999995231628418,
1.0,
1.0,
1.0,
1.0,
0.9999990463256836,
0.9999977350234985,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999998807907104,
1.0,
1.0,
1.0,
0.9999995231628418,
0.9999994039535522,
1.0,
1.0,
0.999992847442627,
0.9999972581863403,
1.0,
1.0,
0.9999963045120239,
0.9999970197677612,
0.9999986886978149,
0.9999991655349731,
0.9999998807907104,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999709129333496,
0.9999969005584717,
0.999997615814209,
0.999998927116394,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0
],
"eval_unhelpful_qa_runtime": 8.434,
"eval_unhelpful_qa_samples_per_second": 11.857,
"eval_unhelpful_qa_steps_per_second": 0.237,
"epoch": 2.63,
"step": 100
},
{
"train_runtime": 775.6839,
"train_samples_per_second": 4.125,
"train_steps_per_second": 0.129,
"total_flos": 0.0,
"train_loss": 0.0821405840863207,
"epoch": 2.63,
"step": 100
}
]]