路卡
commited on
Commit
•
2e554e9
1
Parent(s):
ffb74e4
init
Browse files- .ossutil_checkpoint/48c676315533e611d7cd754890b5075e-d712583ecacd6a6df77151d53d30076c.cp +1 -0
- .ossutil_checkpoint/d053d2b482cdbeddf778161d292507c7-3feaef7dd3e84e71d74f83849c381748.cp +1 -0
- README.md +59 -3
- all_results.json +7 -0
- config.json +29 -0
- generation_config.json +7 -0
- model-00001-of-00029.safetensors +3 -0
- model-00002-of-00029.safetensors +3 -0
- model-00003-of-00029.safetensors +3 -0
- model-00004-of-00029.safetensors +3 -0
- model-00005-of-00029.safetensors +3 -0
- model-00006-of-00029.safetensors +3 -0
- model-00007-of-00029.safetensors +3 -0
- model-00008-of-00029.safetensors +3 -0
- model-00009-of-00029.safetensors +3 -0
- model-00010-of-00029.safetensors +3 -0
- model-00011-of-00029.safetensors +3 -0
- model-00012-of-00029.safetensors +3 -0
- model-00013-of-00029.safetensors +3 -0
- model-00014-of-00029.safetensors +3 -0
- model-00015-of-00029.safetensors +3 -0
- model-00016-of-00029.safetensors +3 -0
- model-00017-of-00029.safetensors +3 -0
- model-00018-of-00029.safetensors +3 -0
- model-00019-of-00029.safetensors +3 -0
- model-00020-of-00029.safetensors +3 -0
- model-00021-of-00029.safetensors +3 -0
- model-00022-of-00029.safetensors +3 -0
- model-00023-of-00029.safetensors +3 -0
- model-00024-of-00029.safetensors +3 -0
- model-00025-of-00029.safetensors +3 -0
- model-00026-of-00029.safetensors +3 -0
- model-00027-of-00029.safetensors +3 -0
- model-00028-of-00029.safetensors +3 -0
- model-00029-of-00029.safetensors +3 -0
- model.safetensors.index.json +730 -0
- special_tokens_map.json +30 -0
- tokenizer.json +0 -0
- tokenizer.model +3 -0
- tokenizer_config.json +43 -0
- train_results.json +7 -0
- trainer_log.jsonl +44 -0
- trainer_state.json +90 -0
- training_args.bin +3 -0
- training_loss.png +0 -0
.ossutil_checkpoint/48c676315533e611d7cd754890b5075e-d712583ecacd6a6df77151d53d30076c.cp
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"Magic":"92611BED-89E2-46B6-89E5-72F273D4B0A3","MD5":"39UdeVK4DFejoGg8V+5JlA==","FilePath":"./model-00001-of-00029.safetensors","Object":"lukeming.lkm/ckpts/MuggleMATH_70B/model-00001-of-00029.safetensors","ObjStat":{"Size":4718660336,"LastModified":"Thu, 23 May 2024 07:44:31 GMT","Etag":"\"B8B72314F5A65CA755A0758A0DD4F1A8-400\""},"Parts":[{"Index":0,"Start":0,"End":11796650,"Offset":0,"CRC64":7734103908939600283},{"Index":1,"Start":11796651,"End":23593301,"Offset":0,"CRC64":13946797209173438414},{"Index":2,"Start":23593302,"End":35389952,"Offset":0,"CRC64":6522356605359540525},{"Index":3,"Start":35389953,"End":47186603,"Offset":0,"CRC64":3117497203324519042},{"Index":4,"Start":47186604,"End":58983254,"Offset":0,"CRC64":2107163154314994146},{"Index":5,"Start":58983255,"End":70779905,"Offset":0,"CRC64":2252182964793588192},{"Index":6,"Start":70779906,"End":82576556,"Offset":0,"CRC64":11158521091770250582},{"Index":7,"Start":82576557,"End":94373207,"Offset":0,"CRC64":8323376016140168251},{"Index":8,"Start":94373208,"End":106169858,"Offset":0,"CRC64":4564559710057877774},{"Index":9,"Start":106169859,"End":117966509,"Offset":0,"CRC64":6648284542793722288},{"Index":10,"Start":117966510,"End":129763160,"Offset":0,"CRC64":6843877926650281737},{"Index":11,"Start":129763161,"End":141559811,"Offset":0,"CRC64":7324989584136854474},{"Index":12,"Start":141559812,"End":153356462,"Offset":0,"CRC64":2294434949326897558},{"Index":13,"Start":153356463,"End":165153113,"Offset":0,"CRC64":4086485204359859989},{"Index":14,"Start":165153114,"End":176949764,"Offset":0,"CRC64":16310818712231293452},{"Index":15,"Start":176949765,"End":188746415,"Offset":0,"CRC64":16758457411500040791},{"Index":16,"Start":188746416,"End":200543066,"Offset":0,"CRC64":12165807584262201641},{"Index":17,"Start":200543067,"End":212339717,"Offset":0,"CRC64":7174588206375560363},{"Index":18,"Start":212339718,"End":224136368,"Offset":0,"CRC64":15232022520324217815},{"Index":19,"Start":224136369,"End":235933019,"Offs
et":0,"CRC64":10753117933180140319},{"Index":20,"Start":235933020,"End":247729670,"Offset":0,"CRC64":11891670518696121651},{"Index":21,"Start":247729671,"End":259526321,"Offset":0,"CRC64":10360606638270250153},{"Index":22,"Start":259526322,"End":271322972,"Offset":0,"CRC64":4842394567191982555},{"Index":23,"Start":271322973,"End":283119623,"Offset":0,"CRC64":15466180023694753038},{"Index":24,"Start":283119624,"End":294916274,"Offset":0,"CRC64":17278651481439366333},{"Index":25,"Start":294916275,"End":306712925,"Offset":0,"CRC64":17528679591708311910},{"Index":26,"Start":306712926,"End":318509576,"Offset":0,"CRC64":13591749462233292433},{"Index":27,"Start":318509577,"End":330306227,"Offset":0,"CRC64":7351374801468350070},{"Index":28,"Start":330306228,"End":342102878,"Offset":0,"CRC64":2239865038877898494},{"Index":29,"Start":342102879,"End":353899529,"Offset":0,"CRC64":3135988359496048238},{"Index":30,"Start":353899530,"End":365696180,"Offset":0,"CRC64":14479971787162511573},{"Index":31,"Start":365696181,"End":377492831,"Offset":0,"CRC64":12645989155660017377},{"Index":32,"Start":377492832,"End":389289482,"Offset":0,"CRC64":9521224400584333947},{"Index":33,"Start":389289483,"End":401086133,"Offset":0,"CRC64":3943705059016206527},{"Index":34,"Start":401086134,"End":412882784,"Offset":0,"CRC64":2059250154093896235},{"Index":35,"Start":412882785,"End":424679435,"Offset":0,"CRC64":2612536668580787815},{"Index":36,"Start":424679436,"End":436476086,"Offset":0,"CRC64":12359524698496950769},{"Index":37,"Start":436476087,"End":448272737,"Offset":0,"CRC64":17953878105145873185},{"Index":38,"Start":448272738,"End":460069388,"Offset":0,"CRC64":7688179382154582285},{"Index":39,"Start":460069389,"End":471866039,"Offset":0,"CRC64":12664330962337419862},{"Index":40,"Start":471866040,"End":483662690,"Offset":0,"CRC64":2417373381611650965},{"Index":41,"Start":483662691,"End":495459341,"Offset":0,"CRC64":8558757232920379343},{"Index":42,"Start":495459342,"End":507255992,"Offset":0,"CRC
64":7399801473079246540},{"Index":43,"Start":507255993,"End":519052643,"Offset":0,"CRC64":9805207422636938175},{"Index":44,"Start":519052644,"End":530849294,"Offset":0,"CRC64":5240013993706589142},{"Index":45,"Start":530849295,"End":542645945,"Offset":0,"CRC64":1562999921063104423},{"Index":46,"Start":542645946,"End":554442596,"Offset":0,"CRC64":15407629091861646893},{"Index":47,"Start":554442597,"End":566239247,"Offset":0,"CRC64":2807194333079361599},{"Index":48,"Start":566239248,"End":578035898,"Offset":0,"CRC64":7535713447309415267},{"Index":49,"Start":578035899,"End":589832549,"Offset":0,"CRC64":10444205549846255608},{"Index":50,"Start":589832550,"End":601629200,"Offset":0,"CRC64":12983761514076363698},{"Index":51,"Start":601629201,"End":613425851,"Offset":0,"CRC64":6127471005251864035},{"Index":52,"Start":613425852,"End":625222502,"Offset":0,"CRC64":5018572865074776406},{"Index":53,"Start":625222503,"End":637019153,"Offset":0,"CRC64":2076272156518857384},{"Index":54,"Start":637019154,"End":648815804,"Offset":0,"CRC64":10149648838630035461},{"Index":55,"Start":648815805,"End":660612455,"Offset":0,"CRC64":897798584627247841},{"Index":56,"Start":660612456,"End":672409106,"Offset":0,"CRC64":18186021319043360166},{"Index":57,"Start":672409107,"End":684205757,"Offset":0,"CRC64":18424898970797850335},{"Index":58,"Start":684205758,"End":696002408,"Offset":0,"CRC64":4066330460845409264},{"Index":59,"Start":696002409,"End":707799059,"Offset":0,"CRC64":18065653842779634761},{"Index":60,"Start":707799060,"End":719595710,"Offset":0,"CRC64":5659405315101506615},{"Index":61,"Start":719595711,"End":731392361,"Offset":0,"CRC64":1934359076054688293},{"Index":62,"Start":731392362,"End":743189012,"Offset":0,"CRC64":4003681020197115752},{"Index":63,"Start":743189013,"End":754985663,"Offset":0,"CRC64":12175557224575475796},{"Index":64,"Start":754985664,"End":766782314,"Offset":0,"CRC64":17308077171406247301},{"Index":65,"Start":766782315,"End":778578965,"Offset":0,"CRC64":0},{"Index
":66,"Start":778578966,"End":790375616,"Offset":0,"CRC64":0},{"Index":67,"Start":790375617,"End":802172267,"Offset":0,"CRC64":0},{"Index":68,"Start":802172268,"End":813968918,"Offset":0,"CRC64":0},{"Index":69,"Start":813968919,"End":825765569,"Offset":0,"CRC64":0},{"Index":70,"Start":825765570,"End":837562220,"Offset":0,"CRC64":0},{"Index":71,"Start":837562221,"End":849358871,"Offset":0,"CRC64":0},{"Index":72,"Start":849358872,"End":861155522,"Offset":0,"CRC64":0},{"Index":73,"Start":861155523,"End":872952173,"Offset":0,"CRC64":0},{"Index":74,"Start":872952174,"End":884748824,"Offset":0,"CRC64":0},{"Index":75,"Start":884748825,"End":896545475,"Offset":0,"CRC64":0},{"Index":76,"Start":896545476,"End":908342126,"Offset":0,"CRC64":0},{"Index":77,"Start":908342127,"End":920138777,"Offset":0,"CRC64":0},{"Index":78,"Start":920138778,"End":931935428,"Offset":0,"CRC64":0},{"Index":79,"Start":931935429,"End":943732079,"Offset":0,"CRC64":0},{"Index":80,"Start":943732080,"End":955528730,"Offset":0,"CRC64":0},{"Index":81,"Start":955528731,"End":967325381,"Offset":0,"CRC64":0},{"Index":82,"Start":967325382,"End":979122032,"Offset":0,"CRC64":0},{"Index":83,"Start":979122033,"End":990918683,"Offset":0,"CRC64":0},{"Index":84,"Start":990918684,"End":1002715334,"Offset":0,"CRC64":0},{"Index":85,"Start":1002715335,"End":1014511985,"Offset":0,"CRC64":0},{"Index":86,"Start":1014511986,"End":1026308636,"Offset":0,"CRC64":0},{"Index":87,"Start":1026308637,"End":1038105287,"Offset":0,"CRC64":0},{"Index":88,"Start":1038105288,"End":1049901938,"Offset":0,"CRC64":0},{"Index":89,"Start":1049901939,"End":1061698589,"Offset":0,"CRC64":0},{"Index":90,"Start":1061698590,"End":1073495240,"Offset":0,"CRC64":0},{"Index":91,"Start":1073495241,"End":1085291891,"Offset":0,"CRC64":0},{"Index":92,"Start":1085291892,"End":1097088542,"Offset":0,"CRC64":0},{"Index":93,"Start":1097088543,"End":1108885193,"Offset":0,"CRC64":0},{"Index":94,"Start":1108885194,"End":1120681844,"Offset":0,"CRC64":0},{"Index":95,"S
tart":1120681845,"End":1132478495,"Offset":0,"CRC64":0},{"Index":96,"Start":1132478496,"End":1144275146,"Offset":0,"CRC64":0},{"Index":97,"Start":1144275147,"End":1156071797,"Offset":0,"CRC64":0},{"Index":98,"Start":1156071798,"End":1167868448,"Offset":0,"CRC64":0},{"Index":99,"Start":1167868449,"End":1179665099,"Offset":0,"CRC64":0},{"Index":100,"Start":1179665100,"End":1191461750,"Offset":0,"CRC64":0},{"Index":101,"Start":1191461751,"End":1203258401,"Offset":0,"CRC64":0},{"Index":102,"Start":1203258402,"End":1215055052,"Offset":0,"CRC64":0},{"Index":103,"Start":1215055053,"End":1226851703,"Offset":0,"CRC64":0},{"Index":104,"Start":1226851704,"End":1238648354,"Offset":0,"CRC64":0},{"Index":105,"Start":1238648355,"End":1250445005,"Offset":0,"CRC64":0},{"Index":106,"Start":1250445006,"End":1262241656,"Offset":0,"CRC64":0},{"Index":107,"Start":1262241657,"End":1274038307,"Offset":0,"CRC64":0},{"Index":108,"Start":1274038308,"End":1285834958,"Offset":0,"CRC64":0},{"Index":109,"Start":1285834959,"End":1297631609,"Offset":0,"CRC64":0},{"Index":110,"Start":1297631610,"End":1309428260,"Offset":0,"CRC64":0},{"Index":111,"Start":1309428261,"End":1321224911,"Offset":0,"CRC64":0},{"Index":112,"Start":1321224912,"End":1333021562,"Offset":0,"CRC64":0},{"Index":113,"Start":1333021563,"End":1344818213,"Offset":0,"CRC64":0},{"Index":114,"Start":1344818214,"End":1356614864,"Offset":0,"CRC64":0},{"Index":115,"Start":1356614865,"End":1368411515,"Offset":0,"CRC64":0},{"Index":116,"Start":1368411516,"End":1380208166,"Offset":0,"CRC64":0},{"Index":117,"Start":1380208167,"End":1392004817,"Offset":0,"CRC64":0},{"Index":118,"Start":1392004818,"End":1403801468,"Offset":0,"CRC64":0},{"Index":119,"Start":1403801469,"End":1415598119,"Offset":0,"CRC64":0},{"Index":120,"Start":1415598120,"End":1427394770,"Offset":0,"CRC64":0},{"Index":121,"Start":1427394771,"End":1439191421,"Offset":0,"CRC64":0},{"Index":122,"Start":1439191422,"End":1450988072,"Offset":0,"CRC64":0},{"Index":123,"Start":1450988073
,"End":1462784723,"Offset":0,"CRC64":0},{"Index":124,"Start":1462784724,"End":1474581374,"Offset":0,"CRC64":0},{"Index":125,"Start":1474581375,"End":1486378025,"Offset":0,"CRC64":0},{"Index":126,"Start":1486378026,"End":1498174676,"Offset":0,"CRC64":0},{"Index":127,"Start":1498174677,"End":1509971327,"Offset":0,"CRC64":0},{"Index":128,"Start":1509971328,"End":1521767978,"Offset":0,"CRC64":0},{"Index":129,"Start":1521767979,"End":1533564629,"Offset":0,"CRC64":0},{"Index":130,"Start":1533564630,"End":1545361280,"Offset":0,"CRC64":0},{"Index":131,"Start":1545361281,"End":1557157931,"Offset":0,"CRC64":0},{"Index":132,"Start":1557157932,"End":1568954582,"Offset":0,"CRC64":0},{"Index":133,"Start":1568954583,"End":1580751233,"Offset":0,"CRC64":0},{"Index":134,"Start":1580751234,"End":1592547884,"Offset":0,"CRC64":0},{"Index":135,"Start":1592547885,"End":1604344535,"Offset":0,"CRC64":0},{"Index":136,"Start":1604344536,"End":1616141186,"Offset":0,"CRC64":0},{"Index":137,"Start":1616141187,"End":1627937837,"Offset":0,"CRC64":0},{"Index":138,"Start":1627937838,"End":1639734488,"Offset":0,"CRC64":0},{"Index":139,"Start":1639734489,"End":1651531139,"Offset":0,"CRC64":0},{"Index":140,"Start":1651531140,"End":1663327790,"Offset":0,"CRC64":0},{"Index":141,"Start":1663327791,"End":1675124441,"Offset":0,"CRC64":0},{"Index":142,"Start":1675124442,"End":1686921092,"Offset":0,"CRC64":0},{"Index":143,"Start":1686921093,"End":1698717743,"Offset":0,"CRC64":0},{"Index":144,"Start":1698717744,"End":1710514394,"Offset":0,"CRC64":0},{"Index":145,"Start":1710514395,"End":1722311045,"Offset":0,"CRC64":0},{"Index":146,"Start":1722311046,"End":1734107696,"Offset":0,"CRC64":0},{"Index":147,"Start":1734107697,"End":1745904347,"Offset":0,"CRC64":0},{"Index":148,"Start":1745904348,"End":1757700998,"Offset":0,"CRC64":0},{"Index":149,"Start":1757700999,"End":1769497649,"Offset":0,"CRC64":0},{"Index":150,"Start":1769497650,"End":1781294300,"Offset":0,"CRC64":0},{"Index":151,"Start":1781294301,"End":17930
90951,"Offset":0,"CRC64":0},{"Index":152,"Start":1793090952,"End":1804887602,"Offset":0,"CRC64":0},{"Index":153,"Start":1804887603,"End":1816684253,"Offset":0,"CRC64":0},{"Index":154,"Start":1816684254,"End":1828480904,"Offset":0,"CRC64":0},{"Index":155,"Start":1828480905,"End":1840277555,"Offset":0,"CRC64":0},{"Index":156,"Start":1840277556,"End":1852074206,"Offset":0,"CRC64":0},{"Index":157,"Start":1852074207,"End":1863870857,"Offset":0,"CRC64":0},{"Index":158,"Start":1863870858,"End":1875667508,"Offset":0,"CRC64":0},{"Index":159,"Start":1875667509,"End":1887464159,"Offset":0,"CRC64":0},{"Index":160,"Start":1887464160,"End":1899260810,"Offset":0,"CRC64":0},{"Index":161,"Start":1899260811,"End":1911057461,"Offset":0,"CRC64":0},{"Index":162,"Start":1911057462,"End":1922854112,"Offset":0,"CRC64":0},{"Index":163,"Start":1922854113,"End":1934650763,"Offset":0,"CRC64":0},{"Index":164,"Start":1934650764,"End":1946447414,"Offset":0,"CRC64":0},{"Index":165,"Start":1946447415,"End":1958244065,"Offset":0,"CRC64":0},{"Index":166,"Start":1958244066,"End":1970040716,"Offset":0,"CRC64":0},{"Index":167,"Start":1970040717,"End":1981837367,"Offset":0,"CRC64":0},{"Index":168,"Start":1981837368,"End":1993634018,"Offset":0,"CRC64":0},{"Index":169,"Start":1993634019,"End":2005430669,"Offset":0,"CRC64":0},{"Index":170,"Start":2005430670,"End":2017227320,"Offset":0,"CRC64":0},{"Index":171,"Start":2017227321,"End":2029023971,"Offset":0,"CRC64":0},{"Index":172,"Start":2029023972,"End":2040820622,"Offset":0,"CRC64":0},{"Index":173,"Start":2040820623,"End":2052617273,"Offset":0,"CRC64":0},{"Index":174,"Start":2052617274,"End":2064413924,"Offset":0,"CRC64":0},{"Index":175,"Start":2064413925,"End":2076210575,"Offset":0,"CRC64":0},{"Index":176,"Start":2076210576,"End":2088007226,"Offset":0,"CRC64":0},{"Index":177,"Start":2088007227,"End":2099803877,"Offset":0,"CRC64":0},{"Index":178,"Start":2099803878,"End":2111600528,"Offset":0,"CRC64":0},{"Index":179,"Start":2111600529,"End":2123397179,"Offse
t":0,"CRC64":0},{"Index":180,"Start":2123397180,"End":2135193830,"Offset":0,"CRC64":0},{"Index":181,"Start":2135193831,"End":2146990481,"Offset":0,"CRC64":0},{"Index":182,"Start":2146990482,"End":2158787132,"Offset":0,"CRC64":0},{"Index":183,"Start":2158787133,"End":2170583783,"Offset":0,"CRC64":0},{"Index":184,"Start":2170583784,"End":2182380434,"Offset":0,"CRC64":0},{"Index":185,"Start":2182380435,"End":2194177085,"Offset":0,"CRC64":0},{"Index":186,"Start":2194177086,"End":2205973736,"Offset":0,"CRC64":0},{"Index":187,"Start":2205973737,"End":2217770387,"Offset":0,"CRC64":0},{"Index":188,"Start":2217770388,"End":2229567038,"Offset":0,"CRC64":0},{"Index":189,"Start":2229567039,"End":2241363689,"Offset":0,"CRC64":0},{"Index":190,"Start":2241363690,"End":2253160340,"Offset":0,"CRC64":0},{"Index":191,"Start":2253160341,"End":2264956991,"Offset":0,"CRC64":0},{"Index":192,"Start":2264956992,"End":2276753642,"Offset":0,"CRC64":0},{"Index":193,"Start":2276753643,"End":2288550293,"Offset":0,"CRC64":0},{"Index":194,"Start":2288550294,"End":2300346944,"Offset":0,"CRC64":0},{"Index":195,"Start":2300346945,"End":2312143595,"Offset":0,"CRC64":0},{"Index":196,"Start":2312143596,"End":2323940246,"Offset":0,"CRC64":0},{"Index":197,"Start":2323940247,"End":2335736897,"Offset":0,"CRC64":0},{"Index":198,"Start":2335736898,"End":2347533548,"Offset":0,"CRC64":0},{"Index":199,"Start":2347533549,"End":2359330199,"Offset":0,"CRC64":0},{"Index":200,"Start":2359330200,"End":2371126850,"Offset":0,"CRC64":0},{"Index":201,"Start":2371126851,"End":2382923501,"Offset":0,"CRC64":0},{"Index":202,"Start":2382923502,"End":2394720152,"Offset":0,"CRC64":0},{"Index":203,"Start":2394720153,"End":2406516803,"Offset":0,"CRC64":0},{"Index":204,"Start":2406516804,"End":2418313454,"Offset":0,"CRC64":0},{"Index":205,"Start":2418313455,"End":2430110105,"Offset":0,"CRC64":0},{"Index":206,"Start":2430110106,"End":2441906756,"Offset":0,"CRC64":0},{"Index":207,"Start":2441906757,"End":2453703407,"Offset":0,"CRC64"
:0},{"Index":208,"Start":2453703408,"End":2465500058,"Offset":0,"CRC64":0},{"Index":209,"Start":2465500059,"End":2477296709,"Offset":0,"CRC64":0},{"Index":210,"Start":2477296710,"End":2489093360,"Offset":0,"CRC64":0},{"Index":211,"Start":2489093361,"End":2500890011,"Offset":0,"CRC64":0},{"Index":212,"Start":2500890012,"End":2512686662,"Offset":0,"CRC64":0},{"Index":213,"Start":2512686663,"End":2524483313,"Offset":0,"CRC64":0},{"Index":214,"Start":2524483314,"End":2536279964,"Offset":0,"CRC64":0},{"Index":215,"Start":2536279965,"End":2548076615,"Offset":0,"CRC64":0},{"Index":216,"Start":2548076616,"End":2559873266,"Offset":0,"CRC64":0},{"Index":217,"Start":2559873267,"End":2571669917,"Offset":0,"CRC64":0},{"Index":218,"Start":2571669918,"End":2583466568,"Offset":0,"CRC64":0},{"Index":219,"Start":2583466569,"End":2595263219,"Offset":0,"CRC64":0},{"Index":220,"Start":2595263220,"End":2607059870,"Offset":0,"CRC64":0},{"Index":221,"Start":2607059871,"End":2618856521,"Offset":0,"CRC64":0},{"Index":222,"Start":2618856522,"End":2630653172,"Offset":0,"CRC64":0},{"Index":223,"Start":2630653173,"End":2642449823,"Offset":0,"CRC64":0},{"Index":224,"Start":2642449824,"End":2654246474,"Offset":0,"CRC64":0},{"Index":225,"Start":2654246475,"End":2666043125,"Offset":0,"CRC64":0},{"Index":226,"Start":2666043126,"End":2677839776,"Offset":0,"CRC64":0},{"Index":227,"Start":2677839777,"End":2689636427,"Offset":0,"CRC64":0},{"Index":228,"Start":2689636428,"End":2701433078,"Offset":0,"CRC64":0},{"Index":229,"Start":2701433079,"End":2713229729,"Offset":0,"CRC64":0},{"Index":230,"Start":2713229730,"End":2725026380,"Offset":0,"CRC64":0},{"Index":231,"Start":2725026381,"End":2736823031,"Offset":0,"CRC64":0},{"Index":232,"Start":2736823032,"End":2748619682,"Offset":0,"CRC64":0},{"Index":233,"Start":2748619683,"End":2760416333,"Offset":0,"CRC64":0},{"Index":234,"Start":2760416334,"End":2772212984,"Offset":0,"CRC64":0},{"Index":235,"Start":2772212985,"End":2784009635,"Offset":0,"CRC64":0},{"Index"
:236,"Start":2784009636,"End":2795806286,"Offset":0,"CRC64":0},{"Index":237,"Start":2795806287,"End":2807602937,"Offset":0,"CRC64":0},{"Index":238,"Start":2807602938,"End":2819399588,"Offset":0,"CRC64":0},{"Index":239,"Start":2819399589,"End":2831196239,"Offset":0,"CRC64":0},{"Index":240,"Start":2831196240,"End":2842992890,"Offset":0,"CRC64":0},{"Index":241,"Start":2842992891,"End":2854789541,"Offset":0,"CRC64":0},{"Index":242,"Start":2854789542,"End":2866586192,"Offset":0,"CRC64":0},{"Index":243,"Start":2866586193,"End":2878382843,"Offset":0,"CRC64":0},{"Index":244,"Start":2878382844,"End":2890179494,"Offset":0,"CRC64":0},{"Index":245,"Start":2890179495,"End":2901976145,"Offset":0,"CRC64":0},{"Index":246,"Start":2901976146,"End":2913772796,"Offset":0,"CRC64":0},{"Index":247,"Start":2913772797,"End":2925569447,"Offset":0,"CRC64":0},{"Index":248,"Start":2925569448,"End":2937366098,"Offset":0,"CRC64":0},{"Index":249,"Start":2937366099,"End":2949162749,"Offset":0,"CRC64":0},{"Index":250,"Start":2949162750,"End":2960959400,"Offset":0,"CRC64":0},{"Index":251,"Start":2960959401,"End":2972756051,"Offset":0,"CRC64":0},{"Index":252,"Start":2972756052,"End":2984552702,"Offset":0,"CRC64":0},{"Index":253,"Start":2984552703,"End":2996349353,"Offset":0,"CRC64":0},{"Index":254,"Start":2996349354,"End":3008146004,"Offset":0,"CRC64":0},{"Index":255,"Start":3008146005,"End":3019942655,"Offset":0,"CRC64":0},{"Index":256,"Start":3019942656,"End":3031739306,"Offset":0,"CRC64":0},{"Index":257,"Start":3031739307,"End":3043535957,"Offset":0,"CRC64":0},{"Index":258,"Start":3043535958,"End":3055332608,"Offset":0,"CRC64":0},{"Index":259,"Start":3055332609,"End":3067129259,"Offset":0,"CRC64":0},{"Index":260,"Start":3067129260,"End":3078925910,"Offset":0,"CRC64":0},{"Index":261,"Start":3078925911,"End":3090722561,"Offset":0,"CRC64":0},{"Index":262,"Start":3090722562,"End":3102519212,"Offset":0,"CRC64":0},{"Index":263,"Start":3102519213,"End":3114315863,"Offset":0,"CRC64":0},{"Index":264,"Start"
:3114315864,"End":3126112514,"Offset":0,"CRC64":0},{"Index":265,"Start":3126112515,"End":3137909165,"Offset":0,"CRC64":0},{"Index":266,"Start":3137909166,"End":3149705816,"Offset":0,"CRC64":0},{"Index":267,"Start":3149705817,"End":3161502467,"Offset":0,"CRC64":0},{"Index":268,"Start":3161502468,"End":3173299118,"Offset":0,"CRC64":0},{"Index":269,"Start":3173299119,"End":3185095769,"Offset":0,"CRC64":0},{"Index":270,"Start":3185095770,"End":3196892420,"Offset":0,"CRC64":0},{"Index":271,"Start":3196892421,"End":3208689071,"Offset":0,"CRC64":0},{"Index":272,"Start":3208689072,"End":3220485722,"Offset":0,"CRC64":0},{"Index":273,"Start":3220485723,"End":3232282373,"Offset":0,"CRC64":0},{"Index":274,"Start":3232282374,"End":3244079024,"Offset":0,"CRC64":0},{"Index":275,"Start":3244079025,"End":3255875675,"Offset":0,"CRC64":0},{"Index":276,"Start":3255875676,"End":3267672326,"Offset":0,"CRC64":0},{"Index":277,"Start":3267672327,"End":3279468977,"Offset":0,"CRC64":0},{"Index":278,"Start":3279468978,"End":3291265628,"Offset":0,"CRC64":0},{"Index":279,"Start":3291265629,"End":3303062279,"Offset":0,"CRC64":0},{"Index":280,"Start":3303062280,"End":3314858930,"Offset":0,"CRC64":0},{"Index":281,"Start":3314858931,"End":3326655581,"Offset":0,"CRC64":0},{"Index":282,"Start":3326655582,"End":3338452232,"Offset":0,"CRC64":0},{"Index":283,"Start":3338452233,"End":3350248883,"Offset":0,"CRC64":0},{"Index":284,"Start":3350248884,"End":3362045534,"Offset":0,"CRC64":0},{"Index":285,"Start":3362045535,"End":3373842185,"Offset":0,"CRC64":0},{"Index":286,"Start":3373842186,"End":3385638836,"Offset":0,"CRC64":0},{"Index":287,"Start":3385638837,"End":3397435487,"Offset":0,"CRC64":0},{"Index":288,"Start":3397435488,"End":3409232138,"Offset":0,"CRC64":0},{"Index":289,"Start":3409232139,"End":3421028789,"Offset":0,"CRC64":0},{"Index":290,"Start":3421028790,"End":3432825440,"Offset":0,"CRC64":0},{"Index":291,"Start":3432825441,"End":3444622091,"Offset":0,"CRC64":0},{"Index":292,"Start":3444622092,
"End":3456418742,"Offset":0,"CRC64":0},{"Index":293,"Start":3456418743,"End":3468215393,"Offset":0,"CRC64":0},{"Index":294,"Start":3468215394,"End":3480012044,"Offset":0,"CRC64":0},{"Index":295,"Start":3480012045,"End":3491808695,"Offset":0,"CRC64":0},{"Index":296,"Start":3491808696,"End":3503605346,"Offset":0,"CRC64":0},{"Index":297,"Start":3503605347,"End":3515401997,"Offset":0,"CRC64":0},{"Index":298,"Start":3515401998,"End":3527198648,"Offset":0,"CRC64":0},{"Index":299,"Start":3527198649,"End":3538995299,"Offset":0,"CRC64":0},{"Index":300,"Start":3538995300,"End":3550791950,"Offset":0,"CRC64":0},{"Index":301,"Start":3550791951,"End":3562588601,"Offset":0,"CRC64":0},{"Index":302,"Start":3562588602,"End":3574385252,"Offset":0,"CRC64":0},{"Index":303,"Start":3574385253,"End":3586181903,"Offset":0,"CRC64":0},{"Index":304,"Start":3586181904,"End":3597978554,"Offset":0,"CRC64":0},{"Index":305,"Start":3597978555,"End":3609775205,"Offset":0,"CRC64":0},{"Index":306,"Start":3609775206,"End":3621571856,"Offset":0,"CRC64":0},{"Index":307,"Start":3621571857,"End":3633368507,"Offset":0,"CRC64":0},{"Index":308,"Start":3633368508,"End":3645165158,"Offset":0,"CRC64":0},{"Index":309,"Start":3645165159,"End":3656961809,"Offset":0,"CRC64":0},{"Index":310,"Start":3656961810,"End":3668758460,"Offset":0,"CRC64":0},{"Index":311,"Start":3668758461,"End":3680555111,"Offset":0,"CRC64":0},{"Index":312,"Start":3680555112,"End":3692351762,"Offset":0,"CRC64":0},{"Index":313,"Start":3692351763,"End":3704148413,"Offset":0,"CRC64":0},{"Index":314,"Start":3704148414,"End":3715945064,"Offset":0,"CRC64":0},{"Index":315,"Start":3715945065,"End":3727741715,"Offset":0,"CRC64":0},{"Index":316,"Start":3727741716,"End":3739538366,"Offset":0,"CRC64":0},{"Index":317,"Start":3739538367,"End":3751335017,"Offset":0,"CRC64":0},{"Index":318,"Start":3751335018,"End":3763131668,"Offset":0,"CRC64":0},{"Index":319,"Start":3763131669,"End":3774928319,"Offset":0,"CRC64":0},{"Index":320,"Start":3774928320,"End":378672
4970,"Offset":0,"CRC64":0},{"Index":321,"Start":3786724971,"End":3798521621,"Offset":0,"CRC64":0},{"Index":322,"Start":3798521622,"End":3810318272,"Offset":0,"CRC64":0},{"Index":323,"Start":3810318273,"End":3822114923,"Offset":0,"CRC64":0},{"Index":324,"Start":3822114924,"End":3833911574,"Offset":0,"CRC64":0},{"Index":325,"Start":3833911575,"End":3845708225,"Offset":0,"CRC64":0},{"Index":326,"Start":3845708226,"End":3857504876,"Offset":0,"CRC64":0},{"Index":327,"Start":3857504877,"End":3869301527,"Offset":0,"CRC64":0},{"Index":328,"Start":3869301528,"End":3881098178,"Offset":0,"CRC64":0},{"Index":329,"Start":3881098179,"End":3892894829,"Offset":0,"CRC64":0},{"Index":330,"Start":3892894830,"End":3904691480,"Offset":0,"CRC64":0},{"Index":331,"Start":3904691481,"End":3916488131,"Offset":0,"CRC64":0},{"Index":332,"Start":3916488132,"End":3928284782,"Offset":0,"CRC64":0},{"Index":333,"Start":3928284783,"End":3940081433,"Offset":0,"CRC64":0},{"Index":334,"Start":3940081434,"End":3951878084,"Offset":0,"CRC64":0},{"Index":335,"Start":3951878085,"End":3963674735,"Offset":0,"CRC64":0},{"Index":336,"Start":3963674736,"End":3975471386,"Offset":0,"CRC64":0},{"Index":337,"Start":3975471387,"End":3987268037,"Offset":0,"CRC64":0},{"Index":338,"Start":3987268038,"End":3999064688,"Offset":0,"CRC64":0},{"Index":339,"Start":3999064689,"End":4010861339,"Offset":0,"CRC64":0},{"Index":340,"Start":4010861340,"End":4022657990,"Offset":0,"CRC64":0},{"Index":341,"Start":4022657991,"End":4034454641,"Offset":0,"CRC64":0},{"Index":342,"Start":4034454642,"End":4046251292,"Offset":0,"CRC64":0},{"Index":343,"Start":4046251293,"End":4058047943,"Offset":0,"CRC64":0},{"Index":344,"Start":4058047944,"End":4069844594,"Offset":0,"CRC64":0},{"Index":345,"Start":4069844595,"End":4081641245,"Offset":0,"CRC64":0},{"Index":346,"Start":4081641246,"End":4093437896,"Offset":0,"CRC64":0},{"Index":347,"Start":4093437897,"End":4105234547,"Offset":0,"CRC64":0},{"Index":348,"Start":4105234548,"End":4117031198,"Offset
":0,"CRC64":0},{"Index":349,"Start":4117031199,"End":4128827849,"Offset":0,"CRC64":0},{"Index":350,"Start":4128827850,"End":4140624500,"Offset":0,"CRC64":0},{"Index":351,"Start":4140624501,"End":4152421151,"Offset":0,"CRC64":0},{"Index":352,"Start":4152421152,"End":4164217802,"Offset":0,"CRC64":0},{"Index":353,"Start":4164217803,"End":4176014453,"Offset":0,"CRC64":0},{"Index":354,"Start":4176014454,"End":4187811104,"Offset":0,"CRC64":0},{"Index":355,"Start":4187811105,"End":4199607755,"Offset":0,"CRC64":0},{"Index":356,"Start":4199607756,"End":4211404406,"Offset":0,"CRC64":0},{"Index":357,"Start":4211404407,"End":4223201057,"Offset":0,"CRC64":0},{"Index":358,"Start":4223201058,"End":4234997708,"Offset":0,"CRC64":0},{"Index":359,"Start":4234997709,"End":4246794359,"Offset":0,"CRC64":0},{"Index":360,"Start":4246794360,"End":4258591010,"Offset":0,"CRC64":0},{"Index":361,"Start":4258591011,"End":4270387661,"Offset":0,"CRC64":0},{"Index":362,"Start":4270387662,"End":4282184312,"Offset":0,"CRC64":0},{"Index":363,"Start":4282184313,"End":4293980963,"Offset":0,"CRC64":0},{"Index":364,"Start":4293980964,"End":4305777614,"Offset":0,"CRC64":0},{"Index":365,"Start":4305777615,"End":4317574265,"Offset":0,"CRC64":0},{"Index":366,"Start":4317574266,"End":4329370916,"Offset":0,"CRC64":0},{"Index":367,"Start":4329370917,"End":4341167567,"Offset":0,"CRC64":0},{"Index":368,"Start":4341167568,"End":4352964218,"Offset":0,"CRC64":0},{"Index":369,"Start":4352964219,"End":4364760869,"Offset":0,"CRC64":0},{"Index":370,"Start":4364760870,"End":4376557520,"Offset":0,"CRC64":0},{"Index":371,"Start":4376557521,"End":4388354171,"Offset":0,"CRC64":0},{"Index":372,"Start":4388354172,"End":4400150822,"Offset":0,"CRC64":0},{"Index":373,"Start":4400150823,"End":4411947473,"Offset":0,"CRC64":0},{"Index":374,"Start":4411947474,"End":4423744124,"Offset":0,"CRC64":0},{"Index":375,"Start":4423744125,"End":4435540775,"Offset":0,"CRC64":0},{"Index":376,"Start":4435540776,"End":4447337426,"Offset":0,"CRC64":
0},{"Index":377,"Start":4447337427,"End":4459134077,"Offset":0,"CRC64":0},{"Index":378,"Start":4459134078,"End":4470930728,"Offset":0,"CRC64":0},{"Index":379,"Start":4470930729,"End":4482727379,"Offset":0,"CRC64":0},{"Index":380,"Start":4482727380,"End":4494524030,"Offset":0,"CRC64":0},{"Index":381,"Start":4494524031,"End":4506320681,"Offset":0,"CRC64":0},{"Index":382,"Start":4506320682,"End":4518117332,"Offset":0,"CRC64":0},{"Index":383,"Start":4518117333,"End":4529913983,"Offset":0,"CRC64":0},{"Index":384,"Start":4529913984,"End":4541710634,"Offset":0,"CRC64":0},{"Index":385,"Start":4541710635,"End":4553507285,"Offset":0,"CRC64":0},{"Index":386,"Start":4553507286,"End":4565303936,"Offset":0,"CRC64":0},{"Index":387,"Start":4565303937,"End":4577100587,"Offset":0,"CRC64":0},{"Index":388,"Start":4577100588,"End":4588897238,"Offset":0,"CRC64":0},{"Index":389,"Start":4588897239,"End":4600693889,"Offset":0,"CRC64":0},{"Index":390,"Start":4600693890,"End":4612490540,"Offset":0,"CRC64":0},{"Index":391,"Start":4612490541,"End":4624287191,"Offset":0,"CRC64":0},{"Index":392,"Start":4624287192,"End":4636083842,"Offset":0,"CRC64":0},{"Index":393,"Start":4636083843,"End":4647880493,"Offset":0,"CRC64":0},{"Index":394,"Start":4647880494,"End":4659677144,"Offset":0,"CRC64":0},{"Index":395,"Start":4659677145,"End":4671473795,"Offset":0,"CRC64":0},{"Index":396,"Start":4671473796,"End":4683270446,"Offset":0,"CRC64":0},{"Index":397,"Start":4683270447,"End":4695067097,"Offset":0,"CRC64":0},{"Index":398,"Start":4695067098,"End":4706863748,"Offset":0,"CRC64":0},{"Index":399,"Start":4706863749,"End":4718660335,"Offset":0,"CRC64":0}],"PartStat":[true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,false,false,false,false,fa
lse,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false],"Start":0,"End"
:0,"CRC":8229322551163540572}
|
.ossutil_checkpoint/d053d2b482cdbeddf778161d292507c7-3feaef7dd3e84e71d74f83849c381748.cp
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"Magic":"92611BED-89E2-46B6-89E5-72F273D4B0A3","MD5":"mT4bJdGkoH+elGKfpR/UHg==","FilePath":"./model-00002-of-00029.safetensors","Object":"lukeming.lkm/ckpts/MuggleMATH_70B/model-00002-of-00029.safetensors","ObjStat":{"Size":4664167376,"LastModified":"Thu, 23 May 2024 07:44:31 GMT","Etag":"\"E72B1F549177DFE02B067DA3B7C798C6-400\""},"Parts":[{"Index":0,"Start":0,"End":11660418,"Offset":0,"CRC64":10368645139660881830},{"Index":1,"Start":11660419,"End":23320837,"Offset":0,"CRC64":10961325361347256765},{"Index":2,"Start":23320838,"End":34981256,"Offset":0,"CRC64":3708697921186040670},{"Index":3,"Start":34981257,"End":46641675,"Offset":0,"CRC64":9047405136072969615},{"Index":4,"Start":46641676,"End":58302094,"Offset":0,"CRC64":944240148420449784},{"Index":5,"Start":58302095,"End":69962513,"Offset":0,"CRC64":12035190702942283733},{"Index":6,"Start":69962514,"End":81622932,"Offset":0,"CRC64":13305926003969242753},{"Index":7,"Start":81622933,"End":93283351,"Offset":0,"CRC64":2210904154344616086},{"Index":8,"Start":93283352,"End":104943770,"Offset":0,"CRC64":4242539274214137042},{"Index":9,"Start":104943771,"End":116604189,"Offset":0,"CRC64":8481860656238977215},{"Index":10,"Start":116604190,"End":128264608,"Offset":0,"CRC64":4161185334651582665},{"Index":11,"Start":128264609,"End":139925027,"Offset":0,"CRC64":13913449849767659401},{"Index":12,"Start":139925028,"End":151585446,"Offset":0,"CRC64":15540944646821163085},{"Index":13,"Start":151585447,"End":163245865,"Offset":0,"CRC64":7917054514325984966},{"Index":14,"Start":163245866,"End":174906284,"Offset":0,"CRC64":17178767107784259291},{"Index":15,"Start":174906285,"End":186566703,"Offset":0,"CRC64":13812673432586913773},{"Index":16,"Start":186566704,"End":198227122,"Offset":0,"CRC64":3653453705253504273},{"Index":17,"Start":198227123,"End":209887541,"Offset":0,"CRC64":11190013813454468347},{"Index":18,"Start":209887542,"End":221547960,"Offset":0,"CRC64":5533247556752930481},{"Index":19,"Start":221547961,"End":233208379,"Of
fset":0,"CRC64":15849036080534608692},{"Index":20,"Start":233208380,"End":244868798,"Offset":0,"CRC64":13703147084868492330},{"Index":21,"Start":244868799,"End":256529217,"Offset":0,"CRC64":5916236202680844092},{"Index":22,"Start":256529218,"End":268189636,"Offset":0,"CRC64":12275947725176245213},{"Index":23,"Start":268189637,"End":279850055,"Offset":0,"CRC64":18049087360047100379},{"Index":24,"Start":279850056,"End":291510474,"Offset":0,"CRC64":15499141766239173559},{"Index":25,"Start":291510475,"End":303170893,"Offset":0,"CRC64":340028435928279860},{"Index":26,"Start":303170894,"End":314831312,"Offset":0,"CRC64":15186312857499017160},{"Index":27,"Start":314831313,"End":326491731,"Offset":0,"CRC64":6922168739133407963},{"Index":28,"Start":326491732,"End":338152150,"Offset":0,"CRC64":8980608710238140365},{"Index":29,"Start":338152151,"End":349812569,"Offset":0,"CRC64":6469108255033812945},{"Index":30,"Start":349812570,"End":361472988,"Offset":0,"CRC64":11287381035623870338},{"Index":31,"Start":361472989,"End":373133407,"Offset":0,"CRC64":18256317411039136649},{"Index":32,"Start":373133408,"End":384793826,"Offset":0,"CRC64":819742292214934946},{"Index":33,"Start":384793827,"End":396454245,"Offset":0,"CRC64":4709100509873870267},{"Index":34,"Start":396454246,"End":408114664,"Offset":0,"CRC64":2469143290875329684},{"Index":35,"Start":408114665,"End":419775083,"Offset":0,"CRC64":6444565971909242549},{"Index":36,"Start":419775084,"End":431435502,"Offset":0,"CRC64":16693022421337334587},{"Index":37,"Start":431435503,"End":443095921,"Offset":0,"CRC64":13666188880747168306},{"Index":38,"Start":443095922,"End":454756340,"Offset":0,"CRC64":11349805719409723577},{"Index":39,"Start":454756341,"End":466416759,"Offset":0,"CRC64":7755691616683770537},{"Index":40,"Start":466416760,"End":478077178,"Offset":0,"CRC64":16714215758177607204},{"Index":41,"Start":478077179,"End":489737597,"Offset":0,"CRC64":12936468357410169352},{"Index":42,"Start":489737598,"End":501398016,"Offset":0,"CR
C64":18135976149709447687},{"Index":43,"Start":501398017,"End":513058435,"Offset":0,"CRC64":2137063146610027373},{"Index":44,"Start":513058436,"End":524718854,"Offset":0,"CRC64":18027700751305578471},{"Index":45,"Start":524718855,"End":536379273,"Offset":0,"CRC64":17070489883008053169},{"Index":46,"Start":536379274,"End":548039692,"Offset":0,"CRC64":12089509756774810301},{"Index":47,"Start":548039693,"End":559700111,"Offset":0,"CRC64":5250844095937064123},{"Index":48,"Start":559700112,"End":571360530,"Offset":0,"CRC64":17329324136696121029},{"Index":49,"Start":571360531,"End":583020949,"Offset":0,"CRC64":8243902950432017691},{"Index":50,"Start":583020950,"End":594681368,"Offset":0,"CRC64":3692218183166404253},{"Index":51,"Start":594681369,"End":606341787,"Offset":0,"CRC64":14860942240336948981},{"Index":52,"Start":606341788,"End":618002206,"Offset":0,"CRC64":11309456291437465096},{"Index":53,"Start":618002207,"End":629662625,"Offset":0,"CRC64":17279889133426672725},{"Index":54,"Start":629662626,"End":641323044,"Offset":0,"CRC64":14367998732942896796},{"Index":55,"Start":641323045,"End":652983463,"Offset":0,"CRC64":15446064298176669167},{"Index":56,"Start":652983464,"End":664643882,"Offset":0,"CRC64":1546999908191271705},{"Index":57,"Start":664643883,"End":676304301,"Offset":0,"CRC64":8586578867992460022},{"Index":58,"Start":676304302,"End":687964720,"Offset":0,"CRC64":1497801634519813361},{"Index":59,"Start":687964721,"End":699625139,"Offset":0,"CRC64":8710972666671602408},{"Index":60,"Start":699625140,"End":711285558,"Offset":0,"CRC64":3981061586075396065},{"Index":61,"Start":711285559,"End":722945977,"Offset":0,"CRC64":13225035173230182860},{"Index":62,"Start":722945978,"End":734606396,"Offset":0,"CRC64":12036921112722219165},{"Index":63,"Start":734606397,"End":746266815,"Offset":0,"CRC64":10562687976098495881},{"Index":64,"Start":746266816,"End":757927234,"Offset":0,"CRC64":3704439255300855077},{"Index":65,"Start":757927235,"End":769587653,"Offset":0,"CRC64":1612
4778209460514536},{"Index":66,"Start":769587654,"End":781248072,"Offset":0,"CRC64":17922332911749744390},{"Index":67,"Start":781248073,"End":792908491,"Offset":0,"CRC64":1523306128822911936},{"Index":68,"Start":792908492,"End":804568910,"Offset":0,"CRC64":15316974474598485549},{"Index":69,"Start":804568911,"End":816229329,"Offset":0,"CRC64":14784577240049233698},{"Index":70,"Start":816229330,"End":827889748,"Offset":0,"CRC64":0},{"Index":71,"Start":827889749,"End":839550167,"Offset":0,"CRC64":11690304918250955011},{"Index":72,"Start":839550168,"End":851210586,"Offset":0,"CRC64":0},{"Index":73,"Start":851210587,"End":862871005,"Offset":0,"CRC64":0},{"Index":74,"Start":862871006,"End":874531424,"Offset":0,"CRC64":0},{"Index":75,"Start":874531425,"End":886191843,"Offset":0,"CRC64":0},{"Index":76,"Start":886191844,"End":897852262,"Offset":0,"CRC64":0},{"Index":77,"Start":897852263,"End":909512681,"Offset":0,"CRC64":0},{"Index":78,"Start":909512682,"End":921173100,"Offset":0,"CRC64":0},{"Index":79,"Start":921173101,"End":932833519,"Offset":0,"CRC64":0},{"Index":80,"Start":932833520,"End":944493938,"Offset":0,"CRC64":0},{"Index":81,"Start":944493939,"End":956154357,"Offset":0,"CRC64":0},{"Index":82,"Start":956154358,"End":967814776,"Offset":0,"CRC64":0},{"Index":83,"Start":967814777,"End":979475195,"Offset":0,"CRC64":0},{"Index":84,"Start":979475196,"End":991135614,"Offset":0,"CRC64":0},{"Index":85,"Start":991135615,"End":1002796033,"Offset":0,"CRC64":0},{"Index":86,"Start":1002796034,"End":1014456452,"Offset":0,"CRC64":0},{"Index":87,"Start":1014456453,"End":1026116871,"Offset":0,"CRC64":0},{"Index":88,"Start":1026116872,"End":1037777290,"Offset":0,"CRC64":0},{"Index":89,"Start":1037777291,"End":1049437709,"Offset":0,"CRC64":0},{"Index":90,"Start":1049437710,"End":1061098128,"Offset":0,"CRC64":0},{"Index":91,"Start":1061098129,"End":1072758547,"Offset":0,"CRC64":0},{"Index":92,"Start":1072758548,"End":1084418966,"Offset":0,"CRC64":0},{"Index":93,"Start":1084418967,"End":
1096079385,"Offset":0,"CRC64":0},{"Index":94,"Start":1096079386,"End":1107739804,"Offset":0,"CRC64":0},{"Index":95,"Start":1107739805,"End":1119400223,"Offset":0,"CRC64":0},{"Index":96,"Start":1119400224,"End":1131060642,"Offset":0,"CRC64":0},{"Index":97,"Start":1131060643,"End":1142721061,"Offset":0,"CRC64":0},{"Index":98,"Start":1142721062,"End":1154381480,"Offset":0,"CRC64":0},{"Index":99,"Start":1154381481,"End":1166041899,"Offset":0,"CRC64":0},{"Index":100,"Start":1166041900,"End":1177702318,"Offset":0,"CRC64":0},{"Index":101,"Start":1177702319,"End":1189362737,"Offset":0,"CRC64":0},{"Index":102,"Start":1189362738,"End":1201023156,"Offset":0,"CRC64":0},{"Index":103,"Start":1201023157,"End":1212683575,"Offset":0,"CRC64":0},{"Index":104,"Start":1212683576,"End":1224343994,"Offset":0,"CRC64":0},{"Index":105,"Start":1224343995,"End":1236004413,"Offset":0,"CRC64":0},{"Index":106,"Start":1236004414,"End":1247664832,"Offset":0,"CRC64":0},{"Index":107,"Start":1247664833,"End":1259325251,"Offset":0,"CRC64":0},{"Index":108,"Start":1259325252,"End":1270985670,"Offset":0,"CRC64":0},{"Index":109,"Start":1270985671,"End":1282646089,"Offset":0,"CRC64":0},{"Index":110,"Start":1282646090,"End":1294306508,"Offset":0,"CRC64":0},{"Index":111,"Start":1294306509,"End":1305966927,"Offset":0,"CRC64":0},{"Index":112,"Start":1305966928,"End":1317627346,"Offset":0,"CRC64":0},{"Index":113,"Start":1317627347,"End":1329287765,"Offset":0,"CRC64":0},{"Index":114,"Start":1329287766,"End":1340948184,"Offset":0,"CRC64":0},{"Index":115,"Start":1340948185,"End":1352608603,"Offset":0,"CRC64":0},{"Index":116,"Start":1352608604,"End":1364269022,"Offset":0,"CRC64":0},{"Index":117,"Start":1364269023,"End":1375929441,"Offset":0,"CRC64":0},{"Index":118,"Start":1375929442,"End":1387589860,"Offset":0,"CRC64":0},{"Index":119,"Start":1387589861,"End":1399250279,"Offset":0,"CRC64":0},{"Index":120,"Start":1399250280,"End":1410910698,"Offset":0,"CRC64":0},{"Index":121,"Start":1410910699,"End":1422571117,"Offset
":0,"CRC64":0},{"Index":122,"Start":1422571118,"End":1434231536,"Offset":0,"CRC64":0},{"Index":123,"Start":1434231537,"End":1445891955,"Offset":0,"CRC64":0},{"Index":124,"Start":1445891956,"End":1457552374,"Offset":0,"CRC64":0},{"Index":125,"Start":1457552375,"End":1469212793,"Offset":0,"CRC64":0},{"Index":126,"Start":1469212794,"End":1480873212,"Offset":0,"CRC64":0},{"Index":127,"Start":1480873213,"End":1492533631,"Offset":0,"CRC64":0},{"Index":128,"Start":1492533632,"End":1504194050,"Offset":0,"CRC64":0},{"Index":129,"Start":1504194051,"End":1515854469,"Offset":0,"CRC64":0},{"Index":130,"Start":1515854470,"End":1527514888,"Offset":0,"CRC64":0},{"Index":131,"Start":1527514889,"End":1539175307,"Offset":0,"CRC64":0},{"Index":132,"Start":1539175308,"End":1550835726,"Offset":0,"CRC64":0},{"Index":133,"Start":1550835727,"End":1562496145,"Offset":0,"CRC64":0},{"Index":134,"Start":1562496146,"End":1574156564,"Offset":0,"CRC64":0},{"Index":135,"Start":1574156565,"End":1585816983,"Offset":0,"CRC64":0},{"Index":136,"Start":1585816984,"End":1597477402,"Offset":0,"CRC64":0},{"Index":137,"Start":1597477403,"End":1609137821,"Offset":0,"CRC64":0},{"Index":138,"Start":1609137822,"End":1620798240,"Offset":0,"CRC64":0},{"Index":139,"Start":1620798241,"End":1632458659,"Offset":0,"CRC64":0},{"Index":140,"Start":1632458660,"End":1644119078,"Offset":0,"CRC64":0},{"Index":141,"Start":1644119079,"End":1655779497,"Offset":0,"CRC64":0},{"Index":142,"Start":1655779498,"End":1667439916,"Offset":0,"CRC64":0},{"Index":143,"Start":1667439917,"End":1679100335,"Offset":0,"CRC64":0},{"Index":144,"Start":1679100336,"End":1690760754,"Offset":0,"CRC64":0},{"Index":145,"Start":1690760755,"End":1702421173,"Offset":0,"CRC64":0},{"Index":146,"Start":1702421174,"End":1714081592,"Offset":0,"CRC64":0},{"Index":147,"Start":1714081593,"End":1725742011,"Offset":0,"CRC64":0},{"Index":148,"Start":1725742012,"End":1737402430,"Offset":0,"CRC64":0},{"Index":149,"Start":1737402431,"End":1749062849,"Offset":0,"CRC64":
0},{"Index":150,"Start":1749062850,"End":1760723268,"Offset":0,"CRC64":0},{"Index":151,"Start":1760723269,"End":1772383687,"Offset":0,"CRC64":0},{"Index":152,"Start":1772383688,"End":1784044106,"Offset":0,"CRC64":0},{"Index":153,"Start":1784044107,"End":1795704525,"Offset":0,"CRC64":0},{"Index":154,"Start":1795704526,"End":1807364944,"Offset":0,"CRC64":0},{"Index":155,"Start":1807364945,"End":1819025363,"Offset":0,"CRC64":0},{"Index":156,"Start":1819025364,"End":1830685782,"Offset":0,"CRC64":0},{"Index":157,"Start":1830685783,"End":1842346201,"Offset":0,"CRC64":0},{"Index":158,"Start":1842346202,"End":1854006620,"Offset":0,"CRC64":0},{"Index":159,"Start":1854006621,"End":1865667039,"Offset":0,"CRC64":0},{"Index":160,"Start":1865667040,"End":1877327458,"Offset":0,"CRC64":0},{"Index":161,"Start":1877327459,"End":1888987877,"Offset":0,"CRC64":0},{"Index":162,"Start":1888987878,"End":1900648296,"Offset":0,"CRC64":0},{"Index":163,"Start":1900648297,"End":1912308715,"Offset":0,"CRC64":0},{"Index":164,"Start":1912308716,"End":1923969134,"Offset":0,"CRC64":0},{"Index":165,"Start":1923969135,"End":1935629553,"Offset":0,"CRC64":0},{"Index":166,"Start":1935629554,"End":1947289972,"Offset":0,"CRC64":0},{"Index":167,"Start":1947289973,"End":1958950391,"Offset":0,"CRC64":0},{"Index":168,"Start":1958950392,"End":1970610810,"Offset":0,"CRC64":0},{"Index":169,"Start":1970610811,"End":1982271229,"Offset":0,"CRC64":0},{"Index":170,"Start":1982271230,"End":1993931648,"Offset":0,"CRC64":0},{"Index":171,"Start":1993931649,"End":2005592067,"Offset":0,"CRC64":0},{"Index":172,"Start":2005592068,"End":2017252486,"Offset":0,"CRC64":0},{"Index":173,"Start":2017252487,"End":2028912905,"Offset":0,"CRC64":0},{"Index":174,"Start":2028912906,"End":2040573324,"Offset":0,"CRC64":0},{"Index":175,"Start":2040573325,"End":2052233743,"Offset":0,"CRC64":0},{"Index":176,"Start":2052233744,"End":2063894162,"Offset":0,"CRC64":0},{"Index":177,"Start":2063894163,"End":2075554581,"Offset":0,"CRC64":0},{"Index":
178,"Start":2075554582,"End":2087215000,"Offset":0,"CRC64":0},{"Index":179,"Start":2087215001,"End":2098875419,"Offset":0,"CRC64":0},{"Index":180,"Start":2098875420,"End":2110535838,"Offset":0,"CRC64":0},{"Index":181,"Start":2110535839,"End":2122196257,"Offset":0,"CRC64":0},{"Index":182,"Start":2122196258,"End":2133856676,"Offset":0,"CRC64":0},{"Index":183,"Start":2133856677,"End":2145517095,"Offset":0,"CRC64":0},{"Index":184,"Start":2145517096,"End":2157177514,"Offset":0,"CRC64":0},{"Index":185,"Start":2157177515,"End":2168837933,"Offset":0,"CRC64":0},{"Index":186,"Start":2168837934,"End":2180498352,"Offset":0,"CRC64":0},{"Index":187,"Start":2180498353,"End":2192158771,"Offset":0,"CRC64":0},{"Index":188,"Start":2192158772,"End":2203819190,"Offset":0,"CRC64":0},{"Index":189,"Start":2203819191,"End":2215479609,"Offset":0,"CRC64":0},{"Index":190,"Start":2215479610,"End":2227140028,"Offset":0,"CRC64":0},{"Index":191,"Start":2227140029,"End":2238800447,"Offset":0,"CRC64":0},{"Index":192,"Start":2238800448,"End":2250460866,"Offset":0,"CRC64":0},{"Index":193,"Start":2250460867,"End":2262121285,"Offset":0,"CRC64":0},{"Index":194,"Start":2262121286,"End":2273781704,"Offset":0,"CRC64":0},{"Index":195,"Start":2273781705,"End":2285442123,"Offset":0,"CRC64":0},{"Index":196,"Start":2285442124,"End":2297102542,"Offset":0,"CRC64":0},{"Index":197,"Start":2297102543,"End":2308762961,"Offset":0,"CRC64":0},{"Index":198,"Start":2308762962,"End":2320423380,"Offset":0,"CRC64":0},{"Index":199,"Start":2320423381,"End":2332083799,"Offset":0,"CRC64":0},{"Index":200,"Start":2332083800,"End":2343744218,"Offset":0,"CRC64":0},{"Index":201,"Start":2343744219,"End":2355404637,"Offset":0,"CRC64":0},{"Index":202,"Start":2355404638,"End":2367065056,"Offset":0,"CRC64":0},{"Index":203,"Start":2367065057,"End":2378725475,"Offset":0,"CRC64":0},{"Index":204,"Start":2378725476,"End":2390385894,"Offset":0,"CRC64":0},{"Index":205,"Start":2390385895,"End":2402046313,"Offset":0,"CRC64":0},{"Index":206,"Start":
2402046314,"End":2413706732,"Offset":0,"CRC64":0},{"Index":207,"Start":2413706733,"End":2425367151,"Offset":0,"CRC64":0},{"Index":208,"Start":2425367152,"End":2437027570,"Offset":0,"CRC64":0},{"Index":209,"Start":2437027571,"End":2448687989,"Offset":0,"CRC64":0},{"Index":210,"Start":2448687990,"End":2460348408,"Offset":0,"CRC64":0},{"Index":211,"Start":2460348409,"End":2472008827,"Offset":0,"CRC64":0},{"Index":212,"Start":2472008828,"End":2483669246,"Offset":0,"CRC64":0},{"Index":213,"Start":2483669247,"End":2495329665,"Offset":0,"CRC64":0},{"Index":214,"Start":2495329666,"End":2506990084,"Offset":0,"CRC64":0},{"Index":215,"Start":2506990085,"End":2518650503,"Offset":0,"CRC64":0},{"Index":216,"Start":2518650504,"End":2530310922,"Offset":0,"CRC64":0},{"Index":217,"Start":2530310923,"End":2541971341,"Offset":0,"CRC64":0},{"Index":218,"Start":2541971342,"End":2553631760,"Offset":0,"CRC64":0},{"Index":219,"Start":2553631761,"End":2565292179,"Offset":0,"CRC64":0},{"Index":220,"Start":2565292180,"End":2576952598,"Offset":0,"CRC64":0},{"Index":221,"Start":2576952599,"End":2588613017,"Offset":0,"CRC64":0},{"Index":222,"Start":2588613018,"End":2600273436,"Offset":0,"CRC64":0},{"Index":223,"Start":2600273437,"End":2611933855,"Offset":0,"CRC64":0},{"Index":224,"Start":2611933856,"End":2623594274,"Offset":0,"CRC64":0},{"Index":225,"Start":2623594275,"End":2635254693,"Offset":0,"CRC64":0},{"Index":226,"Start":2635254694,"End":2646915112,"Offset":0,"CRC64":0},{"Index":227,"Start":2646915113,"End":2658575531,"Offset":0,"CRC64":0},{"Index":228,"Start":2658575532,"End":2670235950,"Offset":0,"CRC64":0},{"Index":229,"Start":2670235951,"End":2681896369,"Offset":0,"CRC64":0},{"Index":230,"Start":2681896370,"End":2693556788,"Offset":0,"CRC64":0},{"Index":231,"Start":2693556789,"End":2705217207,"Offset":0,"CRC64":0},{"Index":232,"Start":2705217208,"End":2716877626,"Offset":0,"CRC64":0},{"Index":233,"Start":2716877627,"End":2728538045,"Offset":0,"CRC64":0},{"Index":234,"Start":2728538046,"
End":2740198464,"Offset":0,"CRC64":0},{"Index":235,"Start":2740198465,"End":2751858883,"Offset":0,"CRC64":0},{"Index":236,"Start":2751858884,"End":2763519302,"Offset":0,"CRC64":0},{"Index":237,"Start":2763519303,"End":2775179721,"Offset":0,"CRC64":0},{"Index":238,"Start":2775179722,"End":2786840140,"Offset":0,"CRC64":0},{"Index":239,"Start":2786840141,"End":2798500559,"Offset":0,"CRC64":0},{"Index":240,"Start":2798500560,"End":2810160978,"Offset":0,"CRC64":0},{"Index":241,"Start":2810160979,"End":2821821397,"Offset":0,"CRC64":0},{"Index":242,"Start":2821821398,"End":2833481816,"Offset":0,"CRC64":0},{"Index":243,"Start":2833481817,"End":2845142235,"Offset":0,"CRC64":0},{"Index":244,"Start":2845142236,"End":2856802654,"Offset":0,"CRC64":0},{"Index":245,"Start":2856802655,"End":2868463073,"Offset":0,"CRC64":0},{"Index":246,"Start":2868463074,"End":2880123492,"Offset":0,"CRC64":0},{"Index":247,"Start":2880123493,"End":2891783911,"Offset":0,"CRC64":0},{"Index":248,"Start":2891783912,"End":2903444330,"Offset":0,"CRC64":0},{"Index":249,"Start":2903444331,"End":2915104749,"Offset":0,"CRC64":0},{"Index":250,"Start":2915104750,"End":2926765168,"Offset":0,"CRC64":0},{"Index":251,"Start":2926765169,"End":2938425587,"Offset":0,"CRC64":0},{"Index":252,"Start":2938425588,"End":2950086006,"Offset":0,"CRC64":0},{"Index":253,"Start":2950086007,"End":2961746425,"Offset":0,"CRC64":0},{"Index":254,"Start":2961746426,"End":2973406844,"Offset":0,"CRC64":0},{"Index":255,"Start":2973406845,"End":2985067263,"Offset":0,"CRC64":0},{"Index":256,"Start":2985067264,"End":2996727682,"Offset":0,"CRC64":0},{"Index":257,"Start":2996727683,"End":3008388101,"Offset":0,"CRC64":0},{"Index":258,"Start":3008388102,"End":3020048520,"Offset":0,"CRC64":0},{"Index":259,"Start":3020048521,"End":3031708939,"Offset":0,"CRC64":0},{"Index":260,"Start":3031708940,"End":3043369358,"Offset":0,"CRC64":0},{"Index":261,"Start":3043369359,"End":3055029777,"Offset":0,"CRC64":0},{"Index":262,"Start":3055029778,"End":3066690
196,"Offset":0,"CRC64":0},{"Index":263,"Start":3066690197,"End":3078350615,"Offset":0,"CRC64":0},{"Index":264,"Start":3078350616,"End":3090011034,"Offset":0,"CRC64":0},{"Index":265,"Start":3090011035,"End":3101671453,"Offset":0,"CRC64":0},{"Index":266,"Start":3101671454,"End":3113331872,"Offset":0,"CRC64":0},{"Index":267,"Start":3113331873,"End":3124992291,"Offset":0,"CRC64":0},{"Index":268,"Start":3124992292,"End":3136652710,"Offset":0,"CRC64":0},{"Index":269,"Start":3136652711,"End":3148313129,"Offset":0,"CRC64":0},{"Index":270,"Start":3148313130,"End":3159973548,"Offset":0,"CRC64":0},{"Index":271,"Start":3159973549,"End":3171633967,"Offset":0,"CRC64":0},{"Index":272,"Start":3171633968,"End":3183294386,"Offset":0,"CRC64":0},{"Index":273,"Start":3183294387,"End":3194954805,"Offset":0,"CRC64":0},{"Index":274,"Start":3194954806,"End":3206615224,"Offset":0,"CRC64":0},{"Index":275,"Start":3206615225,"End":3218275643,"Offset":0,"CRC64":0},{"Index":276,"Start":3218275644,"End":3229936062,"Offset":0,"CRC64":0},{"Index":277,"Start":3229936063,"End":3241596481,"Offset":0,"CRC64":0},{"Index":278,"Start":3241596482,"End":3253256900,"Offset":0,"CRC64":0},{"Index":279,"Start":3253256901,"End":3264917319,"Offset":0,"CRC64":0},{"Index":280,"Start":3264917320,"End":3276577738,"Offset":0,"CRC64":0},{"Index":281,"Start":3276577739,"End":3288238157,"Offset":0,"CRC64":0},{"Index":282,"Start":3288238158,"End":3299898576,"Offset":0,"CRC64":0},{"Index":283,"Start":3299898577,"End":3311558995,"Offset":0,"CRC64":0},{"Index":284,"Start":3311558996,"End":3323219414,"Offset":0,"CRC64":0},{"Index":285,"Start":3323219415,"End":3334879833,"Offset":0,"CRC64":0},{"Index":286,"Start":3334879834,"End":3346540252,"Offset":0,"CRC64":0},{"Index":287,"Start":3346540253,"End":3358200671,"Offset":0,"CRC64":0},{"Index":288,"Start":3358200672,"End":3369861090,"Offset":0,"CRC64":0},{"Index":289,"Start":3369861091,"End":3381521509,"Offset":0,"CRC64":0},{"Index":290,"Start":3381521510,"End":3393181928,"Offset"
:0,"CRC64":0},{"Index":291,"Start":3393181929,"End":3404842347,"Offset":0,"CRC64":0},{"Index":292,"Start":3404842348,"End":3416502766,"Offset":0,"CRC64":0},{"Index":293,"Start":3416502767,"End":3428163185,"Offset":0,"CRC64":0},{"Index":294,"Start":3428163186,"End":3439823604,"Offset":0,"CRC64":0},{"Index":295,"Start":3439823605,"End":3451484023,"Offset":0,"CRC64":0},{"Index":296,"Start":3451484024,"End":3463144442,"Offset":0,"CRC64":0},{"Index":297,"Start":3463144443,"End":3474804861,"Offset":0,"CRC64":0},{"Index":298,"Start":3474804862,"End":3486465280,"Offset":0,"CRC64":0},{"Index":299,"Start":3486465281,"End":3498125699,"Offset":0,"CRC64":0},{"Index":300,"Start":3498125700,"End":3509786118,"Offset":0,"CRC64":0},{"Index":301,"Start":3509786119,"End":3521446537,"Offset":0,"CRC64":0},{"Index":302,"Start":3521446538,"End":3533106956,"Offset":0,"CRC64":0},{"Index":303,"Start":3533106957,"End":3544767375,"Offset":0,"CRC64":0},{"Index":304,"Start":3544767376,"End":3556427794,"Offset":0,"CRC64":0},{"Index":305,"Start":3556427795,"End":3568088213,"Offset":0,"CRC64":0},{"Index":306,"Start":3568088214,"End":3579748632,"Offset":0,"CRC64":0},{"Index":307,"Start":3579748633,"End":3591409051,"Offset":0,"CRC64":0},{"Index":308,"Start":3591409052,"End":3603069470,"Offset":0,"CRC64":0},{"Index":309,"Start":3603069471,"End":3614729889,"Offset":0,"CRC64":0},{"Index":310,"Start":3614729890,"End":3626390308,"Offset":0,"CRC64":0},{"Index":311,"Start":3626390309,"End":3638050727,"Offset":0,"CRC64":0},{"Index":312,"Start":3638050728,"End":3649711146,"Offset":0,"CRC64":0},{"Index":313,"Start":3649711147,"End":3661371565,"Offset":0,"CRC64":0},{"Index":314,"Start":3661371566,"End":3673031984,"Offset":0,"CRC64":0},{"Index":315,"Start":3673031985,"End":3684692403,"Offset":0,"CRC64":0},{"Index":316,"Start":3684692404,"End":3696352822,"Offset":0,"CRC64":0},{"Index":317,"Start":3696352823,"End":3708013241,"Offset":0,"CRC64":0},{"Index":318,"Start":3708013242,"End":3719673660,"Offset":0,"CRC64":0
},{"Index":319,"Start":3719673661,"End":3731334079,"Offset":0,"CRC64":0},{"Index":320,"Start":3731334080,"End":3742994498,"Offset":0,"CRC64":0},{"Index":321,"Start":3742994499,"End":3754654917,"Offset":0,"CRC64":0},{"Index":322,"Start":3754654918,"End":3766315336,"Offset":0,"CRC64":0},{"Index":323,"Start":3766315337,"End":3777975755,"Offset":0,"CRC64":0},{"Index":324,"Start":3777975756,"End":3789636174,"Offset":0,"CRC64":0},{"Index":325,"Start":3789636175,"End":3801296593,"Offset":0,"CRC64":0},{"Index":326,"Start":3801296594,"End":3812957012,"Offset":0,"CRC64":0},{"Index":327,"Start":3812957013,"End":3824617431,"Offset":0,"CRC64":0},{"Index":328,"Start":3824617432,"End":3836277850,"Offset":0,"CRC64":0},{"Index":329,"Start":3836277851,"End":3847938269,"Offset":0,"CRC64":0},{"Index":330,"Start":3847938270,"End":3859598688,"Offset":0,"CRC64":0},{"Index":331,"Start":3859598689,"End":3871259107,"Offset":0,"CRC64":0},{"Index":332,"Start":3871259108,"End":3882919526,"Offset":0,"CRC64":0},{"Index":333,"Start":3882919527,"End":3894579945,"Offset":0,"CRC64":0},{"Index":334,"Start":3894579946,"End":3906240364,"Offset":0,"CRC64":0},{"Index":335,"Start":3906240365,"End":3917900783,"Offset":0,"CRC64":0},{"Index":336,"Start":3917900784,"End":3929561202,"Offset":0,"CRC64":0},{"Index":337,"Start":3929561203,"End":3941221621,"Offset":0,"CRC64":0},{"Index":338,"Start":3941221622,"End":3952882040,"Offset":0,"CRC64":0},{"Index":339,"Start":3952882041,"End":3964542459,"Offset":0,"CRC64":0},{"Index":340,"Start":3964542460,"End":3976202878,"Offset":0,"CRC64":0},{"Index":341,"Start":3976202879,"End":3987863297,"Offset":0,"CRC64":0},{"Index":342,"Start":3987863298,"End":3999523716,"Offset":0,"CRC64":0},{"Index":343,"Start":3999523717,"End":4011184135,"Offset":0,"CRC64":0},{"Index":344,"Start":4011184136,"End":4022844554,"Offset":0,"CRC64":0},{"Index":345,"Start":4022844555,"End":4034504973,"Offset":0,"CRC64":0},{"Index":346,"Start":4034504974,"End":4046165392,"Offset":0,"CRC64":0},{"Index":3
47,"Start":4046165393,"End":4057825811,"Offset":0,"CRC64":0},{"Index":348,"Start":4057825812,"End":4069486230,"Offset":0,"CRC64":0},{"Index":349,"Start":4069486231,"End":4081146649,"Offset":0,"CRC64":0},{"Index":350,"Start":4081146650,"End":4092807068,"Offset":0,"CRC64":0},{"Index":351,"Start":4092807069,"End":4104467487,"Offset":0,"CRC64":0},{"Index":352,"Start":4104467488,"End":4116127906,"Offset":0,"CRC64":0},{"Index":353,"Start":4116127907,"End":4127788325,"Offset":0,"CRC64":0},{"Index":354,"Start":4127788326,"End":4139448744,"Offset":0,"CRC64":0},{"Index":355,"Start":4139448745,"End":4151109163,"Offset":0,"CRC64":0},{"Index":356,"Start":4151109164,"End":4162769582,"Offset":0,"CRC64":0},{"Index":357,"Start":4162769583,"End":4174430001,"Offset":0,"CRC64":0},{"Index":358,"Start":4174430002,"End":4186090420,"Offset":0,"CRC64":0},{"Index":359,"Start":4186090421,"End":4197750839,"Offset":0,"CRC64":0},{"Index":360,"Start":4197750840,"End":4209411258,"Offset":0,"CRC64":0},{"Index":361,"Start":4209411259,"End":4221071677,"Offset":0,"CRC64":0},{"Index":362,"Start":4221071678,"End":4232732096,"Offset":0,"CRC64":0},{"Index":363,"Start":4232732097,"End":4244392515,"Offset":0,"CRC64":0},{"Index":364,"Start":4244392516,"End":4256052934,"Offset":0,"CRC64":0},{"Index":365,"Start":4256052935,"End":4267713353,"Offset":0,"CRC64":0},{"Index":366,"Start":4267713354,"End":4279373772,"Offset":0,"CRC64":0},{"Index":367,"Start":4279373773,"End":4291034191,"Offset":0,"CRC64":0},{"Index":368,"Start":4291034192,"End":4302694610,"Offset":0,"CRC64":0},{"Index":369,"Start":4302694611,"End":4314355029,"Offset":0,"CRC64":0},{"Index":370,"Start":4314355030,"End":4326015448,"Offset":0,"CRC64":0},{"Index":371,"Start":4326015449,"End":4337675867,"Offset":0,"CRC64":0},{"Index":372,"Start":4337675868,"End":4349336286,"Offset":0,"CRC64":0},{"Index":373,"Start":4349336287,"End":4360996705,"Offset":0,"CRC64":0},{"Index":374,"Start":4360996706,"End":4372657124,"Offset":0,"CRC64":0},{"Index":375,"Start":4
372657125,"End":4384317543,"Offset":0,"CRC64":0},{"Index":376,"Start":4384317544,"End":4395977962,"Offset":0,"CRC64":0},{"Index":377,"Start":4395977963,"End":4407638381,"Offset":0,"CRC64":0},{"Index":378,"Start":4407638382,"End":4419298800,"Offset":0,"CRC64":0},{"Index":379,"Start":4419298801,"End":4430959219,"Offset":0,"CRC64":0},{"Index":380,"Start":4430959220,"End":4442619638,"Offset":0,"CRC64":0},{"Index":381,"Start":4442619639,"End":4454280057,"Offset":0,"CRC64":0},{"Index":382,"Start":4454280058,"End":4465940476,"Offset":0,"CRC64":0},{"Index":383,"Start":4465940477,"End":4477600895,"Offset":0,"CRC64":0},{"Index":384,"Start":4477600896,"End":4489261314,"Offset":0,"CRC64":0},{"Index":385,"Start":4489261315,"End":4500921733,"Offset":0,"CRC64":0},{"Index":386,"Start":4500921734,"End":4512582152,"Offset":0,"CRC64":0},{"Index":387,"Start":4512582153,"End":4524242571,"Offset":0,"CRC64":0},{"Index":388,"Start":4524242572,"End":4535902990,"Offset":0,"CRC64":0},{"Index":389,"Start":4535902991,"End":4547563409,"Offset":0,"CRC64":0},{"Index":390,"Start":4547563410,"End":4559223828,"Offset":0,"CRC64":0},{"Index":391,"Start":4559223829,"End":4570884247,"Offset":0,"CRC64":0},{"Index":392,"Start":4570884248,"End":4582544666,"Offset":0,"CRC64":0},{"Index":393,"Start":4582544667,"End":4594205085,"Offset":0,"CRC64":0},{"Index":394,"Start":4594205086,"End":4605865504,"Offset":0,"CRC64":0},{"Index":395,"Start":4605865505,"End":4617525923,"Offset":0,"CRC64":0},{"Index":396,"Start":4617525924,"End":4629186342,"Offset":0,"CRC64":0},{"Index":397,"Start":4629186343,"End":4640846761,"Offset":0,"CRC64":0},{"Index":398,"Start":4640846762,"End":4652507180,"Offset":0,"CRC64":0},{"Index":399,"Start":4652507181,"End":4664167375,"Offset":0,"CRC64":0}],"PartStat":[true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true
,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,true,false,true,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false,f
alse,false,false,false,false,false,false,false,false,false,false,false,false,false,false,false],"Start":0,"End":0,"CRC":6503938402276769276}
|
README.md
CHANGED
@@ -1,3 +1,59 @@
|
|
1 |
-
---
|
2 |
-
license:
|
3 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
license: other
|
3 |
+
base_model: /cpfs01/shared/public/lichengpeng.lcp/Llama-2-70b-hf
|
4 |
+
tags:
|
5 |
+
- llama-factory
|
6 |
+
- full
|
7 |
+
- generated_from_trainer
|
8 |
+
model-index:
|
9 |
+
- name: muggle70b
|
10 |
+
results: []
|
11 |
+
---
|
12 |
+
|
13 |
+
<!-- This model card has been generated automatically according to the information the Trainer had access to. You
|
14 |
+
should probably proofread and complete it, then remove this comment. -->
|
15 |
+
|
16 |
+
# muggle70b
|
17 |
+
|
18 |
+
This model is a fine-tuned version of Llama-2-70b-hf (loaded from the local checkpoint path `/cpfs01/shared/public/lichengpeng.lcp/Llama-2-70b-hf`) on the muggle dataset.
|
19 |
+
|
20 |
+
## Model description
|
21 |
+
|
22 |
+
More information needed
|
23 |
+
|
24 |
+
## Intended uses & limitations
|
25 |
+
|
26 |
+
More information needed
|
27 |
+
|
28 |
+
## Training and evaluation data
|
29 |
+
|
30 |
+
More information needed
|
31 |
+
|
32 |
+
## Training procedure
|
33 |
+
|
34 |
+
### Training hyperparameters
|
35 |
+
|
36 |
+
The following hyperparameters were used during training:
|
37 |
+
- learning_rate: 1e-05
|
38 |
+
- train_batch_size: 1
|
39 |
+
- eval_batch_size: 8
|
40 |
+
- seed: 42
|
41 |
+
- distributed_type: multi-GPU
|
42 |
+
- num_devices: 32
|
43 |
+
- gradient_accumulation_steps: 4
|
44 |
+
- total_train_batch_size: 128
|
45 |
+
- total_eval_batch_size: 256
|
46 |
+
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
47 |
+
- lr_scheduler_type: cosine
|
48 |
+
- num_epochs: 3.0
|
49 |
+
|
50 |
+
### Training results
|
51 |
+
|
52 |
+
|
53 |
+
|
54 |
+
### Framework versions
|
55 |
+
|
56 |
+
- Transformers 4.37.2
|
57 |
+
- Pytorch 2.1.0+cu118
|
58 |
+
- Datasets 2.17.1
|
59 |
+
- Tokenizers 0.15.2
|
all_results.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"epoch": 3.0,
|
3 |
+
"train_loss": 0.28055200490389104,
|
4 |
+
"train_runtime": 252630.326,
|
5 |
+
"train_samples_per_second": 5.482,
|
6 |
+
"train_steps_per_second": 0.043
|
7 |
+
}
|
config.json
ADDED
@@ -0,0 +1,29 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "/cpfs01/shared/public/lichengpeng.lcp/Llama-2-70b-hf",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 1,
|
9 |
+
"eos_token_id": 2,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 8192,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 28672,
|
14 |
+
"max_position_embeddings": 4096,
|
15 |
+
"model_type": "llama",
|
16 |
+
"num_attention_heads": 64,
|
17 |
+
"num_hidden_layers": 80,
|
18 |
+
"num_key_value_heads": 8,
|
19 |
+
"pad_token_id": 0,
|
20 |
+
"pretraining_tp": 1,
|
21 |
+
"rms_norm_eps": 1e-05,
|
22 |
+
"rope_scaling": null,
|
23 |
+
"rope_theta": 10000.0,
|
24 |
+
"tie_word_embeddings": false,
|
25 |
+
"torch_dtype": "bfloat16",
|
26 |
+
"transformers_version": "4.37.2",
|
27 |
+
"use_cache": false,
|
28 |
+
"vocab_size": 32000
|
29 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 1,
|
4 |
+
"eos_token_id": 2,
|
5 |
+
"pad_token_id": 0,
|
6 |
+
"transformers_version": "4.37.2"
|
7 |
+
}
|
model-00001-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37150054471fd1d5c3de4db158c902371cdb6627df798e5242d26cafda8c8660
|
3 |
+
size 4718660336
|
model-00002-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a84df8da003c3245464000ec5d1b1ebda3b99a747370f70806088d774e6163c1
|
3 |
+
size 4664167376
|
model-00003-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4967bb50b1a9d2991f962fea3c294881dea29702327af4983aff37a2b4949284
|
3 |
+
size 4999711704
|
model-00004-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b829b345e22579d54257261df9c0fd80d68c2d42fc16f38feb680c960707b8e0
|
3 |
+
size 4966157048
|
model-00005-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b0228323a8d8da569fb8a15376f61da2c849e517de42b876a88873392966701
|
3 |
+
size 4664134408
|
model-00006-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8d293e5d712b803c5a61c1541b9d59a8c3ca5e782832e5a69ce6ba73a61972d
|
3 |
+
size 4664167408
|
model-00007-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1396c1052d22ba39e67b8c432bd531e1bcbde94ae5feaf1f06f43dc55bb0fd2
|
3 |
+
size 4664167408
|
model-00008-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:beffa0b58e8edfea70a0c0d463ec46462968ac49a8ba0e49a1fb13d6c1b338ad
|
3 |
+
size 4999711728
|
model-00009-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6bd5b293c178df72f9a41a43b8213ed99a25c49160c1dbc2b0e57a53f3a4fd4
|
3 |
+
size 4966157056
|
model-00010-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e549b72be88b3b94ca71d03860c4801498ae9450aa9cdf2b74d0d21b9755c789
|
3 |
+
size 4664134408
|
model-00011-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b4dc650e63cdc0b0db976cdf1732944e3f84fc86335a948b93044ab363d580e
|
3 |
+
size 4664167408
|
model-00012-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:419e82872714cb006a1cf2547526e19dc5060e577b96f6afee1aa44738697f1a
|
3 |
+
size 4664167408
|
model-00013-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f802f2da884d6f47babcf6af3fe6c27280c65f01e8019728ea83097ca33d110
|
3 |
+
size 4999711728
|
model-00014-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0541c8b83b221263153b15e423abb7c87e2fe6dafc34398f5d0a143ed87d449
|
3 |
+
size 4966157056
|
model-00015-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93652283bfd06b688f9efd0cfc84f9cba05208279b23808ea4bf3344f3a80fcc
|
3 |
+
size 4664134408
|
model-00016-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4620e193359c029a09f4ebd72126492e154318efcdcaa94c234c6b11ffb55d09
|
3 |
+
size 4664167408
|
model-00017-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2fee5c4229dd472cdde30a77d975db3f0f7cdc6dbb0044ad9b921a7178c637a8
|
3 |
+
size 4664167408
|
model-00018-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:218d9284939eaa55344145d50d2ac52a3668d9e04b8454d6f2841cca208f9329
|
3 |
+
size 4999711728
|
model-00019-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e8b254230b03b09f541e7521bebec89e030988abec1527c03bce242cb7a79d6
|
3 |
+
size 4966157056
|
model-00020-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7297b5acc4c21941017886ce8f453116ccc382472d2b1077c8737e9c0560841f
|
3 |
+
size 4664134408
|
model-00021-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c0880541ff9cc4ee930f088b122ab365a7d44e3acf2d65d762a8deed136c8559
|
3 |
+
size 4664167408
|
model-00022-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:369a7661f1f773a6a8728df3df8ef91096146d25a1f4611bee377150850dfa21
|
3 |
+
size 4664167408
|
model-00023-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:56286d80760e689ab7444f64dd83fed9e0a63c455af23964abd40812b4ed72cc
|
3 |
+
size 4999711728
|
model-00024-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54a4fb6f6e78e78b1e03fbccb8c0a1f22f1ccfb136b89fbf5b5300ccb8e155a2
|
3 |
+
size 4966157056
|
model-00025-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f133749501a530456afe4a07e17f4438db21dadb7ac9488fb782e1363102c48
|
3 |
+
size 4664134408
|
model-00026-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a508720bf7d77fc57ec06c081c2e1c71fa7d371c30697eb6a7c1ff07ce4cad5e
|
3 |
+
size 4664167408
|
model-00027-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1dd386e5ea53727cdb2f07c1d5769482a9bb8adf3ed4a24893640fcb260cbfd4
|
3 |
+
size 4664167408
|
model-00028-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1d48a46ee53bf2c347b7ddad2c7c8d4997822790f54f5b70203fe0830cd48a7
|
3 |
+
size 4999711728
|
model-00029-of-00029.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3cc21f06062439803e1fa81060f92a840b242c6be64a11b6f213d11a0be6ab62
|
3 |
+
size 3779151784
|
model.safetensors.index.json
ADDED
@@ -0,0 +1,730 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"metadata": {
|
3 |
+
"total_size": 137953296384
|
4 |
+
},
|
5 |
+
"weight_map": {
|
6 |
+
"lm_head.weight": "model-00029-of-00029.safetensors",
|
7 |
+
"model.embed_tokens.weight": "model-00001-of-00029.safetensors",
|
8 |
+
"model.layers.0.input_layernorm.weight": "model-00001-of-00029.safetensors",
|
9 |
+
"model.layers.0.mlp.down_proj.weight": "model-00001-of-00029.safetensors",
|
10 |
+
"model.layers.0.mlp.gate_proj.weight": "model-00001-of-00029.safetensors",
|
11 |
+
"model.layers.0.mlp.up_proj.weight": "model-00001-of-00029.safetensors",
|
12 |
+
"model.layers.0.post_attention_layernorm.weight": "model-00001-of-00029.safetensors",
|
13 |
+
"model.layers.0.self_attn.k_proj.weight": "model-00001-of-00029.safetensors",
|
14 |
+
"model.layers.0.self_attn.o_proj.weight": "model-00001-of-00029.safetensors",
|
15 |
+
"model.layers.0.self_attn.q_proj.weight": "model-00001-of-00029.safetensors",
|
16 |
+
"model.layers.0.self_attn.v_proj.weight": "model-00001-of-00029.safetensors",
|
17 |
+
"model.layers.1.input_layernorm.weight": "model-00001-of-00029.safetensors",
|
18 |
+
"model.layers.1.mlp.down_proj.weight": "model-00001-of-00029.safetensors",
|
19 |
+
"model.layers.1.mlp.gate_proj.weight": "model-00001-of-00029.safetensors",
|
20 |
+
"model.layers.1.mlp.up_proj.weight": "model-00001-of-00029.safetensors",
|
21 |
+
"model.layers.1.post_attention_layernorm.weight": "model-00001-of-00029.safetensors",
|
22 |
+
"model.layers.1.self_attn.k_proj.weight": "model-00001-of-00029.safetensors",
|
23 |
+
"model.layers.1.self_attn.o_proj.weight": "model-00001-of-00029.safetensors",
|
24 |
+
"model.layers.1.self_attn.q_proj.weight": "model-00001-of-00029.safetensors",
|
25 |
+
"model.layers.1.self_attn.v_proj.weight": "model-00001-of-00029.safetensors",
|
26 |
+
"model.layers.10.input_layernorm.weight": "model-00004-of-00029.safetensors",
|
27 |
+
"model.layers.10.mlp.down_proj.weight": "model-00004-of-00029.safetensors",
|
28 |
+
"model.layers.10.mlp.gate_proj.weight": "model-00004-of-00029.safetensors",
|
29 |
+
"model.layers.10.mlp.up_proj.weight": "model-00004-of-00029.safetensors",
|
30 |
+
"model.layers.10.post_attention_layernorm.weight": "model-00004-of-00029.safetensors",
|
31 |
+
"model.layers.10.self_attn.k_proj.weight": "model-00004-of-00029.safetensors",
|
32 |
+
"model.layers.10.self_attn.o_proj.weight": "model-00004-of-00029.safetensors",
|
33 |
+
"model.layers.10.self_attn.q_proj.weight": "model-00004-of-00029.safetensors",
|
34 |
+
"model.layers.10.self_attn.v_proj.weight": "model-00004-of-00029.safetensors",
|
35 |
+
"model.layers.11.input_layernorm.weight": "model-00005-of-00029.safetensors",
|
36 |
+
"model.layers.11.mlp.down_proj.weight": "model-00005-of-00029.safetensors",
|
37 |
+
"model.layers.11.mlp.gate_proj.weight": "model-00005-of-00029.safetensors",
|
38 |
+
"model.layers.11.mlp.up_proj.weight": "model-00005-of-00029.safetensors",
|
39 |
+
"model.layers.11.post_attention_layernorm.weight": "model-00005-of-00029.safetensors",
|
40 |
+
"model.layers.11.self_attn.k_proj.weight": "model-00005-of-00029.safetensors",
|
41 |
+
"model.layers.11.self_attn.o_proj.weight": "model-00005-of-00029.safetensors",
|
42 |
+
"model.layers.11.self_attn.q_proj.weight": "model-00005-of-00029.safetensors",
|
43 |
+
"model.layers.11.self_attn.v_proj.weight": "model-00005-of-00029.safetensors",
|
44 |
+
"model.layers.12.input_layernorm.weight": "model-00005-of-00029.safetensors",
|
45 |
+
"model.layers.12.mlp.down_proj.weight": "model-00005-of-00029.safetensors",
|
46 |
+
"model.layers.12.mlp.gate_proj.weight": "model-00005-of-00029.safetensors",
|
47 |
+
"model.layers.12.mlp.up_proj.weight": "model-00005-of-00029.safetensors",
|
48 |
+
"model.layers.12.post_attention_layernorm.weight": "model-00005-of-00029.safetensors",
|
49 |
+
"model.layers.12.self_attn.k_proj.weight": "model-00005-of-00029.safetensors",
|
50 |
+
"model.layers.12.self_attn.o_proj.weight": "model-00005-of-00029.safetensors",
|
51 |
+
"model.layers.12.self_attn.q_proj.weight": "model-00005-of-00029.safetensors",
|
52 |
+
"model.layers.12.self_attn.v_proj.weight": "model-00005-of-00029.safetensors",
|
53 |
+
"model.layers.13.input_layernorm.weight": "model-00006-of-00029.safetensors",
|
54 |
+
"model.layers.13.mlp.down_proj.weight": "model-00006-of-00029.safetensors",
|
55 |
+
"model.layers.13.mlp.gate_proj.weight": "model-00005-of-00029.safetensors",
|
56 |
+
"model.layers.13.mlp.up_proj.weight": "model-00005-of-00029.safetensors",
|
57 |
+
"model.layers.13.post_attention_layernorm.weight": "model-00006-of-00029.safetensors",
|
58 |
+
"model.layers.13.self_attn.k_proj.weight": "model-00005-of-00029.safetensors",
|
59 |
+
"model.layers.13.self_attn.o_proj.weight": "model-00005-of-00029.safetensors",
|
60 |
+
"model.layers.13.self_attn.q_proj.weight": "model-00005-of-00029.safetensors",
|
61 |
+
"model.layers.13.self_attn.v_proj.weight": "model-00005-of-00029.safetensors",
|
62 |
+
"model.layers.14.input_layernorm.weight": "model-00006-of-00029.safetensors",
|
63 |
+
"model.layers.14.mlp.down_proj.weight": "model-00006-of-00029.safetensors",
|
64 |
+
"model.layers.14.mlp.gate_proj.weight": "model-00006-of-00029.safetensors",
|
65 |
+
"model.layers.14.mlp.up_proj.weight": "model-00006-of-00029.safetensors",
|
66 |
+
"model.layers.14.post_attention_layernorm.weight": "model-00006-of-00029.safetensors",
|
67 |
+
"model.layers.14.self_attn.k_proj.weight": "model-00006-of-00029.safetensors",
|
68 |
+
"model.layers.14.self_attn.o_proj.weight": "model-00006-of-00029.safetensors",
|
69 |
+
"model.layers.14.self_attn.q_proj.weight": "model-00006-of-00029.safetensors",
|
70 |
+
"model.layers.14.self_attn.v_proj.weight": "model-00006-of-00029.safetensors",
|
71 |
+
"model.layers.15.input_layernorm.weight": "model-00006-of-00029.safetensors",
|
72 |
+
"model.layers.15.mlp.down_proj.weight": "model-00006-of-00029.safetensors",
|
73 |
+
"model.layers.15.mlp.gate_proj.weight": "model-00006-of-00029.safetensors",
|
74 |
+
"model.layers.15.mlp.up_proj.weight": "model-00006-of-00029.safetensors",
|
75 |
+
"model.layers.15.post_attention_layernorm.weight": "model-00006-of-00029.safetensors",
|
76 |
+
"model.layers.15.self_attn.k_proj.weight": "model-00006-of-00029.safetensors",
|
77 |
+
"model.layers.15.self_attn.o_proj.weight": "model-00006-of-00029.safetensors",
|
78 |
+
"model.layers.15.self_attn.q_proj.weight": "model-00006-of-00029.safetensors",
|
79 |
+
"model.layers.15.self_attn.v_proj.weight": "model-00006-of-00029.safetensors",
|
80 |
+
"model.layers.16.input_layernorm.weight": "model-00007-of-00029.safetensors",
|
81 |
+
"model.layers.16.mlp.down_proj.weight": "model-00007-of-00029.safetensors",
|
82 |
+
"model.layers.16.mlp.gate_proj.weight": "model-00006-of-00029.safetensors",
|
83 |
+
"model.layers.16.mlp.up_proj.weight": "model-00007-of-00029.safetensors",
|
84 |
+
"model.layers.16.post_attention_layernorm.weight": "model-00007-of-00029.safetensors",
|
85 |
+
"model.layers.16.self_attn.k_proj.weight": "model-00006-of-00029.safetensors",
|
86 |
+
"model.layers.16.self_attn.o_proj.weight": "model-00006-of-00029.safetensors",
|
87 |
+
"model.layers.16.self_attn.q_proj.weight": "model-00006-of-00029.safetensors",
|
88 |
+
"model.layers.16.self_attn.v_proj.weight": "model-00006-of-00029.safetensors",
|
89 |
+
"model.layers.17.input_layernorm.weight": "model-00007-of-00029.safetensors",
|
90 |
+
"model.layers.17.mlp.down_proj.weight": "model-00007-of-00029.safetensors",
|
91 |
+
"model.layers.17.mlp.gate_proj.weight": "model-00007-of-00029.safetensors",
|
92 |
+
"model.layers.17.mlp.up_proj.weight": "model-00007-of-00029.safetensors",
|
93 |
+
"model.layers.17.post_attention_layernorm.weight": "model-00007-of-00029.safetensors",
|
94 |
+
"model.layers.17.self_attn.k_proj.weight": "model-00007-of-00029.safetensors",
|
95 |
+
"model.layers.17.self_attn.o_proj.weight": "model-00007-of-00029.safetensors",
|
96 |
+
"model.layers.17.self_attn.q_proj.weight": "model-00007-of-00029.safetensors",
|
97 |
+
"model.layers.17.self_attn.v_proj.weight": "model-00007-of-00029.safetensors",
|
98 |
+
"model.layers.18.input_layernorm.weight": "model-00007-of-00029.safetensors",
|
99 |
+
"model.layers.18.mlp.down_proj.weight": "model-00007-of-00029.safetensors",
|
100 |
+
"model.layers.18.mlp.gate_proj.weight": "model-00007-of-00029.safetensors",
|
101 |
+
"model.layers.18.mlp.up_proj.weight": "model-00007-of-00029.safetensors",
|
102 |
+
"model.layers.18.post_attention_layernorm.weight": "model-00007-of-00029.safetensors",
|
103 |
+
"model.layers.18.self_attn.k_proj.weight": "model-00007-of-00029.safetensors",
|
104 |
+
"model.layers.18.self_attn.o_proj.weight": "model-00007-of-00029.safetensors",
|
105 |
+
"model.layers.18.self_attn.q_proj.weight": "model-00007-of-00029.safetensors",
|
106 |
+
"model.layers.18.self_attn.v_proj.weight": "model-00007-of-00029.safetensors",
|
107 |
+
"model.layers.19.input_layernorm.weight": "model-00008-of-00029.safetensors",
|
108 |
+
"model.layers.19.mlp.down_proj.weight": "model-00008-of-00029.safetensors",
|
109 |
+
"model.layers.19.mlp.gate_proj.weight": "model-00008-of-00029.safetensors",
|
110 |
+
"model.layers.19.mlp.up_proj.weight": "model-00008-of-00029.safetensors",
|
111 |
+
"model.layers.19.post_attention_layernorm.weight": "model-00008-of-00029.safetensors",
|
112 |
+
"model.layers.19.self_attn.k_proj.weight": "model-00007-of-00029.safetensors",
|
113 |
+
"model.layers.19.self_attn.o_proj.weight": "model-00007-of-00029.safetensors",
|
114 |
+
"model.layers.19.self_attn.q_proj.weight": "model-00007-of-00029.safetensors",
|
115 |
+
"model.layers.19.self_attn.v_proj.weight": "model-00007-of-00029.safetensors",
|
116 |
+
"model.layers.2.input_layernorm.weight": "model-00002-of-00029.safetensors",
|
117 |
+
"model.layers.2.mlp.down_proj.weight": "model-00002-of-00029.safetensors",
|
118 |
+
"model.layers.2.mlp.gate_proj.weight": "model-00001-of-00029.safetensors",
|
119 |
+
"model.layers.2.mlp.up_proj.weight": "model-00002-of-00029.safetensors",
|
120 |
+
"model.layers.2.post_attention_layernorm.weight": "model-00002-of-00029.safetensors",
|
121 |
+
"model.layers.2.self_attn.k_proj.weight": "model-00001-of-00029.safetensors",
|
122 |
+
"model.layers.2.self_attn.o_proj.weight": "model-00001-of-00029.safetensors",
|
123 |
+
"model.layers.2.self_attn.q_proj.weight": "model-00001-of-00029.safetensors",
|
124 |
+
"model.layers.2.self_attn.v_proj.weight": "model-00001-of-00029.safetensors",
|
125 |
+
"model.layers.20.input_layernorm.weight": "model-00008-of-00029.safetensors",
|
126 |
+
"model.layers.20.mlp.down_proj.weight": "model-00008-of-00029.safetensors",
|
127 |
+
"model.layers.20.mlp.gate_proj.weight": "model-00008-of-00029.safetensors",
|
128 |
+
"model.layers.20.mlp.up_proj.weight": "model-00008-of-00029.safetensors",
|
129 |
+
"model.layers.20.post_attention_layernorm.weight": "model-00008-of-00029.safetensors",
|
130 |
+
"model.layers.20.self_attn.k_proj.weight": "model-00008-of-00029.safetensors",
|
131 |
+
"model.layers.20.self_attn.o_proj.weight": "model-00008-of-00029.safetensors",
|
132 |
+
"model.layers.20.self_attn.q_proj.weight": "model-00008-of-00029.safetensors",
|
133 |
+
"model.layers.20.self_attn.v_proj.weight": "model-00008-of-00029.safetensors",
|
134 |
+
"model.layers.21.input_layernorm.weight": "model-00008-of-00029.safetensors",
|
135 |
+
"model.layers.21.mlp.down_proj.weight": "model-00008-of-00029.safetensors",
|
136 |
+
"model.layers.21.mlp.gate_proj.weight": "model-00008-of-00029.safetensors",
|
137 |
+
"model.layers.21.mlp.up_proj.weight": "model-00008-of-00029.safetensors",
|
138 |
+
"model.layers.21.post_attention_layernorm.weight": "model-00008-of-00029.safetensors",
|
139 |
+
"model.layers.21.self_attn.k_proj.weight": "model-00008-of-00029.safetensors",
|
140 |
+
"model.layers.21.self_attn.o_proj.weight": "model-00008-of-00029.safetensors",
|
141 |
+
"model.layers.21.self_attn.q_proj.weight": "model-00008-of-00029.safetensors",
|
142 |
+
"model.layers.21.self_attn.v_proj.weight": "model-00008-of-00029.safetensors",
|
143 |
+
"model.layers.22.input_layernorm.weight": "model-00009-of-00029.safetensors",
|
144 |
+
"model.layers.22.mlp.down_proj.weight": "model-00009-of-00029.safetensors",
|
145 |
+
"model.layers.22.mlp.gate_proj.weight": "model-00009-of-00029.safetensors",
|
146 |
+
"model.layers.22.mlp.up_proj.weight": "model-00009-of-00029.safetensors",
|
147 |
+
"model.layers.22.post_attention_layernorm.weight": "model-00009-of-00029.safetensors",
|
148 |
+
"model.layers.22.self_attn.k_proj.weight": "model-00008-of-00029.safetensors",
|
149 |
+
"model.layers.22.self_attn.o_proj.weight": "model-00009-of-00029.safetensors",
|
150 |
+
"model.layers.22.self_attn.q_proj.weight": "model-00008-of-00029.safetensors",
|
151 |
+
"model.layers.22.self_attn.v_proj.weight": "model-00008-of-00029.safetensors",
|
152 |
+
"model.layers.23.input_layernorm.weight": "model-00009-of-00029.safetensors",
|
153 |
+
"model.layers.23.mlp.down_proj.weight": "model-00009-of-00029.safetensors",
|
154 |
+
"model.layers.23.mlp.gate_proj.weight": "model-00009-of-00029.safetensors",
|
155 |
+
"model.layers.23.mlp.up_proj.weight": "model-00009-of-00029.safetensors",
|
156 |
+
"model.layers.23.post_attention_layernorm.weight": "model-00009-of-00029.safetensors",
|
157 |
+
"model.layers.23.self_attn.k_proj.weight": "model-00009-of-00029.safetensors",
|
158 |
+
"model.layers.23.self_attn.o_proj.weight": "model-00009-of-00029.safetensors",
|
159 |
+
"model.layers.23.self_attn.q_proj.weight": "model-00009-of-00029.safetensors",
|
160 |
+
"model.layers.23.self_attn.v_proj.weight": "model-00009-of-00029.safetensors",
|
161 |
+
"model.layers.24.input_layernorm.weight": "model-00009-of-00029.safetensors",
|
162 |
+
"model.layers.24.mlp.down_proj.weight": "model-00009-of-00029.safetensors",
|
163 |
+
"model.layers.24.mlp.gate_proj.weight": "model-00009-of-00029.safetensors",
|
164 |
+
"model.layers.24.mlp.up_proj.weight": "model-00009-of-00029.safetensors",
|
165 |
+
"model.layers.24.post_attention_layernorm.weight": "model-00009-of-00029.safetensors",
|
166 |
+
"model.layers.24.self_attn.k_proj.weight": "model-00009-of-00029.safetensors",
|
167 |
+
"model.layers.24.self_attn.o_proj.weight": "model-00009-of-00029.safetensors",
|
168 |
+
"model.layers.24.self_attn.q_proj.weight": "model-00009-of-00029.safetensors",
|
169 |
+
"model.layers.24.self_attn.v_proj.weight": "model-00009-of-00029.safetensors",
|
170 |
+
"model.layers.25.input_layernorm.weight": "model-00010-of-00029.safetensors",
|
171 |
+
"model.layers.25.mlp.down_proj.weight": "model-00010-of-00029.safetensors",
|
172 |
+
"model.layers.25.mlp.gate_proj.weight": "model-00010-of-00029.safetensors",
|
173 |
+
"model.layers.25.mlp.up_proj.weight": "model-00010-of-00029.safetensors",
|
174 |
+
"model.layers.25.post_attention_layernorm.weight": "model-00010-of-00029.safetensors",
|
175 |
+
"model.layers.25.self_attn.k_proj.weight": "model-00010-of-00029.safetensors",
|
176 |
+
"model.layers.25.self_attn.o_proj.weight": "model-00010-of-00029.safetensors",
|
177 |
+
"model.layers.25.self_attn.q_proj.weight": "model-00010-of-00029.safetensors",
|
178 |
+
"model.layers.25.self_attn.v_proj.weight": "model-00010-of-00029.safetensors",
|
179 |
+
"model.layers.26.input_layernorm.weight": "model-00010-of-00029.safetensors",
|
180 |
+
"model.layers.26.mlp.down_proj.weight": "model-00010-of-00029.safetensors",
|
181 |
+
"model.layers.26.mlp.gate_proj.weight": "model-00010-of-00029.safetensors",
|
182 |
+
"model.layers.26.mlp.up_proj.weight": "model-00010-of-00029.safetensors",
|
183 |
+
"model.layers.26.post_attention_layernorm.weight": "model-00010-of-00029.safetensors",
|
184 |
+
"model.layers.26.self_attn.k_proj.weight": "model-00010-of-00029.safetensors",
|
185 |
+
"model.layers.26.self_attn.o_proj.weight": "model-00010-of-00029.safetensors",
|
186 |
+
"model.layers.26.self_attn.q_proj.weight": "model-00010-of-00029.safetensors",
|
187 |
+
"model.layers.26.self_attn.v_proj.weight": "model-00010-of-00029.safetensors",
|
188 |
+
"model.layers.27.input_layernorm.weight": "model-00011-of-00029.safetensors",
|
189 |
+
"model.layers.27.mlp.down_proj.weight": "model-00011-of-00029.safetensors",
|
190 |
+
"model.layers.27.mlp.gate_proj.weight": "model-00010-of-00029.safetensors",
|
191 |
+
"model.layers.27.mlp.up_proj.weight": "model-00010-of-00029.safetensors",
|
192 |
+
"model.layers.27.post_attention_layernorm.weight": "model-00011-of-00029.safetensors",
|
193 |
+
"model.layers.27.self_attn.k_proj.weight": "model-00010-of-00029.safetensors",
|
194 |
+
"model.layers.27.self_attn.o_proj.weight": "model-00010-of-00029.safetensors",
|
195 |
+
"model.layers.27.self_attn.q_proj.weight": "model-00010-of-00029.safetensors",
|
196 |
+
"model.layers.27.self_attn.v_proj.weight": "model-00010-of-00029.safetensors",
|
197 |
+
"model.layers.28.input_layernorm.weight": "model-00011-of-00029.safetensors",
|
198 |
+
"model.layers.28.mlp.down_proj.weight": "model-00011-of-00029.safetensors",
|
199 |
+
"model.layers.28.mlp.gate_proj.weight": "model-00011-of-00029.safetensors",
|
200 |
+
"model.layers.28.mlp.up_proj.weight": "model-00011-of-00029.safetensors",
|
201 |
+
"model.layers.28.post_attention_layernorm.weight": "model-00011-of-00029.safetensors",
|
202 |
+
"model.layers.28.self_attn.k_proj.weight": "model-00011-of-00029.safetensors",
|
203 |
+
"model.layers.28.self_attn.o_proj.weight": "model-00011-of-00029.safetensors",
|
204 |
+
"model.layers.28.self_attn.q_proj.weight": "model-00011-of-00029.safetensors",
|
205 |
+
"model.layers.28.self_attn.v_proj.weight": "model-00011-of-00029.safetensors",
|
206 |
+
"model.layers.29.input_layernorm.weight": "model-00011-of-00029.safetensors",
|
207 |
+
"model.layers.29.mlp.down_proj.weight": "model-00011-of-00029.safetensors",
|
208 |
+
"model.layers.29.mlp.gate_proj.weight": "model-00011-of-00029.safetensors",
|
209 |
+
"model.layers.29.mlp.up_proj.weight": "model-00011-of-00029.safetensors",
|
210 |
+
"model.layers.29.post_attention_layernorm.weight": "model-00011-of-00029.safetensors",
|
211 |
+
"model.layers.29.self_attn.k_proj.weight": "model-00011-of-00029.safetensors",
|
212 |
+
"model.layers.29.self_attn.o_proj.weight": "model-00011-of-00029.safetensors",
|
213 |
+
"model.layers.29.self_attn.q_proj.weight": "model-00011-of-00029.safetensors",
|
214 |
+
"model.layers.29.self_attn.v_proj.weight": "model-00011-of-00029.safetensors",
|
215 |
+
"model.layers.3.input_layernorm.weight": "model-00002-of-00029.safetensors",
|
216 |
+
"model.layers.3.mlp.down_proj.weight": "model-00002-of-00029.safetensors",
|
217 |
+
"model.layers.3.mlp.gate_proj.weight": "model-00002-of-00029.safetensors",
|
218 |
+
"model.layers.3.mlp.up_proj.weight": "model-00002-of-00029.safetensors",
|
219 |
+
"model.layers.3.post_attention_layernorm.weight": "model-00002-of-00029.safetensors",
|
220 |
+
"model.layers.3.self_attn.k_proj.weight": "model-00002-of-00029.safetensors",
|
221 |
+
"model.layers.3.self_attn.o_proj.weight": "model-00002-of-00029.safetensors",
|
222 |
+
"model.layers.3.self_attn.q_proj.weight": "model-00002-of-00029.safetensors",
|
223 |
+
"model.layers.3.self_attn.v_proj.weight": "model-00002-of-00029.safetensors",
|
224 |
+
"model.layers.30.input_layernorm.weight": "model-00012-of-00029.safetensors",
|
225 |
+
"model.layers.30.mlp.down_proj.weight": "model-00012-of-00029.safetensors",
|
226 |
+
"model.layers.30.mlp.gate_proj.weight": "model-00011-of-00029.safetensors",
|
227 |
+
"model.layers.30.mlp.up_proj.weight": "model-00012-of-00029.safetensors",
|
228 |
+
"model.layers.30.post_attention_layernorm.weight": "model-00012-of-00029.safetensors",
|
229 |
+
"model.layers.30.self_attn.k_proj.weight": "model-00011-of-00029.safetensors",
|
230 |
+
"model.layers.30.self_attn.o_proj.weight": "model-00011-of-00029.safetensors",
|
231 |
+
"model.layers.30.self_attn.q_proj.weight": "model-00011-of-00029.safetensors",
|
232 |
+
"model.layers.30.self_attn.v_proj.weight": "model-00011-of-00029.safetensors",
|
233 |
+
"model.layers.31.input_layernorm.weight": "model-00012-of-00029.safetensors",
|
234 |
+
"model.layers.31.mlp.down_proj.weight": "model-00012-of-00029.safetensors",
|
235 |
+
"model.layers.31.mlp.gate_proj.weight": "model-00012-of-00029.safetensors",
|
236 |
+
"model.layers.31.mlp.up_proj.weight": "model-00012-of-00029.safetensors",
|
237 |
+
"model.layers.31.post_attention_layernorm.weight": "model-00012-of-00029.safetensors",
|
238 |
+
"model.layers.31.self_attn.k_proj.weight": "model-00012-of-00029.safetensors",
|
239 |
+
"model.layers.31.self_attn.o_proj.weight": "model-00012-of-00029.safetensors",
|
240 |
+
"model.layers.31.self_attn.q_proj.weight": "model-00012-of-00029.safetensors",
|
241 |
+
"model.layers.31.self_attn.v_proj.weight": "model-00012-of-00029.safetensors",
|
242 |
+
"model.layers.32.input_layernorm.weight": "model-00012-of-00029.safetensors",
|
243 |
+
"model.layers.32.mlp.down_proj.weight": "model-00012-of-00029.safetensors",
|
244 |
+
"model.layers.32.mlp.gate_proj.weight": "model-00012-of-00029.safetensors",
|
245 |
+
"model.layers.32.mlp.up_proj.weight": "model-00012-of-00029.safetensors",
|
246 |
+
"model.layers.32.post_attention_layernorm.weight": "model-00012-of-00029.safetensors",
|
247 |
+
"model.layers.32.self_attn.k_proj.weight": "model-00012-of-00029.safetensors",
|
248 |
+
"model.layers.32.self_attn.o_proj.weight": "model-00012-of-00029.safetensors",
|
249 |
+
"model.layers.32.self_attn.q_proj.weight": "model-00012-of-00029.safetensors",
|
250 |
+
"model.layers.32.self_attn.v_proj.weight": "model-00012-of-00029.safetensors",
|
251 |
+
"model.layers.33.input_layernorm.weight": "model-00013-of-00029.safetensors",
|
252 |
+
"model.layers.33.mlp.down_proj.weight": "model-00013-of-00029.safetensors",
|
253 |
+
"model.layers.33.mlp.gate_proj.weight": "model-00013-of-00029.safetensors",
|
254 |
+
"model.layers.33.mlp.up_proj.weight": "model-00013-of-00029.safetensors",
|
255 |
+
"model.layers.33.post_attention_layernorm.weight": "model-00013-of-00029.safetensors",
|
256 |
+
"model.layers.33.self_attn.k_proj.weight": "model-00012-of-00029.safetensors",
|
257 |
+
"model.layers.33.self_attn.o_proj.weight": "model-00012-of-00029.safetensors",
|
258 |
+
"model.layers.33.self_attn.q_proj.weight": "model-00012-of-00029.safetensors",
|
259 |
+
"model.layers.33.self_attn.v_proj.weight": "model-00012-of-00029.safetensors",
|
260 |
+
"model.layers.34.input_layernorm.weight": "model-00013-of-00029.safetensors",
|
261 |
+
"model.layers.34.mlp.down_proj.weight": "model-00013-of-00029.safetensors",
|
262 |
+
"model.layers.34.mlp.gate_proj.weight": "model-00013-of-00029.safetensors",
|
263 |
+
"model.layers.34.mlp.up_proj.weight": "model-00013-of-00029.safetensors",
|
264 |
+
"model.layers.34.post_attention_layernorm.weight": "model-00013-of-00029.safetensors",
|
265 |
+
"model.layers.34.self_attn.k_proj.weight": "model-00013-of-00029.safetensors",
|
266 |
+
"model.layers.34.self_attn.o_proj.weight": "model-00013-of-00029.safetensors",
|
267 |
+
"model.layers.34.self_attn.q_proj.weight": "model-00013-of-00029.safetensors",
|
268 |
+
"model.layers.34.self_attn.v_proj.weight": "model-00013-of-00029.safetensors",
|
269 |
+
"model.layers.35.input_layernorm.weight": "model-00013-of-00029.safetensors",
|
270 |
+
"model.layers.35.mlp.down_proj.weight": "model-00013-of-00029.safetensors",
|
271 |
+
"model.layers.35.mlp.gate_proj.weight": "model-00013-of-00029.safetensors",
|
272 |
+
"model.layers.35.mlp.up_proj.weight": "model-00013-of-00029.safetensors",
|
273 |
+
"model.layers.35.post_attention_layernorm.weight": "model-00013-of-00029.safetensors",
|
274 |
+
"model.layers.35.self_attn.k_proj.weight": "model-00013-of-00029.safetensors",
|
275 |
+
"model.layers.35.self_attn.o_proj.weight": "model-00013-of-00029.safetensors",
|
276 |
+
"model.layers.35.self_attn.q_proj.weight": "model-00013-of-00029.safetensors",
|
277 |
+
"model.layers.35.self_attn.v_proj.weight": "model-00013-of-00029.safetensors",
|
278 |
+
"model.layers.36.input_layernorm.weight": "model-00014-of-00029.safetensors",
|
279 |
+
"model.layers.36.mlp.down_proj.weight": "model-00014-of-00029.safetensors",
|
280 |
+
"model.layers.36.mlp.gate_proj.weight": "model-00014-of-00029.safetensors",
|
281 |
+
"model.layers.36.mlp.up_proj.weight": "model-00014-of-00029.safetensors",
|
282 |
+
"model.layers.36.post_attention_layernorm.weight": "model-00014-of-00029.safetensors",
|
283 |
+
"model.layers.36.self_attn.k_proj.weight": "model-00013-of-00029.safetensors",
|
284 |
+
"model.layers.36.self_attn.o_proj.weight": "model-00014-of-00029.safetensors",
|
285 |
+
"model.layers.36.self_attn.q_proj.weight": "model-00013-of-00029.safetensors",
|
286 |
+
"model.layers.36.self_attn.v_proj.weight": "model-00013-of-00029.safetensors",
|
287 |
+
"model.layers.37.input_layernorm.weight": "model-00014-of-00029.safetensors",
|
288 |
+
"model.layers.37.mlp.down_proj.weight": "model-00014-of-00029.safetensors",
|
289 |
+
"model.layers.37.mlp.gate_proj.weight": "model-00014-of-00029.safetensors",
|
290 |
+
"model.layers.37.mlp.up_proj.weight": "model-00014-of-00029.safetensors",
|
291 |
+
"model.layers.37.post_attention_layernorm.weight": "model-00014-of-00029.safetensors",
|
292 |
+
"model.layers.37.self_attn.k_proj.weight": "model-00014-of-00029.safetensors",
|
293 |
+
"model.layers.37.self_attn.o_proj.weight": "model-00014-of-00029.safetensors",
|
294 |
+
"model.layers.37.self_attn.q_proj.weight": "model-00014-of-00029.safetensors",
|
295 |
+
"model.layers.37.self_attn.v_proj.weight": "model-00014-of-00029.safetensors",
|
296 |
+
"model.layers.38.input_layernorm.weight": "model-00014-of-00029.safetensors",
|
297 |
+
"model.layers.38.mlp.down_proj.weight": "model-00014-of-00029.safetensors",
|
298 |
+
"model.layers.38.mlp.gate_proj.weight": "model-00014-of-00029.safetensors",
|
299 |
+
"model.layers.38.mlp.up_proj.weight": "model-00014-of-00029.safetensors",
|
300 |
+
"model.layers.38.post_attention_layernorm.weight": "model-00014-of-00029.safetensors",
|
301 |
+
"model.layers.38.self_attn.k_proj.weight": "model-00014-of-00029.safetensors",
|
302 |
+
"model.layers.38.self_attn.o_proj.weight": "model-00014-of-00029.safetensors",
|
303 |
+
"model.layers.38.self_attn.q_proj.weight": "model-00014-of-00029.safetensors",
|
304 |
+
"model.layers.38.self_attn.v_proj.weight": "model-00014-of-00029.safetensors",
|
305 |
+
"model.layers.39.input_layernorm.weight": "model-00015-of-00029.safetensors",
|
306 |
+
"model.layers.39.mlp.down_proj.weight": "model-00015-of-00029.safetensors",
|
307 |
+
"model.layers.39.mlp.gate_proj.weight": "model-00015-of-00029.safetensors",
|
308 |
+
"model.layers.39.mlp.up_proj.weight": "model-00015-of-00029.safetensors",
|
309 |
+
"model.layers.39.post_attention_layernorm.weight": "model-00015-of-00029.safetensors",
|
310 |
+
"model.layers.39.self_attn.k_proj.weight": "model-00015-of-00029.safetensors",
|
311 |
+
"model.layers.39.self_attn.o_proj.weight": "model-00015-of-00029.safetensors",
|
312 |
+
"model.layers.39.self_attn.q_proj.weight": "model-00015-of-00029.safetensors",
|
313 |
+
"model.layers.39.self_attn.v_proj.weight": "model-00015-of-00029.safetensors",
|
314 |
+
"model.layers.4.input_layernorm.weight": "model-00002-of-00029.safetensors",
|
315 |
+
"model.layers.4.mlp.down_proj.weight": "model-00002-of-00029.safetensors",
|
316 |
+
"model.layers.4.mlp.gate_proj.weight": "model-00002-of-00029.safetensors",
|
317 |
+
"model.layers.4.mlp.up_proj.weight": "model-00002-of-00029.safetensors",
|
318 |
+
"model.layers.4.post_attention_layernorm.weight": "model-00002-of-00029.safetensors",
|
319 |
+
"model.layers.4.self_attn.k_proj.weight": "model-00002-of-00029.safetensors",
|
320 |
+
"model.layers.4.self_attn.o_proj.weight": "model-00002-of-00029.safetensors",
|
321 |
+
"model.layers.4.self_attn.q_proj.weight": "model-00002-of-00029.safetensors",
|
322 |
+
"model.layers.4.self_attn.v_proj.weight": "model-00002-of-00029.safetensors",
|
323 |
+
"model.layers.40.input_layernorm.weight": "model-00015-of-00029.safetensors",
|
324 |
+
"model.layers.40.mlp.down_proj.weight": "model-00015-of-00029.safetensors",
|
325 |
+
"model.layers.40.mlp.gate_proj.weight": "model-00015-of-00029.safetensors",
|
326 |
+
"model.layers.40.mlp.up_proj.weight": "model-00015-of-00029.safetensors",
|
327 |
+
"model.layers.40.post_attention_layernorm.weight": "model-00015-of-00029.safetensors",
|
328 |
+
"model.layers.40.self_attn.k_proj.weight": "model-00015-of-00029.safetensors",
|
329 |
+
"model.layers.40.self_attn.o_proj.weight": "model-00015-of-00029.safetensors",
|
330 |
+
"model.layers.40.self_attn.q_proj.weight": "model-00015-of-00029.safetensors",
|
331 |
+
"model.layers.40.self_attn.v_proj.weight": "model-00015-of-00029.safetensors",
|
332 |
+
"model.layers.41.input_layernorm.weight": "model-00016-of-00029.safetensors",
|
333 |
+
"model.layers.41.mlp.down_proj.weight": "model-00016-of-00029.safetensors",
|
334 |
+
"model.layers.41.mlp.gate_proj.weight": "model-00015-of-00029.safetensors",
|
335 |
+
"model.layers.41.mlp.up_proj.weight": "model-00015-of-00029.safetensors",
|
336 |
+
"model.layers.41.post_attention_layernorm.weight": "model-00016-of-00029.safetensors",
|
337 |
+
"model.layers.41.self_attn.k_proj.weight": "model-00015-of-00029.safetensors",
|
338 |
+
"model.layers.41.self_attn.o_proj.weight": "model-00015-of-00029.safetensors",
|
339 |
+
"model.layers.41.self_attn.q_proj.weight": "model-00015-of-00029.safetensors",
|
340 |
+
"model.layers.41.self_attn.v_proj.weight": "model-00015-of-00029.safetensors",
|
341 |
+
"model.layers.42.input_layernorm.weight": "model-00016-of-00029.safetensors",
|
342 |
+
"model.layers.42.mlp.down_proj.weight": "model-00016-of-00029.safetensors",
|
343 |
+
"model.layers.42.mlp.gate_proj.weight": "model-00016-of-00029.safetensors",
|
344 |
+
"model.layers.42.mlp.up_proj.weight": "model-00016-of-00029.safetensors",
|
345 |
+
"model.layers.42.post_attention_layernorm.weight": "model-00016-of-00029.safetensors",
|
346 |
+
"model.layers.42.self_attn.k_proj.weight": "model-00016-of-00029.safetensors",
|
347 |
+
"model.layers.42.self_attn.o_proj.weight": "model-00016-of-00029.safetensors",
|
348 |
+
"model.layers.42.self_attn.q_proj.weight": "model-00016-of-00029.safetensors",
|
349 |
+
"model.layers.42.self_attn.v_proj.weight": "model-00016-of-00029.safetensors",
|
350 |
+
"model.layers.43.input_layernorm.weight": "model-00016-of-00029.safetensors",
|
351 |
+
"model.layers.43.mlp.down_proj.weight": "model-00016-of-00029.safetensors",
|
352 |
+
"model.layers.43.mlp.gate_proj.weight": "model-00016-of-00029.safetensors",
|
353 |
+
"model.layers.43.mlp.up_proj.weight": "model-00016-of-00029.safetensors",
|
354 |
+
"model.layers.43.post_attention_layernorm.weight": "model-00016-of-00029.safetensors",
|
355 |
+
"model.layers.43.self_attn.k_proj.weight": "model-00016-of-00029.safetensors",
|
356 |
+
"model.layers.43.self_attn.o_proj.weight": "model-00016-of-00029.safetensors",
|
357 |
+
"model.layers.43.self_attn.q_proj.weight": "model-00016-of-00029.safetensors",
|
358 |
+
"model.layers.43.self_attn.v_proj.weight": "model-00016-of-00029.safetensors",
|
359 |
+
"model.layers.44.input_layernorm.weight": "model-00017-of-00029.safetensors",
|
360 |
+
"model.layers.44.mlp.down_proj.weight": "model-00017-of-00029.safetensors",
|
361 |
+
"model.layers.44.mlp.gate_proj.weight": "model-00016-of-00029.safetensors",
|
362 |
+
"model.layers.44.mlp.up_proj.weight": "model-00017-of-00029.safetensors",
|
363 |
+
"model.layers.44.post_attention_layernorm.weight": "model-00017-of-00029.safetensors",
|
364 |
+
"model.layers.44.self_attn.k_proj.weight": "model-00016-of-00029.safetensors",
|
365 |
+
"model.layers.44.self_attn.o_proj.weight": "model-00016-of-00029.safetensors",
|
366 |
+
"model.layers.44.self_attn.q_proj.weight": "model-00016-of-00029.safetensors",
|
367 |
+
"model.layers.44.self_attn.v_proj.weight": "model-00016-of-00029.safetensors",
|
368 |
+
"model.layers.45.input_layernorm.weight": "model-00017-of-00029.safetensors",
|
369 |
+
"model.layers.45.mlp.down_proj.weight": "model-00017-of-00029.safetensors",
|
370 |
+
"model.layers.45.mlp.gate_proj.weight": "model-00017-of-00029.safetensors",
|
371 |
+
"model.layers.45.mlp.up_proj.weight": "model-00017-of-00029.safetensors",
|
372 |
+
"model.layers.45.post_attention_layernorm.weight": "model-00017-of-00029.safetensors",
|
373 |
+
"model.layers.45.self_attn.k_proj.weight": "model-00017-of-00029.safetensors",
|
374 |
+
"model.layers.45.self_attn.o_proj.weight": "model-00017-of-00029.safetensors",
|
375 |
+
"model.layers.45.self_attn.q_proj.weight": "model-00017-of-00029.safetensors",
|
376 |
+
"model.layers.45.self_attn.v_proj.weight": "model-00017-of-00029.safetensors",
|
377 |
+
"model.layers.46.input_layernorm.weight": "model-00017-of-00029.safetensors",
|
378 |
+
"model.layers.46.mlp.down_proj.weight": "model-00017-of-00029.safetensors",
|
379 |
+
"model.layers.46.mlp.gate_proj.weight": "model-00017-of-00029.safetensors",
|
380 |
+
"model.layers.46.mlp.up_proj.weight": "model-00017-of-00029.safetensors",
|
381 |
+
"model.layers.46.post_attention_layernorm.weight": "model-00017-of-00029.safetensors",
|
382 |
+
"model.layers.46.self_attn.k_proj.weight": "model-00017-of-00029.safetensors",
|
383 |
+
"model.layers.46.self_attn.o_proj.weight": "model-00017-of-00029.safetensors",
|
384 |
+
"model.layers.46.self_attn.q_proj.weight": "model-00017-of-00029.safetensors",
|
385 |
+
"model.layers.46.self_attn.v_proj.weight": "model-00017-of-00029.safetensors",
|
386 |
+
"model.layers.47.input_layernorm.weight": "model-00018-of-00029.safetensors",
|
387 |
+
"model.layers.47.mlp.down_proj.weight": "model-00018-of-00029.safetensors",
|
388 |
+
"model.layers.47.mlp.gate_proj.weight": "model-00018-of-00029.safetensors",
|
389 |
+
"model.layers.47.mlp.up_proj.weight": "model-00018-of-00029.safetensors",
|
390 |
+
"model.layers.47.post_attention_layernorm.weight": "model-00018-of-00029.safetensors",
|
391 |
+
"model.layers.47.self_attn.k_proj.weight": "model-00017-of-00029.safetensors",
|
392 |
+
"model.layers.47.self_attn.o_proj.weight": "model-00017-of-00029.safetensors",
|
393 |
+
"model.layers.47.self_attn.q_proj.weight": "model-00017-of-00029.safetensors",
|
394 |
+
"model.layers.47.self_attn.v_proj.weight": "model-00017-of-00029.safetensors",
|
395 |
+
"model.layers.48.input_layernorm.weight": "model-00018-of-00029.safetensors",
|
396 |
+
"model.layers.48.mlp.down_proj.weight": "model-00018-of-00029.safetensors",
|
397 |
+
"model.layers.48.mlp.gate_proj.weight": "model-00018-of-00029.safetensors",
|
398 |
+
"model.layers.48.mlp.up_proj.weight": "model-00018-of-00029.safetensors",
|
399 |
+
"model.layers.48.post_attention_layernorm.weight": "model-00018-of-00029.safetensors",
|
400 |
+
"model.layers.48.self_attn.k_proj.weight": "model-00018-of-00029.safetensors",
|
401 |
+
"model.layers.48.self_attn.o_proj.weight": "model-00018-of-00029.safetensors",
|
402 |
+
"model.layers.48.self_attn.q_proj.weight": "model-00018-of-00029.safetensors",
|
403 |
+
"model.layers.48.self_attn.v_proj.weight": "model-00018-of-00029.safetensors",
|
404 |
+
"model.layers.49.input_layernorm.weight": "model-00018-of-00029.safetensors",
|
405 |
+
"model.layers.49.mlp.down_proj.weight": "model-00018-of-00029.safetensors",
|
406 |
+
"model.layers.49.mlp.gate_proj.weight": "model-00018-of-00029.safetensors",
|
407 |
+
"model.layers.49.mlp.up_proj.weight": "model-00018-of-00029.safetensors",
|
408 |
+
"model.layers.49.post_attention_layernorm.weight": "model-00018-of-00029.safetensors",
|
409 |
+
"model.layers.49.self_attn.k_proj.weight": "model-00018-of-00029.safetensors",
|
410 |
+
"model.layers.49.self_attn.o_proj.weight": "model-00018-of-00029.safetensors",
|
411 |
+
"model.layers.49.self_attn.q_proj.weight": "model-00018-of-00029.safetensors",
|
412 |
+
"model.layers.49.self_attn.v_proj.weight": "model-00018-of-00029.safetensors",
|
413 |
+
"model.layers.5.input_layernorm.weight": "model-00003-of-00029.safetensors",
|
414 |
+
"model.layers.5.mlp.down_proj.weight": "model-00003-of-00029.safetensors",
|
415 |
+
"model.layers.5.mlp.gate_proj.weight": "model-00003-of-00029.safetensors",
|
416 |
+
"model.layers.5.mlp.up_proj.weight": "model-00003-of-00029.safetensors",
|
417 |
+
"model.layers.5.post_attention_layernorm.weight": "model-00003-of-00029.safetensors",
|
418 |
+
"model.layers.5.self_attn.k_proj.weight": "model-00002-of-00029.safetensors",
|
419 |
+
"model.layers.5.self_attn.o_proj.weight": "model-00002-of-00029.safetensors",
|
420 |
+
"model.layers.5.self_attn.q_proj.weight": "model-00002-of-00029.safetensors",
|
421 |
+
"model.layers.5.self_attn.v_proj.weight": "model-00002-of-00029.safetensors",
|
422 |
+
"model.layers.50.input_layernorm.weight": "model-00019-of-00029.safetensors",
|
423 |
+
"model.layers.50.mlp.down_proj.weight": "model-00019-of-00029.safetensors",
|
424 |
+
"model.layers.50.mlp.gate_proj.weight": "model-00019-of-00029.safetensors",
|
425 |
+
"model.layers.50.mlp.up_proj.weight": "model-00019-of-00029.safetensors",
|
426 |
+
"model.layers.50.post_attention_layernorm.weight": "model-00019-of-00029.safetensors",
|
427 |
+
"model.layers.50.self_attn.k_proj.weight": "model-00018-of-00029.safetensors",
|
428 |
+
"model.layers.50.self_attn.o_proj.weight": "model-00019-of-00029.safetensors",
|
429 |
+
"model.layers.50.self_attn.q_proj.weight": "model-00018-of-00029.safetensors",
|
430 |
+
"model.layers.50.self_attn.v_proj.weight": "model-00018-of-00029.safetensors",
|
431 |
+
"model.layers.51.input_layernorm.weight": "model-00019-of-00029.safetensors",
|
432 |
+
"model.layers.51.mlp.down_proj.weight": "model-00019-of-00029.safetensors",
|
433 |
+
"model.layers.51.mlp.gate_proj.weight": "model-00019-of-00029.safetensors",
|
434 |
+
"model.layers.51.mlp.up_proj.weight": "model-00019-of-00029.safetensors",
|
435 |
+
"model.layers.51.post_attention_layernorm.weight": "model-00019-of-00029.safetensors",
|
436 |
+
"model.layers.51.self_attn.k_proj.weight": "model-00019-of-00029.safetensors",
|
437 |
+
"model.layers.51.self_attn.o_proj.weight": "model-00019-of-00029.safetensors",
|
438 |
+
"model.layers.51.self_attn.q_proj.weight": "model-00019-of-00029.safetensors",
|
439 |
+
"model.layers.51.self_attn.v_proj.weight": "model-00019-of-00029.safetensors",
|
440 |
+
"model.layers.52.input_layernorm.weight": "model-00019-of-00029.safetensors",
|
441 |
+
"model.layers.52.mlp.down_proj.weight": "model-00019-of-00029.safetensors",
|
442 |
+
"model.layers.52.mlp.gate_proj.weight": "model-00019-of-00029.safetensors",
|
443 |
+
"model.layers.52.mlp.up_proj.weight": "model-00019-of-00029.safetensors",
|
444 |
+
"model.layers.52.post_attention_layernorm.weight": "model-00019-of-00029.safetensors",
|
445 |
+
"model.layers.52.self_attn.k_proj.weight": "model-00019-of-00029.safetensors",
|
446 |
+
"model.layers.52.self_attn.o_proj.weight": "model-00019-of-00029.safetensors",
|
447 |
+
"model.layers.52.self_attn.q_proj.weight": "model-00019-of-00029.safetensors",
|
448 |
+
"model.layers.52.self_attn.v_proj.weight": "model-00019-of-00029.safetensors",
|
449 |
+
"model.layers.53.input_layernorm.weight": "model-00020-of-00029.safetensors",
|
450 |
+
"model.layers.53.mlp.down_proj.weight": "model-00020-of-00029.safetensors",
|
451 |
+
"model.layers.53.mlp.gate_proj.weight": "model-00020-of-00029.safetensors",
|
452 |
+
"model.layers.53.mlp.up_proj.weight": "model-00020-of-00029.safetensors",
|
453 |
+
"model.layers.53.post_attention_layernorm.weight": "model-00020-of-00029.safetensors",
|
454 |
+
"model.layers.53.self_attn.k_proj.weight": "model-00020-of-00029.safetensors",
|
455 |
+
"model.layers.53.self_attn.o_proj.weight": "model-00020-of-00029.safetensors",
|
456 |
+
"model.layers.53.self_attn.q_proj.weight": "model-00020-of-00029.safetensors",
|
457 |
+
"model.layers.53.self_attn.v_proj.weight": "model-00020-of-00029.safetensors",
|
458 |
+
"model.layers.54.input_layernorm.weight": "model-00020-of-00029.safetensors",
|
459 |
+
"model.layers.54.mlp.down_proj.weight": "model-00020-of-00029.safetensors",
|
460 |
+
"model.layers.54.mlp.gate_proj.weight": "model-00020-of-00029.safetensors",
|
461 |
+
"model.layers.54.mlp.up_proj.weight": "model-00020-of-00029.safetensors",
|
462 |
+
"model.layers.54.post_attention_layernorm.weight": "model-00020-of-00029.safetensors",
|
463 |
+
"model.layers.54.self_attn.k_proj.weight": "model-00020-of-00029.safetensors",
|
464 |
+
"model.layers.54.self_attn.o_proj.weight": "model-00020-of-00029.safetensors",
|
465 |
+
"model.layers.54.self_attn.q_proj.weight": "model-00020-of-00029.safetensors",
|
466 |
+
"model.layers.54.self_attn.v_proj.weight": "model-00020-of-00029.safetensors",
|
467 |
+
"model.layers.55.input_layernorm.weight": "model-00021-of-00029.safetensors",
|
468 |
+
"model.layers.55.mlp.down_proj.weight": "model-00021-of-00029.safetensors",
|
469 |
+
"model.layers.55.mlp.gate_proj.weight": "model-00020-of-00029.safetensors",
|
470 |
+
"model.layers.55.mlp.up_proj.weight": "model-00020-of-00029.safetensors",
|
471 |
+
"model.layers.55.post_attention_layernorm.weight": "model-00021-of-00029.safetensors",
|
472 |
+
"model.layers.55.self_attn.k_proj.weight": "model-00020-of-00029.safetensors",
|
473 |
+
"model.layers.55.self_attn.o_proj.weight": "model-00020-of-00029.safetensors",
|
474 |
+
"model.layers.55.self_attn.q_proj.weight": "model-00020-of-00029.safetensors",
|
475 |
+
"model.layers.55.self_attn.v_proj.weight": "model-00020-of-00029.safetensors",
|
476 |
+
"model.layers.56.input_layernorm.weight": "model-00021-of-00029.safetensors",
|
477 |
+
"model.layers.56.mlp.down_proj.weight": "model-00021-of-00029.safetensors",
|
478 |
+
"model.layers.56.mlp.gate_proj.weight": "model-00021-of-00029.safetensors",
|
479 |
+
"model.layers.56.mlp.up_proj.weight": "model-00021-of-00029.safetensors",
|
480 |
+
"model.layers.56.post_attention_layernorm.weight": "model-00021-of-00029.safetensors",
|
481 |
+
"model.layers.56.self_attn.k_proj.weight": "model-00021-of-00029.safetensors",
|
482 |
+
"model.layers.56.self_attn.o_proj.weight": "model-00021-of-00029.safetensors",
|
483 |
+
"model.layers.56.self_attn.q_proj.weight": "model-00021-of-00029.safetensors",
|
484 |
+
"model.layers.56.self_attn.v_proj.weight": "model-00021-of-00029.safetensors",
|
485 |
+
"model.layers.57.input_layernorm.weight": "model-00021-of-00029.safetensors",
|
486 |
+
"model.layers.57.mlp.down_proj.weight": "model-00021-of-00029.safetensors",
|
487 |
+
"model.layers.57.mlp.gate_proj.weight": "model-00021-of-00029.safetensors",
|
488 |
+
"model.layers.57.mlp.up_proj.weight": "model-00021-of-00029.safetensors",
|
489 |
+
"model.layers.57.post_attention_layernorm.weight": "model-00021-of-00029.safetensors",
|
490 |
+
"model.layers.57.self_attn.k_proj.weight": "model-00021-of-00029.safetensors",
|
491 |
+
"model.layers.57.self_attn.o_proj.weight": "model-00021-of-00029.safetensors",
|
492 |
+
"model.layers.57.self_attn.q_proj.weight": "model-00021-of-00029.safetensors",
|
493 |
+
"model.layers.57.self_attn.v_proj.weight": "model-00021-of-00029.safetensors",
|
494 |
+
"model.layers.58.input_layernorm.weight": "model-00022-of-00029.safetensors",
|
495 |
+
"model.layers.58.mlp.down_proj.weight": "model-00022-of-00029.safetensors",
|
496 |
+
"model.layers.58.mlp.gate_proj.weight": "model-00021-of-00029.safetensors",
|
497 |
+
"model.layers.58.mlp.up_proj.weight": "model-00022-of-00029.safetensors",
|
498 |
+
"model.layers.58.post_attention_layernorm.weight": "model-00022-of-00029.safetensors",
|
499 |
+
"model.layers.58.self_attn.k_proj.weight": "model-00021-of-00029.safetensors",
|
500 |
+
"model.layers.58.self_attn.o_proj.weight": "model-00021-of-00029.safetensors",
|
501 |
+
"model.layers.58.self_attn.q_proj.weight": "model-00021-of-00029.safetensors",
|
502 |
+
"model.layers.58.self_attn.v_proj.weight": "model-00021-of-00029.safetensors",
|
503 |
+
"model.layers.59.input_layernorm.weight": "model-00022-of-00029.safetensors",
|
504 |
+
"model.layers.59.mlp.down_proj.weight": "model-00022-of-00029.safetensors",
|
505 |
+
"model.layers.59.mlp.gate_proj.weight": "model-00022-of-00029.safetensors",
|
506 |
+
"model.layers.59.mlp.up_proj.weight": "model-00022-of-00029.safetensors",
|
507 |
+
"model.layers.59.post_attention_layernorm.weight": "model-00022-of-00029.safetensors",
|
508 |
+
"model.layers.59.self_attn.k_proj.weight": "model-00022-of-00029.safetensors",
|
509 |
+
"model.layers.59.self_attn.o_proj.weight": "model-00022-of-00029.safetensors",
|
510 |
+
"model.layers.59.self_attn.q_proj.weight": "model-00022-of-00029.safetensors",
|
511 |
+
"model.layers.59.self_attn.v_proj.weight": "model-00022-of-00029.safetensors",
|
512 |
+
"model.layers.6.input_layernorm.weight": "model-00003-of-00029.safetensors",
|
513 |
+
"model.layers.6.mlp.down_proj.weight": "model-00003-of-00029.safetensors",
|
514 |
+
"model.layers.6.mlp.gate_proj.weight": "model-00003-of-00029.safetensors",
|
515 |
+
"model.layers.6.mlp.up_proj.weight": "model-00003-of-00029.safetensors",
|
516 |
+
"model.layers.6.post_attention_layernorm.weight": "model-00003-of-00029.safetensors",
|
517 |
+
"model.layers.6.self_attn.k_proj.weight": "model-00003-of-00029.safetensors",
|
518 |
+
"model.layers.6.self_attn.o_proj.weight": "model-00003-of-00029.safetensors",
|
519 |
+
"model.layers.6.self_attn.q_proj.weight": "model-00003-of-00029.safetensors",
|
520 |
+
"model.layers.6.self_attn.v_proj.weight": "model-00003-of-00029.safetensors",
|
521 |
+
"model.layers.60.input_layernorm.weight": "model-00022-of-00029.safetensors",
|
522 |
+
"model.layers.60.mlp.down_proj.weight": "model-00022-of-00029.safetensors",
|
523 |
+
"model.layers.60.mlp.gate_proj.weight": "model-00022-of-00029.safetensors",
|
524 |
+
"model.layers.60.mlp.up_proj.weight": "model-00022-of-00029.safetensors",
|
525 |
+
"model.layers.60.post_attention_layernorm.weight": "model-00022-of-00029.safetensors",
|
526 |
+
"model.layers.60.self_attn.k_proj.weight": "model-00022-of-00029.safetensors",
|
527 |
+
"model.layers.60.self_attn.o_proj.weight": "model-00022-of-00029.safetensors",
|
528 |
+
"model.layers.60.self_attn.q_proj.weight": "model-00022-of-00029.safetensors",
|
529 |
+
"model.layers.60.self_attn.v_proj.weight": "model-00022-of-00029.safetensors",
|
530 |
+
"model.layers.61.input_layernorm.weight": "model-00023-of-00029.safetensors",
|
531 |
+
"model.layers.61.mlp.down_proj.weight": "model-00023-of-00029.safetensors",
|
532 |
+
"model.layers.61.mlp.gate_proj.weight": "model-00023-of-00029.safetensors",
|
533 |
+
"model.layers.61.mlp.up_proj.weight": "model-00023-of-00029.safetensors",
|
534 |
+
"model.layers.61.post_attention_layernorm.weight": "model-00023-of-00029.safetensors",
|
535 |
+
"model.layers.61.self_attn.k_proj.weight": "model-00022-of-00029.safetensors",
|
536 |
+
"model.layers.61.self_attn.o_proj.weight": "model-00022-of-00029.safetensors",
|
537 |
+
"model.layers.61.self_attn.q_proj.weight": "model-00022-of-00029.safetensors",
|
538 |
+
"model.layers.61.self_attn.v_proj.weight": "model-00022-of-00029.safetensors",
|
539 |
+
"model.layers.62.input_layernorm.weight": "model-00023-of-00029.safetensors",
|
540 |
+
"model.layers.62.mlp.down_proj.weight": "model-00023-of-00029.safetensors",
|
541 |
+
"model.layers.62.mlp.gate_proj.weight": "model-00023-of-00029.safetensors",
|
542 |
+
"model.layers.62.mlp.up_proj.weight": "model-00023-of-00029.safetensors",
|
543 |
+
"model.layers.62.post_attention_layernorm.weight": "model-00023-of-00029.safetensors",
|
544 |
+
"model.layers.62.self_attn.k_proj.weight": "model-00023-of-00029.safetensors",
|
545 |
+
"model.layers.62.self_attn.o_proj.weight": "model-00023-of-00029.safetensors",
|
546 |
+
"model.layers.62.self_attn.q_proj.weight": "model-00023-of-00029.safetensors",
|
547 |
+
"model.layers.62.self_attn.v_proj.weight": "model-00023-of-00029.safetensors",
|
548 |
+
"model.layers.63.input_layernorm.weight": "model-00023-of-00029.safetensors",
|
549 |
+
"model.layers.63.mlp.down_proj.weight": "model-00023-of-00029.safetensors",
|
550 |
+
"model.layers.63.mlp.gate_proj.weight": "model-00023-of-00029.safetensors",
|
551 |
+
"model.layers.63.mlp.up_proj.weight": "model-00023-of-00029.safetensors",
|
552 |
+
"model.layers.63.post_attention_layernorm.weight": "model-00023-of-00029.safetensors",
|
553 |
+
"model.layers.63.self_attn.k_proj.weight": "model-00023-of-00029.safetensors",
|
554 |
+
"model.layers.63.self_attn.o_proj.weight": "model-00023-of-00029.safetensors",
|
555 |
+
"model.layers.63.self_attn.q_proj.weight": "model-00023-of-00029.safetensors",
|
556 |
+
"model.layers.63.self_attn.v_proj.weight": "model-00023-of-00029.safetensors",
|
557 |
+
"model.layers.64.input_layernorm.weight": "model-00024-of-00029.safetensors",
|
558 |
+
"model.layers.64.mlp.down_proj.weight": "model-00024-of-00029.safetensors",
|
559 |
+
"model.layers.64.mlp.gate_proj.weight": "model-00024-of-00029.safetensors",
|
560 |
+
"model.layers.64.mlp.up_proj.weight": "model-00024-of-00029.safetensors",
|
561 |
+
"model.layers.64.post_attention_layernorm.weight": "model-00024-of-00029.safetensors",
|
562 |
+
"model.layers.64.self_attn.k_proj.weight": "model-00023-of-00029.safetensors",
|
563 |
+
"model.layers.64.self_attn.o_proj.weight": "model-00024-of-00029.safetensors",
|
564 |
+
"model.layers.64.self_attn.q_proj.weight": "model-00023-of-00029.safetensors",
|
565 |
+
"model.layers.64.self_attn.v_proj.weight": "model-00023-of-00029.safetensors",
|
566 |
+
"model.layers.65.input_layernorm.weight": "model-00024-of-00029.safetensors",
|
567 |
+
"model.layers.65.mlp.down_proj.weight": "model-00024-of-00029.safetensors",
|
568 |
+
"model.layers.65.mlp.gate_proj.weight": "model-00024-of-00029.safetensors",
|
569 |
+
"model.layers.65.mlp.up_proj.weight": "model-00024-of-00029.safetensors",
|
570 |
+
"model.layers.65.post_attention_layernorm.weight": "model-00024-of-00029.safetensors",
|
571 |
+
"model.layers.65.self_attn.k_proj.weight": "model-00024-of-00029.safetensors",
|
572 |
+
"model.layers.65.self_attn.o_proj.weight": "model-00024-of-00029.safetensors",
|
573 |
+
"model.layers.65.self_attn.q_proj.weight": "model-00024-of-00029.safetensors",
|
574 |
+
"model.layers.65.self_attn.v_proj.weight": "model-00024-of-00029.safetensors",
|
575 |
+
"model.layers.66.input_layernorm.weight": "model-00024-of-00029.safetensors",
|
576 |
+
"model.layers.66.mlp.down_proj.weight": "model-00024-of-00029.safetensors",
|
577 |
+
"model.layers.66.mlp.gate_proj.weight": "model-00024-of-00029.safetensors",
|
578 |
+
"model.layers.66.mlp.up_proj.weight": "model-00024-of-00029.safetensors",
|
579 |
+
"model.layers.66.post_attention_layernorm.weight": "model-00024-of-00029.safetensors",
|
580 |
+
"model.layers.66.self_attn.k_proj.weight": "model-00024-of-00029.safetensors",
|
581 |
+
"model.layers.66.self_attn.o_proj.weight": "model-00024-of-00029.safetensors",
|
582 |
+
"model.layers.66.self_attn.q_proj.weight": "model-00024-of-00029.safetensors",
|
583 |
+
"model.layers.66.self_attn.v_proj.weight": "model-00024-of-00029.safetensors",
|
584 |
+
"model.layers.67.input_layernorm.weight": "model-00025-of-00029.safetensors",
|
585 |
+
"model.layers.67.mlp.down_proj.weight": "model-00025-of-00029.safetensors",
|
586 |
+
"model.layers.67.mlp.gate_proj.weight": "model-00025-of-00029.safetensors",
|
587 |
+
"model.layers.67.mlp.up_proj.weight": "model-00025-of-00029.safetensors",
|
588 |
+
"model.layers.67.post_attention_layernorm.weight": "model-00025-of-00029.safetensors",
|
589 |
+
"model.layers.67.self_attn.k_proj.weight": "model-00025-of-00029.safetensors",
|
590 |
+
"model.layers.67.self_attn.o_proj.weight": "model-00025-of-00029.safetensors",
|
591 |
+
"model.layers.67.self_attn.q_proj.weight": "model-00025-of-00029.safetensors",
|
592 |
+
"model.layers.67.self_attn.v_proj.weight": "model-00025-of-00029.safetensors",
|
593 |
+
"model.layers.68.input_layernorm.weight": "model-00025-of-00029.safetensors",
|
594 |
+
"model.layers.68.mlp.down_proj.weight": "model-00025-of-00029.safetensors",
|
595 |
+
"model.layers.68.mlp.gate_proj.weight": "model-00025-of-00029.safetensors",
|
596 |
+
"model.layers.68.mlp.up_proj.weight": "model-00025-of-00029.safetensors",
|
597 |
+
"model.layers.68.post_attention_layernorm.weight": "model-00025-of-00029.safetensors",
|
598 |
+
"model.layers.68.self_attn.k_proj.weight": "model-00025-of-00029.safetensors",
|
599 |
+
"model.layers.68.self_attn.o_proj.weight": "model-00025-of-00029.safetensors",
|
600 |
+
"model.layers.68.self_attn.q_proj.weight": "model-00025-of-00029.safetensors",
|
601 |
+
"model.layers.68.self_attn.v_proj.weight": "model-00025-of-00029.safetensors",
|
602 |
+
"model.layers.69.input_layernorm.weight": "model-00026-of-00029.safetensors",
|
603 |
+
"model.layers.69.mlp.down_proj.weight": "model-00026-of-00029.safetensors",
|
604 |
+
"model.layers.69.mlp.gate_proj.weight": "model-00025-of-00029.safetensors",
|
605 |
+
"model.layers.69.mlp.up_proj.weight": "model-00025-of-00029.safetensors",
|
606 |
+
"model.layers.69.post_attention_layernorm.weight": "model-00026-of-00029.safetensors",
|
607 |
+
"model.layers.69.self_attn.k_proj.weight": "model-00025-of-00029.safetensors",
|
608 |
+
"model.layers.69.self_attn.o_proj.weight": "model-00025-of-00029.safetensors",
|
609 |
+
"model.layers.69.self_attn.q_proj.weight": "model-00025-of-00029.safetensors",
|
610 |
+
"model.layers.69.self_attn.v_proj.weight": "model-00025-of-00029.safetensors",
|
611 |
+
"model.layers.7.input_layernorm.weight": "model-00003-of-00029.safetensors",
|
612 |
+
"model.layers.7.mlp.down_proj.weight": "model-00003-of-00029.safetensors",
|
613 |
+
"model.layers.7.mlp.gate_proj.weight": "model-00003-of-00029.safetensors",
|
614 |
+
"model.layers.7.mlp.up_proj.weight": "model-00003-of-00029.safetensors",
|
615 |
+
"model.layers.7.post_attention_layernorm.weight": "model-00003-of-00029.safetensors",
|
616 |
+
"model.layers.7.self_attn.k_proj.weight": "model-00003-of-00029.safetensors",
|
617 |
+
"model.layers.7.self_attn.o_proj.weight": "model-00003-of-00029.safetensors",
|
618 |
+
"model.layers.7.self_attn.q_proj.weight": "model-00003-of-00029.safetensors",
|
619 |
+
"model.layers.7.self_attn.v_proj.weight": "model-00003-of-00029.safetensors",
|
620 |
+
"model.layers.70.input_layernorm.weight": "model-00026-of-00029.safetensors",
|
621 |
+
"model.layers.70.mlp.down_proj.weight": "model-00026-of-00029.safetensors",
|
622 |
+
"model.layers.70.mlp.gate_proj.weight": "model-00026-of-00029.safetensors",
|
623 |
+
"model.layers.70.mlp.up_proj.weight": "model-00026-of-00029.safetensors",
|
624 |
+
"model.layers.70.post_attention_layernorm.weight": "model-00026-of-00029.safetensors",
|
625 |
+
"model.layers.70.self_attn.k_proj.weight": "model-00026-of-00029.safetensors",
|
626 |
+
"model.layers.70.self_attn.o_proj.weight": "model-00026-of-00029.safetensors",
|
627 |
+
"model.layers.70.self_attn.q_proj.weight": "model-00026-of-00029.safetensors",
|
628 |
+
"model.layers.70.self_attn.v_proj.weight": "model-00026-of-00029.safetensors",
|
629 |
+
"model.layers.71.input_layernorm.weight": "model-00026-of-00029.safetensors",
|
630 |
+
"model.layers.71.mlp.down_proj.weight": "model-00026-of-00029.safetensors",
|
631 |
+
"model.layers.71.mlp.gate_proj.weight": "model-00026-of-00029.safetensors",
|
632 |
+
"model.layers.71.mlp.up_proj.weight": "model-00026-of-00029.safetensors",
|
633 |
+
"model.layers.71.post_attention_layernorm.weight": "model-00026-of-00029.safetensors",
|
634 |
+
"model.layers.71.self_attn.k_proj.weight": "model-00026-of-00029.safetensors",
|
635 |
+
"model.layers.71.self_attn.o_proj.weight": "model-00026-of-00029.safetensors",
|
636 |
+
"model.layers.71.self_attn.q_proj.weight": "model-00026-of-00029.safetensors",
|
637 |
+
"model.layers.71.self_attn.v_proj.weight": "model-00026-of-00029.safetensors",
|
638 |
+
"model.layers.72.input_layernorm.weight": "model-00027-of-00029.safetensors",
|
639 |
+
"model.layers.72.mlp.down_proj.weight": "model-00027-of-00029.safetensors",
|
640 |
+
"model.layers.72.mlp.gate_proj.weight": "model-00026-of-00029.safetensors",
|
641 |
+
"model.layers.72.mlp.up_proj.weight": "model-00027-of-00029.safetensors",
|
642 |
+
"model.layers.72.post_attention_layernorm.weight": "model-00027-of-00029.safetensors",
|
643 |
+
"model.layers.72.self_attn.k_proj.weight": "model-00026-of-00029.safetensors",
|
644 |
+
"model.layers.72.self_attn.o_proj.weight": "model-00026-of-00029.safetensors",
|
645 |
+
"model.layers.72.self_attn.q_proj.weight": "model-00026-of-00029.safetensors",
|
646 |
+
"model.layers.72.self_attn.v_proj.weight": "model-00026-of-00029.safetensors",
|
647 |
+
"model.layers.73.input_layernorm.weight": "model-00027-of-00029.safetensors",
|
648 |
+
"model.layers.73.mlp.down_proj.weight": "model-00027-of-00029.safetensors",
|
649 |
+
"model.layers.73.mlp.gate_proj.weight": "model-00027-of-00029.safetensors",
|
650 |
+
"model.layers.73.mlp.up_proj.weight": "model-00027-of-00029.safetensors",
|
651 |
+
"model.layers.73.post_attention_layernorm.weight": "model-00027-of-00029.safetensors",
|
652 |
+
"model.layers.73.self_attn.k_proj.weight": "model-00027-of-00029.safetensors",
|
653 |
+
"model.layers.73.self_attn.o_proj.weight": "model-00027-of-00029.safetensors",
|
654 |
+
"model.layers.73.self_attn.q_proj.weight": "model-00027-of-00029.safetensors",
|
655 |
+
"model.layers.73.self_attn.v_proj.weight": "model-00027-of-00029.safetensors",
|
656 |
+
"model.layers.74.input_layernorm.weight": "model-00027-of-00029.safetensors",
|
657 |
+
"model.layers.74.mlp.down_proj.weight": "model-00027-of-00029.safetensors",
|
658 |
+
"model.layers.74.mlp.gate_proj.weight": "model-00027-of-00029.safetensors",
|
659 |
+
"model.layers.74.mlp.up_proj.weight": "model-00027-of-00029.safetensors",
|
660 |
+
"model.layers.74.post_attention_layernorm.weight": "model-00027-of-00029.safetensors",
|
661 |
+
"model.layers.74.self_attn.k_proj.weight": "model-00027-of-00029.safetensors",
|
662 |
+
"model.layers.74.self_attn.o_proj.weight": "model-00027-of-00029.safetensors",
|
663 |
+
"model.layers.74.self_attn.q_proj.weight": "model-00027-of-00029.safetensors",
|
664 |
+
"model.layers.74.self_attn.v_proj.weight": "model-00027-of-00029.safetensors",
|
665 |
+
"model.layers.75.input_layernorm.weight": "model-00028-of-00029.safetensors",
|
666 |
+
"model.layers.75.mlp.down_proj.weight": "model-00028-of-00029.safetensors",
|
667 |
+
"model.layers.75.mlp.gate_proj.weight": "model-00028-of-00029.safetensors",
|
668 |
+
"model.layers.75.mlp.up_proj.weight": "model-00028-of-00029.safetensors",
|
669 |
+
"model.layers.75.post_attention_layernorm.weight": "model-00028-of-00029.safetensors",
|
670 |
+
"model.layers.75.self_attn.k_proj.weight": "model-00027-of-00029.safetensors",
|
671 |
+
"model.layers.75.self_attn.o_proj.weight": "model-00027-of-00029.safetensors",
|
672 |
+
"model.layers.75.self_attn.q_proj.weight": "model-00027-of-00029.safetensors",
|
673 |
+
"model.layers.75.self_attn.v_proj.weight": "model-00027-of-00029.safetensors",
|
674 |
+
"model.layers.76.input_layernorm.weight": "model-00028-of-00029.safetensors",
|
675 |
+
"model.layers.76.mlp.down_proj.weight": "model-00028-of-00029.safetensors",
|
676 |
+
"model.layers.76.mlp.gate_proj.weight": "model-00028-of-00029.safetensors",
|
677 |
+
"model.layers.76.mlp.up_proj.weight": "model-00028-of-00029.safetensors",
|
678 |
+
"model.layers.76.post_attention_layernorm.weight": "model-00028-of-00029.safetensors",
|
679 |
+
"model.layers.76.self_attn.k_proj.weight": "model-00028-of-00029.safetensors",
|
680 |
+
"model.layers.76.self_attn.o_proj.weight": "model-00028-of-00029.safetensors",
|
681 |
+
"model.layers.76.self_attn.q_proj.weight": "model-00028-of-00029.safetensors",
|
682 |
+
"model.layers.76.self_attn.v_proj.weight": "model-00028-of-00029.safetensors",
|
683 |
+
"model.layers.77.input_layernorm.weight": "model-00028-of-00029.safetensors",
|
684 |
+
"model.layers.77.mlp.down_proj.weight": "model-00028-of-00029.safetensors",
|
685 |
+
"model.layers.77.mlp.gate_proj.weight": "model-00028-of-00029.safetensors",
|
686 |
+
"model.layers.77.mlp.up_proj.weight": "model-00028-of-00029.safetensors",
|
687 |
+
"model.layers.77.post_attention_layernorm.weight": "model-00028-of-00029.safetensors",
|
688 |
+
"model.layers.77.self_attn.k_proj.weight": "model-00028-of-00029.safetensors",
|
689 |
+
"model.layers.77.self_attn.o_proj.weight": "model-00028-of-00029.safetensors",
|
690 |
+
"model.layers.77.self_attn.q_proj.weight": "model-00028-of-00029.safetensors",
|
691 |
+
"model.layers.77.self_attn.v_proj.weight": "model-00028-of-00029.safetensors",
|
692 |
+
"model.layers.78.input_layernorm.weight": "model-00029-of-00029.safetensors",
|
693 |
+
"model.layers.78.mlp.down_proj.weight": "model-00029-of-00029.safetensors",
|
694 |
+
"model.layers.78.mlp.gate_proj.weight": "model-00029-of-00029.safetensors",
|
695 |
+
"model.layers.78.mlp.up_proj.weight": "model-00029-of-00029.safetensors",
|
696 |
+
"model.layers.78.post_attention_layernorm.weight": "model-00029-of-00029.safetensors",
|
697 |
+
"model.layers.78.self_attn.k_proj.weight": "model-00028-of-00029.safetensors",
|
698 |
+
"model.layers.78.self_attn.o_proj.weight": "model-00029-of-00029.safetensors",
|
699 |
+
"model.layers.78.self_attn.q_proj.weight": "model-00028-of-00029.safetensors",
|
700 |
+
"model.layers.78.self_attn.v_proj.weight": "model-00028-of-00029.safetensors",
|
701 |
+
"model.layers.79.input_layernorm.weight": "model-00029-of-00029.safetensors",
|
702 |
+
"model.layers.79.mlp.down_proj.weight": "model-00029-of-00029.safetensors",
|
703 |
+
"model.layers.79.mlp.gate_proj.weight": "model-00029-of-00029.safetensors",
|
704 |
+
"model.layers.79.mlp.up_proj.weight": "model-00029-of-00029.safetensors",
|
705 |
+
"model.layers.79.post_attention_layernorm.weight": "model-00029-of-00029.safetensors",
|
706 |
+
"model.layers.79.self_attn.k_proj.weight": "model-00029-of-00029.safetensors",
|
707 |
+
"model.layers.79.self_attn.o_proj.weight": "model-00029-of-00029.safetensors",
|
708 |
+
"model.layers.79.self_attn.q_proj.weight": "model-00029-of-00029.safetensors",
|
709 |
+
"model.layers.79.self_attn.v_proj.weight": "model-00029-of-00029.safetensors",
|
710 |
+
"model.layers.8.input_layernorm.weight": "model-00004-of-00029.safetensors",
|
711 |
+
"model.layers.8.mlp.down_proj.weight": "model-00004-of-00029.safetensors",
|
712 |
+
"model.layers.8.mlp.gate_proj.weight": "model-00004-of-00029.safetensors",
|
713 |
+
"model.layers.8.mlp.up_proj.weight": "model-00004-of-00029.safetensors",
|
714 |
+
"model.layers.8.post_attention_layernorm.weight": "model-00004-of-00029.safetensors",
|
715 |
+
"model.layers.8.self_attn.k_proj.weight": "model-00003-of-00029.safetensors",
|
716 |
+
"model.layers.8.self_attn.o_proj.weight": "model-00004-of-00029.safetensors",
|
717 |
+
"model.layers.8.self_attn.q_proj.weight": "model-00003-of-00029.safetensors",
|
718 |
+
"model.layers.8.self_attn.v_proj.weight": "model-00003-of-00029.safetensors",
|
719 |
+
"model.layers.9.input_layernorm.weight": "model-00004-of-00029.safetensors",
|
720 |
+
"model.layers.9.mlp.down_proj.weight": "model-00004-of-00029.safetensors",
|
721 |
+
"model.layers.9.mlp.gate_proj.weight": "model-00004-of-00029.safetensors",
|
722 |
+
"model.layers.9.mlp.up_proj.weight": "model-00004-of-00029.safetensors",
|
723 |
+
"model.layers.9.post_attention_layernorm.weight": "model-00004-of-00029.safetensors",
|
724 |
+
"model.layers.9.self_attn.k_proj.weight": "model-00004-of-00029.safetensors",
|
725 |
+
"model.layers.9.self_attn.o_proj.weight": "model-00004-of-00029.safetensors",
|
726 |
+
"model.layers.9.self_attn.q_proj.weight": "model-00004-of-00029.safetensors",
|
727 |
+
"model.layers.9.self_attn.v_proj.weight": "model-00004-of-00029.safetensors",
|
728 |
+
"model.norm.weight": "model-00029-of-00029.safetensors"
|
729 |
+
}
|
730 |
+
}
|
special_tokens_map.json
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token": {
|
3 |
+
"content": "<s>",
|
4 |
+
"lstrip": false,
|
5 |
+
"normalized": false,
|
6 |
+
"rstrip": false,
|
7 |
+
"single_word": false
|
8 |
+
},
|
9 |
+
"eos_token": {
|
10 |
+
"content": "</s>",
|
11 |
+
"lstrip": false,
|
12 |
+
"normalized": false,
|
13 |
+
"rstrip": false,
|
14 |
+
"single_word": false
|
15 |
+
},
|
16 |
+
"pad_token": {
|
17 |
+
"content": "<unk>",
|
18 |
+
"lstrip": false,
|
19 |
+
"normalized": false,
|
20 |
+
"rstrip": false,
|
21 |
+
"single_word": false
|
22 |
+
},
|
23 |
+
"unk_token": {
|
24 |
+
"content": "<unk>",
|
25 |
+
"lstrip": false,
|
26 |
+
"normalized": false,
|
27 |
+
"rstrip": false,
|
28 |
+
"single_word": false
|
29 |
+
}
|
30 |
+
}
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer.model
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347
|
3 |
+
size 499723
|
tokenizer_config.json
ADDED
@@ -0,0 +1,43 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"add_bos_token": true,
|
3 |
+
"add_eos_token": false,
|
4 |
+
"added_tokens_decoder": {
|
5 |
+
"0": {
|
6 |
+
"content": "<unk>",
|
7 |
+
"lstrip": false,
|
8 |
+
"normalized": false,
|
9 |
+
"rstrip": false,
|
10 |
+
"single_word": false,
|
11 |
+
"special": true
|
12 |
+
},
|
13 |
+
"1": {
|
14 |
+
"content": "<s>",
|
15 |
+
"lstrip": false,
|
16 |
+
"normalized": false,
|
17 |
+
"rstrip": false,
|
18 |
+
"single_word": false,
|
19 |
+
"special": true
|
20 |
+
},
|
21 |
+
"2": {
|
22 |
+
"content": "</s>",
|
23 |
+
"lstrip": false,
|
24 |
+
"normalized": false,
|
25 |
+
"rstrip": false,
|
26 |
+
"single_word": false,
|
27 |
+
"special": true
|
28 |
+
}
|
29 |
+
},
|
30 |
+
"bos_token": "<s>",
|
31 |
+
"clean_up_tokenization_spaces": false,
|
32 |
+
"eos_token": "</s>",
|
33 |
+
"legacy": false,
|
34 |
+
"model_max_length": 1000000000000000019884624838656,
|
35 |
+
"pad_token": "<unk>",
|
36 |
+
"padding_side": "right",
|
37 |
+
"sp_model_kwargs": {},
|
38 |
+
"spaces_between_special_tokens": false,
|
39 |
+
"split_special_tokens": false,
|
40 |
+
"tokenizer_class": "LlamaTokenizer",
|
41 |
+
"unk_token": "<unk>",
|
42 |
+
"use_default_system_prompt": false
|
43 |
+
}
|
train_results.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"epoch": 3.0,
|
3 |
+
"train_loss": 0.28055200490389104,
|
4 |
+
"train_runtime": 252630.326,
|
5 |
+
"train_samples_per_second": 5.482,
|
6 |
+
"train_steps_per_second": 0.043
|
7 |
+
}
|
trainer_log.jsonl
ADDED
@@ -0,0 +1,44 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{"current_steps": 1000, "total_steps": 10818, "loss": 0.5163, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.078217455621301e-06, "epoch": 0.28, "percentage": 9.24, "elapsed_time": "6:28:55", "remaining_time": "2 days, 15:38:25"}
|
2 |
+
{"current_steps": 1000, "total_steps": 10818, "loss": 0.5163, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.078217455621301e-06, "epoch": 0.28, "percentage": 9.24, "elapsed_time": "6:28:55", "remaining_time": "2 days, 15:38:26"}
|
3 |
+
{"current_steps": 1000, "total_steps": 10818, "loss": 0.5163, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.078217455621301e-06, "epoch": 0.28, "percentage": 9.24, "elapsed_time": "6:28:55", "remaining_time": "2 days, 15:38:26"}
|
4 |
+
{"current_steps": 1000, "total_steps": 10818, "loss": 0.5163, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.078217455621301e-06, "epoch": 0.28, "percentage": 9.24, "elapsed_time": "6:28:55", "remaining_time": "2 days, 15:38:26"}
|
5 |
+
{"current_steps": 2000, "total_steps": 10818, "loss": 0.4627, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.153661242603551e-06, "epoch": 0.55, "percentage": 18.49, "elapsed_time": "13:00:55", "remaining_time": "2 days, 9:23:06"}
|
6 |
+
{"current_steps": 2000, "total_steps": 10818, "loss": 0.4627, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.153661242603551e-06, "epoch": 0.55, "percentage": 18.49, "elapsed_time": "13:00:55", "remaining_time": "2 days, 9:23:06"}
|
7 |
+
{"current_steps": 2000, "total_steps": 10818, "loss": 0.4627, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.153661242603551e-06, "epoch": 0.55, "percentage": 18.49, "elapsed_time": "13:00:55", "remaining_time": "2 days, 9:23:06"}
|
8 |
+
{"current_steps": 2000, "total_steps": 10818, "loss": 0.4627, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.153661242603551e-06, "epoch": 0.55, "percentage": 18.49, "elapsed_time": "13:00:55", "remaining_time": "2 days, 9:23:06"}
|
9 |
+
{"current_steps": 3000, "total_steps": 10818, "loss": 0.4393, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.229105029585799e-06, "epoch": 0.83, "percentage": 27.73, "elapsed_time": "19:32:29", "remaining_time": "2 days, 2:55:30"}
|
10 |
+
{"current_steps": 3000, "total_steps": 10818, "loss": 0.4393, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.229105029585799e-06, "epoch": 0.83, "percentage": 27.73, "elapsed_time": "19:32:29", "remaining_time": "2 days, 2:55:30"}
|
11 |
+
{"current_steps": 3000, "total_steps": 10818, "loss": 0.4393, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.229105029585799e-06, "epoch": 0.83, "percentage": 27.73, "elapsed_time": "19:32:29", "remaining_time": "2 days, 2:55:30"}
|
12 |
+
{"current_steps": 3000, "total_steps": 10818, "loss": 0.4393, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.229105029585799e-06, "epoch": 0.83, "percentage": 27.73, "elapsed_time": "19:32:29", "remaining_time": "2 days, 2:55:30"}
|
13 |
+
{"current_steps": 4000, "total_steps": 10818, "loss": 0.3697, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.304548816568048e-06, "epoch": 1.11, "percentage": 36.98, "elapsed_time": "1 day, 2:02:03", "remaining_time": "1 day, 20:22:31"}
|
14 |
+
{"current_steps": 4000, "total_steps": 10818, "loss": 0.3697, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.304548816568048e-06, "epoch": 1.11, "percentage": 36.98, "elapsed_time": "1 day, 2:02:03", "remaining_time": "1 day, 20:22:31"}
|
15 |
+
{"current_steps": 4000, "total_steps": 10818, "loss": 0.3697, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.304548816568048e-06, "epoch": 1.11, "percentage": 36.98, "elapsed_time": "1 day, 2:02:03", "remaining_time": "1 day, 20:22:31"}
|
16 |
+
{"current_steps": 4000, "total_steps": 10818, "loss": 0.3697, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.304548816568048e-06, "epoch": 1.11, "percentage": 36.98, "elapsed_time": "1 day, 2:02:03", "remaining_time": "1 day, 20:22:31"}
|
17 |
+
{"current_steps": 5000, "total_steps": 10818, "loss": 0.2788, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.379992603550296e-06, "epoch": 1.39, "percentage": 46.22, "elapsed_time": "1 day, 8:28:55", "remaining_time": "1 day, 13:47:45"}
|
18 |
+
{"current_steps": 5000, "total_steps": 10818, "loss": 0.2788, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.379992603550296e-06, "epoch": 1.39, "percentage": 46.22, "elapsed_time": "1 day, 8:28:55", "remaining_time": "1 day, 13:47:45"}
|
19 |
+
{"current_steps": 5000, "total_steps": 10818, "loss": 0.2788, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.379992603550296e-06, "epoch": 1.39, "percentage": 46.22, "elapsed_time": "1 day, 8:28:55", "remaining_time": "1 day, 13:47:45"}
|
20 |
+
{"current_steps": 5000, "total_steps": 10818, "loss": 0.2788, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.379992603550296e-06, "epoch": 1.39, "percentage": 46.22, "elapsed_time": "1 day, 8:28:55", "remaining_time": "1 day, 13:47:45"}
|
21 |
+
{"current_steps": 6000, "total_steps": 10818, "loss": 0.2757, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.455436390532545e-06, "epoch": 1.66, "percentage": 55.46, "elapsed_time": "1 day, 14:55:00", "remaining_time": "1 day, 7:15:00"}
|
22 |
+
{"current_steps": 6000, "total_steps": 10818, "loss": 0.2757, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.455436390532545e-06, "epoch": 1.66, "percentage": 55.46, "elapsed_time": "1 day, 14:55:00", "remaining_time": "1 day, 7:15:00"}
|
23 |
+
{"current_steps": 6000, "total_steps": 10818, "loss": 0.2757, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.455436390532545e-06, "epoch": 1.66, "percentage": 55.46, "elapsed_time": "1 day, 14:55:00", "remaining_time": "1 day, 7:15:00"}
|
24 |
+
{"current_steps": 6000, "total_steps": 10818, "loss": 0.2757, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.455436390532545e-06, "epoch": 1.66, "percentage": 55.46, "elapsed_time": "1 day, 14:55:00", "remaining_time": "1 day, 7:15:00"}
|
25 |
+
{"current_steps": 7000, "total_steps": 10818, "loss": 0.2708, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.530880177514793e-06, "epoch": 1.94, "percentage": 64.71, "elapsed_time": "1 day, 21:22:31", "remaining_time": "1 day, 0:44:56"}
|
26 |
+
{"current_steps": 7000, "total_steps": 10818, "loss": 0.2708, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.530880177514793e-06, "epoch": 1.94, "percentage": 64.71, "elapsed_time": "1 day, 21:22:31", "remaining_time": "1 day, 0:44:56"}
|
27 |
+
{"current_steps": 7000, "total_steps": 10818, "loss": 0.2708, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.530880177514793e-06, "epoch": 1.94, "percentage": 64.71, "elapsed_time": "1 day, 21:22:31", "remaining_time": "1 day, 0:44:56"}
|
28 |
+
{"current_steps": 7000, "total_steps": 10818, "loss": 0.2708, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.530880177514793e-06, "epoch": 1.94, "percentage": 64.71, "elapsed_time": "1 day, 21:22:31", "remaining_time": "1 day, 0:44:56"}
|
29 |
+
{"current_steps": 8000, "total_steps": 10818, "loss": 0.1397, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.6063239644970415e-06, "epoch": 2.22, "percentage": 73.95, "elapsed_time": "2 days, 3:50:19", "remaining_time": "18:15:36"}
|
30 |
+
{"current_steps": 8000, "total_steps": 10818, "loss": 0.1397, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.6063239644970415e-06, "epoch": 2.22, "percentage": 73.95, "elapsed_time": "2 days, 3:50:19", "remaining_time": "18:15:36"}
|
31 |
+
{"current_steps": 8000, "total_steps": 10818, "loss": 0.1397, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.6063239644970415e-06, "epoch": 2.22, "percentage": 73.95, "elapsed_time": "2 days, 3:50:19", "remaining_time": "18:15:36"}
|
32 |
+
{"current_steps": 8000, "total_steps": 10818, "loss": 0.1397, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.6063239644970415e-06, "epoch": 2.22, "percentage": 73.95, "elapsed_time": "2 days, 3:50:19", "remaining_time": "18:15:36"}
|
33 |
+
{"current_steps": 9000, "total_steps": 10818, "loss": 0.1026, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.6817677514792902e-06, "epoch": 2.5, "percentage": 83.19, "elapsed_time": "2 days, 10:20:13", "remaining_time": "11:47:02"}
|
34 |
+
{"current_steps": 9000, "total_steps": 10818, "loss": 0.1026, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.6817677514792902e-06, "epoch": 2.5, "percentage": 83.19, "elapsed_time": "2 days, 10:20:13", "remaining_time": "11:47:02"}
|
35 |
+
{"current_steps": 9000, "total_steps": 10818, "loss": 0.1026, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.6817677514792902e-06, "epoch": 2.5, "percentage": 83.19, "elapsed_time": "2 days, 10:20:13", "remaining_time": "11:47:02"}
|
36 |
+
{"current_steps": 9000, "total_steps": 10818, "loss": 0.1026, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.6817677514792902e-06, "epoch": 2.5, "percentage": 83.19, "elapsed_time": "2 days, 10:20:13", "remaining_time": "11:47:02"}
|
37 |
+
{"current_steps": 10000, "total_steps": 10818, "loss": 0.0998, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.572115384615385e-07, "epoch": 2.77, "percentage": 92.44, "elapsed_time": "2 days, 16:52:35", "remaining_time": "5:18:24"}
|
38 |
+
{"current_steps": 10000, "total_steps": 10818, "loss": 0.0998, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.572115384615385e-07, "epoch": 2.77, "percentage": 92.44, "elapsed_time": "2 days, 16:52:35", "remaining_time": "5:18:24"}
|
39 |
+
{"current_steps": 10000, "total_steps": 10818, "loss": 0.0998, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.572115384615385e-07, "epoch": 2.77, "percentage": 92.44, "elapsed_time": "2 days, 16:52:35", "remaining_time": "5:18:24"}
|
40 |
+
{"current_steps": 10000, "total_steps": 10818, "loss": 0.0998, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.572115384615385e-07, "epoch": 2.77, "percentage": 92.44, "elapsed_time": "2 days, 16:52:35", "remaining_time": "5:18:24"}
|
41 |
+
{"current_steps": 10818, "total_steps": 10818, "loss": null, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "2 days, 22:10:30", "remaining_time": "0:00:00"}
|
42 |
+
{"current_steps": 10818, "total_steps": 10818, "loss": null, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "2 days, 22:10:30", "remaining_time": "0:00:00"}
|
43 |
+
{"current_steps": 10818, "total_steps": 10818, "loss": null, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "2 days, 22:10:30", "remaining_time": "0:00:00"}
|
44 |
+
{"current_steps": 10818, "total_steps": 10818, "loss": null, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "2 days, 22:10:30", "remaining_time": "0:00:00"}
|
trainer_state.json
ADDED
@@ -0,0 +1,90 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"best_metric": null,
|
3 |
+
"best_model_checkpoint": null,
|
4 |
+
"epoch": 2.9993761696818466,
|
5 |
+
"eval_steps": 500,
|
6 |
+
"global_step": 10818,
|
7 |
+
"is_hyper_param_search": false,
|
8 |
+
"is_local_process_zero": true,
|
9 |
+
"is_world_process_zero": true,
|
10 |
+
"log_history": [
|
11 |
+
{
|
12 |
+
"epoch": 0.28,
|
13 |
+
"learning_rate": 9.078217455621301e-06,
|
14 |
+
"loss": 0.5163,
|
15 |
+
"step": 1000
|
16 |
+
},
|
17 |
+
{
|
18 |
+
"epoch": 0.55,
|
19 |
+
"learning_rate": 8.153661242603551e-06,
|
20 |
+
"loss": 0.4627,
|
21 |
+
"step": 2000
|
22 |
+
},
|
23 |
+
{
|
24 |
+
"epoch": 0.83,
|
25 |
+
"learning_rate": 7.229105029585799e-06,
|
26 |
+
"loss": 0.4393,
|
27 |
+
"step": 3000
|
28 |
+
},
|
29 |
+
{
|
30 |
+
"epoch": 1.11,
|
31 |
+
"learning_rate": 6.304548816568048e-06,
|
32 |
+
"loss": 0.3697,
|
33 |
+
"step": 4000
|
34 |
+
},
|
35 |
+
{
|
36 |
+
"epoch": 1.39,
|
37 |
+
"learning_rate": 5.379992603550296e-06,
|
38 |
+
"loss": 0.2788,
|
39 |
+
"step": 5000
|
40 |
+
},
|
41 |
+
{
|
42 |
+
"epoch": 1.66,
|
43 |
+
"learning_rate": 4.455436390532545e-06,
|
44 |
+
"loss": 0.2757,
|
45 |
+
"step": 6000
|
46 |
+
},
|
47 |
+
{
|
48 |
+
"epoch": 1.94,
|
49 |
+
"learning_rate": 3.530880177514793e-06,
|
50 |
+
"loss": 0.2708,
|
51 |
+
"step": 7000
|
52 |
+
},
|
53 |
+
{
|
54 |
+
"epoch": 2.22,
|
55 |
+
"learning_rate": 2.6063239644970415e-06,
|
56 |
+
"loss": 0.1397,
|
57 |
+
"step": 8000
|
58 |
+
},
|
59 |
+
{
|
60 |
+
"epoch": 2.5,
|
61 |
+
"learning_rate": 1.6817677514792902e-06,
|
62 |
+
"loss": 0.1026,
|
63 |
+
"step": 9000
|
64 |
+
},
|
65 |
+
{
|
66 |
+
"epoch": 2.77,
|
67 |
+
"learning_rate": 7.572115384615385e-07,
|
68 |
+
"loss": 0.0998,
|
69 |
+
"step": 10000
|
70 |
+
},
|
71 |
+
{
|
72 |
+
"epoch": 3.0,
|
73 |
+
"step": 10818,
|
74 |
+
"total_flos": 3075736122425344.0,
|
75 |
+
"train_loss": 0.28055200490389104,
|
76 |
+
"train_runtime": 252630.326,
|
77 |
+
"train_samples_per_second": 5.482,
|
78 |
+
"train_steps_per_second": 0.043
|
79 |
+
}
|
80 |
+
],
|
81 |
+
"logging_steps": 1000,
|
82 |
+
"max_steps": 10818,
|
83 |
+
"num_input_tokens_seen": 0,
|
84 |
+
"num_train_epochs": 3,
|
85 |
+
"save_steps": 1000,
|
86 |
+
"total_flos": 3075736122425344.0,
|
87 |
+
"train_batch_size": 1,
|
88 |
+
"trial_name": null,
|
89 |
+
"trial_params": null
|
90 |
+
}
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3995ac6ce8f75db4901ac1233ea0ebe0bbba8b9708bce92671c71507ed909ab1
|
3 |
+
size 7224
|
training_loss.png
ADDED