File size: 23,771 Bytes
41dbc03 |
1 |
{"AUTHORS":"bafkr4ihwekpujeddtf6zhfsdebi2drlwe5oqcoxgjfwx7ferhbqobfj6wm","LICENSE":"bafkr4ibsoazknxpee2qulrxrc3l4jmhaahstdqyem6dwyagq2hlwnjn6iu","README.md":"bafkr4ia6hg7qtn2fvhx5lr4uqu6rgvp4fmy4dgssb4owvdlzt5tr5vub4e","docs/Makefile":"bafkr4ick4j4xsb7smd4a7efyarojtbzsh6gwnngyabespqyqrlhumv3iru","docs/_templates/autosummary/base.rst":"bafkr4icgoporlsagdorsfp2vvr3vgkuvyidsnmz246v6qanvalwrdbtaji","docs/_templates/autosummary/class.rst":"bafkr4ih4iegu4dzlzje23wvqwdk5sjizrxvfl5rukr4pyo2jjjorbaeaje","docs/_templates/autosummary/module.rst":"bafkr4ic27qyvvbvcqoiil2bedopid72xmofq7ou4wthc6bxirmc2fzu3ce","docs/api/index.rst":"bafkr4igolgbnurx3eerrzikqqi46r3mkgm2dkju7x4pr34f2eehjnmbgtu","docs/conf.py":"bafkr4ifqhmt7uplzjffvzb3cewb7wa4ph2smzmzpu5dpavo3c2jpzeu3ki","docs/guide/faq.md":"bafkr4if25u2p65lur25w5junnafyxwe2wdrq7wh6jf6ejogklbtuyheiqq","docs/guide/getting_started.md":"bafkr4ie224mwoxfny6tcfadmqjpf4qtvuf5b2e5zg6emr2algydgsqyxmm","docs/guide/index.md":"bafkr4ia355ytjloggng4wir7bwdjbqardag5rmhf4g73thfjdu6pp5hsr4","docs/guide/instruction_tuning.md":"bafkr4idrugtsfkbg5dggcivmxnt7bo6jkskfxcdndjoxy3u3okfjkr2cpu","docs/guide/tokenization.md":"bafkr4ifvfhvazgnwcddizq4xpsztjc5s3bqwr5mfvzi3cmsesemmpuk5su","docs/guide/weights_conversion.md":"bafkr4ialbahrvejzgapgfm7f5to752exilu64wv6qn7io3vmm54vljor5y","docs/imgs/llama-falcon.png":"bafkr4id6hagmjqhkgep2hzvu26oeujj2zknvgq5hwsfdb65f7svpkyutq4","docs/index.rst":"bafkr4ifnj2amu2bndujdojcwoehg4nfooji54bjze6mj3gaalctl3q2dru","docs/make.bat":"bafkr4ieeahkcfwaoaubldgpwxfaz5llpmwetzsrn5sydasbri7dfapjtnm","docs/requirements.txt":"bafkr4ifl3ejlg6xijxvbta5bwlscsdzl5r4eevpjn5lrg56k5umu26m2ci","examples/evaluate_retriever_nq.sh":"bafkr4igwav52oy5aw27rnanp7xticyv5qnhwfzhu43cx72ynrek42lui6a","examples/evaluate_zeroshot_gpt.sh":"bafkr4id2hx6njnv7v5gtv2d3jsy627rbbwy37izb6pphtjn7ilgvgpcc24","examples/finetune.sh":"bafkr4ih3ykslp6xe7lt5hlui3puvtdivznh3gvfejeoflelj4bkymlctsu","examples/finetune_mnli_distributed.sh":"bafkr4iaphuufi4cz3dy2htojfly23db26z7ym6lfoaisc7zq475hzhesra","examples/finetune_race_distributed.sh":"bafkr4ialu4ybbyki2dkzqyfiedneyhymzm3pui7drzgufxztxitb7vtirq","examples/finetune_retriever_distributed.sh":"bafkr4ibbhdxthxkglxczinfqrdw62pr7mkmfebsfjqtnizjdnxx5tgs3n4","examples/hf_to_megatron.sh":"bafkr4ifhlq3idal2cqbotigihybjwnnuiagujffj2uaahnicvsyn5ixk7e","examples/merge_mp_bert.sh":"bafkr4iafwit67bvw7opeak2wu54blftzvcvf6shwhtfl3dfkunxh75stmi","examples/msdp/README.md":"bafkr4igw7dgjbblujvw7sauqcmzhjgqlxghrvenrrxgefzsldtw4akappu","examples/msdp/data_processing.sh":"bafkr4ihv3czsrdyc3xuvniz7hq4johs7nuy62jlsqtzsmhsygq5ci5qz24","examples/msdp/eval_knwl_generation.sh":"bafkr4ia4x6p3tljw46ovo3tbuy56ey4oypcbxmqwev6tppjhjp7sakytry","examples/msdp/eval_resp_generation.sh":"bafkr4ifcfcjic4gf7oihd2aayuze5yrpcffv6eglxy623nf6yb5l6sbr54","examples/msdp/prep_resp_gen.sh":"bafkr4ibma4iqatqurkpql3pk56fmobu63qkfmgn5virp7cnc425nv4eqaa","examples/msdp/prompt_knwl_gen.sh":"bafkr4igqvraavlwzcr55rl6p75ihjuilnbnbdu3wxiw7yzrsxmzqt6pyni","examples/msdp/prompt_resp_gen.sh":"bafkr4idmo5bt7r7bs6igwool4bcqklcwdnugyyw4h2gasgqy6xquhdspua","examples/parallelize.sh":"bafkr4iehl4alqdpo52x664brqbcprolsgwebw74xmyhrhavdpdy5qkfywu","examples/pretrain_bert.sh":"bafkr4id5geqdxa74bkn3vb5pnkcwwjzvp445h2vpx6zct7t74zum5bij2y","examples/pretrain_bert_distributed.sh":"bafkr4idh3dg46yaf4mtdlazkxdng2hubtzc3gvuln47rcsxxrfeuvd2iha","examples/pretrain_bert_distributed_with_mp.sh":"bafkr4if3djq7pqgusi5jwlmv75gilf2xwljwbvvyardntu77cxj5f6eyke","examples/pretrain_gpt.sh":"bafkr4iabou2nikzr2azwttdupxuo6xrm6u2tn32gzpjh3wc5mmlm2wp63q","examples/pretrain_gpt3_175B.sh":"bafkr4ia7xhgqivw7ku5ldr2g4yhmvuyce4qg5ody4zrkq7zxxcp3zp4a2e","examples/pretrain_gpt_distributed.sh":"bafkr4ihladd52npvlo32l3pst4w5r3x6kxkhcioquyk44jpd52lo2avbne","examples/pretrain_gpt_distributed_with_mp.sh":"bafkr4iecnum4nhbvxzrlrm4sukvbj7etqmeb76pyrtruwr6hvcjuoi5ake","examples/pretrain_ict.sh":"bafkr4ibubttjrbaexl3dvodi3atoezuoxlljsg55rkutkqrak7xg44uvwm","examples/pretrain_t5.sh":"bafkr4iautlylojgklzcvq4ouqr5za37vxfpjhg34xsy6evwncztennlqre","examples/pretrain_t5_distributed.sh":"bafkr4iajusck6rlftiea5ti2f2wubzdmbtz3fyg7gziom2crs3bfckpzvu","examples/pretrain_t5_distributed_with_mp.sh":"bafkr4ihe2tnub37iuy26zampgfhddaass47dj6x5spjwowl4z6tuik73bi","examples/run_text_generation_server_345M.sh":"bafkr4idfkrifjjmhyen5iecyyale254r57vbqr4af5bxdoz3tscyukg3bu","examples/run_text_generation_server_345M_8_tensor_parallel.sh":"bafkr4iau2gxxq5fuww2v75thlhqjjtbtrdt5u4jimibce7tfgbrdouehv4","examples/sc21/CONFIG.sh":"bafkr4iex6a6lcmn6vkxy3c7h5smlzx7soylg4s4ske35djpelmtm6uchji","examples/sc21/README.md":"bafkr4igpjdp5toa7wtwcthcvp5pxb6tottzw5tdfd2wah3vcbk3lcwhw74","examples/sc21/SBATCH.sh":"bafkr4igpprvisqzuw7qvukmd7gkb7eaoav4uxd6ohp2jcuj4saghzpbxly","examples/sc21/SRUN.sh":"bafkr4igvfw6vo6ttnmkkqrqbvolym77ugpkfq3kylwc7aq7a6li2h6ciqa","examples/sc21/run_figure_11.sh":"bafkr4if3hp735hc4nvgbvpnaljoibbpgjd4q2zeagwyewvqzcm5zponpti","examples/sc21/run_figure_12.sh":"bafkr4ibf6rt45epe55uancnlnx2l2vi5iaxjhrr26l4s5uk5arc4tgce6a","examples/sc21/run_figure_13.sh":"bafkr4ifi5nbrtobzxr6uwv2qcnz2tddr4ewxjyznky7542paf2jp6xp77e","examples/sc21/run_figure_14.sh":"bafkr4idqsk63pwvggnrkl5j6gctvr7lfxft546lyaeejyezppkkrr6xm6a","examples/sc21/run_figure_15.sh":"bafkr4ic7oxthcj4t37vizhruiuvbwqgxetk3fknxm2zhtqycckxsqapqwi","examples/sc21/run_figure_16.sh":"bafkr4idvclbzc3idfl7ohkzrryvwe6y5k2dtwhi5ndvlgwpeil3uzb7upa","examples/sc21/run_figure_17.sh":"bafkr4iebxsm3tyjorwgpoovw34pehqnh4lstokcdvas6bufc4dgcbscu6e","examples/sc21/run_figure_18.sh":"bafkr4iexh264opsrfapwiakhr7bxhqf3qjxr5nyzrazinobdyjfae4tkum","examples/sc21/run_table_1.sh":"bafkr4igojtssc67oyeml2pw6gsjxtxaif4ehv56i46grdg7yi5deos2rrm","examples/verify.sh":"bafkr4icxahckpqfzs6hfgmjlqbdeitfxynj5jo3mta25esisobzlh6uvgq","finetune.py":"bafkr4ibkwh62titir536jxlt45ndixl3ujwe6nazb7xkylr424j6jifavq","megatron/__init__.py":"bafkr4ieopvgf3qe3niqqcodjrfjnnytcyc4k25mmuy3bygttwdwialzvoe","megatron/arguments.py":"bafkr4igzrbkvxccthwimrpju62qh47dgm2lis3aznibaa5cpbngjpfhpym","megatron/checkpointing.py":"bafkr4ia6drh5rgayqw5uxaii4el5hvsrki555gtwrwtsiwyghpnuokctqm","megatron/core/__init__.py":"bafkr4ib7pkvlboj45inkvxkki5vqipdda4kblehwci7dwcxuy7avvpf3c4","megatron/core/parallel_state.py":"bafkr4ig6g7czdvaokn2b6l2swqq7jeh3r7iaidu7gi73um6wfq7jbcjcqq","megatron/core/tensor_parallel/__init__.py":"bafkr4ian43egrvyimk7bh6yyhjtl6xcxforumqw7cgysblmv2j7ykkmrf4","megatron/core/tensor_parallel/cross_entropy.py":"bafkr4iclr6od64utlk5j537tsr4axhho6gqc6fvx75vip7n6t4e2isogei","megatron/core/tensor_parallel/data.py":"bafkr4ich5c3jdzydizj5qgrw6fzdbfxixkabontu3qnaug5se7vhc25j3e","megatron/core/tensor_parallel/layers.py":"bafkr4icvjvklz34dmjtzkf2rrwruk7ymfu7xj75a75roggyde462owe6zm","megatron/core/tensor_parallel/mappings.py":"bafkr4idtoj2fyy7sqanjmshssdavniucnvkrs4bao5drgvklekcl2x2qlq","megatron/core/tensor_parallel/random.py":"bafkr4ichoxk6pcvkvdk66zkkrd4bo7r3wlr6b63qm2drie27pfzijxfdhu","megatron/core/tensor_parallel/utils.py":"bafkr4iaie2wj42sp5oxyk4xfvwk6w7qw4pbnecl2u6n5eeqnaxokxj53oi","megatron/core/utils.py":"bafkr4ie7jsqjvilpayy6qw4rmvpcatjem3z76yglx6gj75dtkcyujic72u","megatron/data/Makefile":"bafkr4igpym3folhpjptgv4gl4nnm3rykogmvlsfntq6zyyvytd7lii6lvi","megatron/data/__init__.py":"bafkr4iardpskfn74ychqbdf36gkzd5chmjvyposaj3vbog54mgo2krsk7a","megatron/data/autoaugment.py":"bafkr4id7mutjdqwwkkyelmbceqa7a2zpwt2f7g6y55egpoaofuvlbypbc4","megatron/data/bert_dataset.py":"bafkr4ibze7yonzgkrvi47w7fn5hl2oe6jz3eaj5e3f3jlwz6tf7dwqpode","megatron/data/biencoder_dataset_utils.py":"bafkr4ibhrn6dg2hnlra2k42c5o6vumobarpfh7dbu7sas3ekohql7m3c2m","megatron/data/blendable_dataset.py":"bafkr4ibh6y7o6mi6cafe3fo5svlyrvhpublag3oa7v2a7wyb5bayibnzuq","megatron/data/data_samplers.py":"bafkr4ieziq6kjnmc7ed6cxjmfg5lg7j4ucr5l3fwa6qvlumya4snrbsk5m","megatron/data/dataset_utils.py":"bafkr4ibhvjabnh4dsd4n3kfirde2jmlxulofsy5pr6sqb4wzmoinz5p4bm","megatron/data/gpt_dataset.py":"bafkr4ie6u722zskhzcpqbup4e7g5qisgk4hstlq2dbluc7bnzbymmixdfe","megatron/data/helpers.cpp":"bafkr4if2ivnmlvii3tasvp2yuallup6ttnmtonjk4bs5e3gltm4capfg6q","megatron/data/ict_dataset.py":"bafkr4ihgxh7t3do2vf47halk6edkz5a53anyytgst4q2z44ykahjwpsryy","megatron/data/image_folder.py":"bafkr4ida23awij72me2hnuryzwraqfnhvf6psl352iakissie6lae7xusm","megatron/data/indexed_dataset.py":"bafkr4iddifzpm4d5xwd6yun7c4f76xizrcpahsck2ghrrm3i7ydmicil2e","megatron/data/instruction_dataset.py":"bafkr4ih3r4lavib3y45tfnxd33zguvixehvez33hons33na7d6ailhbjji","megatron/data/orqa_wiki_dataset.py":"bafkr4ih3cflg7rts25cf6ficrorga4saf2hvdpiw4ggqbnsg357evfvtym","megatron/data/realm_dataset_utils.py":"bafkr4ib63hisghbmvzrlj4qvgcvjmtgbkm4amfrrgncnkvqkwgjlwj2dsq","megatron/data/realm_index.py":"bafkr4iglgiukf7u4yit7iylw4ysxzi3a4mbjvyoxfjh75a76c5rey6spfu","megatron/data/t5_dataset.py":"bafkr4ignefkcbge7u3can7uczomznl5awk7fsejfftjfznpsggcnfb77a4","megatron/data/test/test_indexed_dataset.py":"bafkr4ibqzewfah3imviky5mvcsua5wvd4tmgglm2uf2qugeqxub7qxleca","megatron/data/test/test_preprocess_data.sh":"bafkr4igiomthwbedm2thu3w63d6vbpfse3ij6xlhdnrcaukntee3csmk4m","megatron/dist_signal_handler.py":"bafkr4ib3oattm7sysiotrgybzxcb4oody7z7dd74bzb737jvgu6hrhsoae","megatron/fp16_deprecated/loss_scaler.py":"bafkr4ihi6wj2oagzjk6tukmwovofm3o6xc2qw2bdsjmofrbhocyyqcofim","megatron/fused_kernels/__init__.py":"bafkr4iedfqv5vvuiaj5sqxr7rgspjnj7m5pynuzmjubrmckulchvrafuie","megatron/fused_kernels/compat.h":"bafkr4ibo7zwt5amj577vyn3gqz5u4oooypsd3l4bqsvapickidhbwtlmx4","megatron/fused_kernels/fused_weight_gradient_dense.cpp":"bafkr4idzcpqd6vwbxbqv4f3eody3zuzoxgfophpibs3wx2wlrklw7lowiq","megatron/fused_kernels/fused_weight_gradient_dense.cu":"bafkr4ibbzp5zdtekzq4f24nz7udjw3jk4cfax37kxk7yp45hq26jcsojju","megatron/fused_kernels/layer_norm_cuda.cpp":"bafkr4ieeuu2krrhcshejjsptvqcpkux22m6s4s6n7to64h5pu2zbjl6p34","megatron/fused_kernels/layer_norm_cuda_kernel.cu":"bafkr4iht34rjllfc73b7m2ql4xrd5aftgfvjx7qb4k2e5exfmzluvulmna","megatron/fused_kernels/scaled_masked_softmax.cpp":"bafkr4ieyfkq3dwixc6hmu5h56tu3jenfnxb5xorobaje5ptkecvldmcrsy","megatron/fused_kernels/scaled_masked_softmax.h":"bafkr4ie6cykmx2mn4c35rihupyewjlfrmqqmyswvujia3rkv4g2bb2nyda","megatron/fused_kernels/scaled_masked_softmax_cuda.cu":"bafkr4ihgurpmh6ql4k4pnx5nkto566j65xr3nhhh5e76jrlramew5ksmau","megatron/fused_kernels/scaled_softmax.cpp":"bafkr4icbec22uxcirarbtw4rt3tt4ujezugdcxouovnaxtwk24usxq4jby","megatron/fused_kernels/scaled_softmax_cuda.cu":"bafkr4ieiscxqunexzvnzhawuswekgl4tfcqxbtxz66fviwmm7xf3kj7xcy","megatron/fused_kernels/scaled_upper_triang_masked_softmax.cpp":"bafkr4idbpus2coczfkucu53ds6ai4moa57ap6aoj3jsjd4uz63zqxt4m5e","megatron/fused_kernels/scaled_upper_triang_masked_softmax.h":"bafkr4ibaxlvqeym6elfvdvve2vyjswzyi77q3sm7qvlv4ttt6fv7hqbjqm","megatron/fused_kernels/scaled_upper_triang_masked_softmax_cuda.cu":"bafkr4ig5iyi7nnqeph6trznbpp7cifdh6xg3uvpirhjtkmhv5jtt6thije","megatron/fused_kernels/tests/__init__.py":"bafkr4ifpcne3t5pzugtkaqcn5i3nzskjtpfslsnnyejlpte2spfoihzsmi","megatron/fused_kernels/tests/test_fused_kernels.py":"bafkr4igfifdyhbgqfewn7q6fbio2g36f3vxgyz3a7zcs22y7rhocqrua3i","megatron/fused_kernels/type_shim.h":"bafkr4id5jsvtdrf43mtv3b7yfqdtkkcvtacsp352nmh4zml4b4dwhgscla","megatron/global_vars.py":"bafkr4ih3f7y5eeigmk2wmnezwdagidckoeshaavhi6nlscwgys7nrvfrsm","megatron/indexer.py":"bafkr4idmvymfg4m6d6ng6um5n7n7jjrv2wyeqotgpjbmnjv52ssoq6hq2q","megatron/initialize.py":"bafkr4ifbwcmnwo7e6nnmqr3ic73ivhbhwb627fh4yddswjhc4da6fungny","megatron/memory.py":"bafkr4id5crsdedwyjjgoy7afdihodvbkibywvarw57bb4gkw34cg35jmw4","megatron/metrics.py":"bafkr4ihq4awf3b2o4mckw3a6u725swqgtvh4shrtjscvse3dpdppayozfq","megatron/microbatches.py":"bafkr4icxlex7vjuwloc3ysy4w4nc5l25ltl6bq47it6tzitbd3zv3wbedq","megatron/model/__init__.py":"bafkr4ico23ekmeehmrdk5qjkhepdwm5hszwhr55pvmxxll4jechspov5cy","megatron/model/bert_model.py":"bafkr4ie76pcmxqa6uat3ewumcfablvfssis5mcbtwke4o66pnrntx56fum","megatron/model/biencoder_model.py":"bafkr4ic4nhufpy33krnsjoc755igxjry73d73chmfl3fmexgk6bli5i7yy","megatron/model/classification.py":"bafkr4ibj6xqxqwkxwr2253n6rq2cwxjkcgvadfcfknbspljziv2zsbunxq","megatron/model/distributed.py":"bafkr4iffvpvz3s3z62zapvvdtewzlqxgwzngfy3yere2pq3kfqs53k67iy","megatron/model/enums.py":"bafkr4icdzfxgtf7iqcxqvhcgdwymtse67apxbsittkii5qmyzszbb2up7q","megatron/model/falcon_model.py":"bafkr4ifaf7xgymq22oaewwm7hz67qfytoe36323gje5mbbdumerxyvcpf4","megatron/model/fused_bias_gelu.py":"bafkr4ifobduyhw6z3a6u2esbzv3ovxc3e2kkggignvqg6ckzaovskzbrnu","megatron/model/fused_layer_norm.py":"bafkr4igckp6srwcb2s6afobjmpob2j7qa2opfkruisaj7qpvaan6q2z4u4","megatron/model/fused_softmax.py":"bafkr4igraaf6ultjrdruhr653wuobtepx5opj23p2q2jza27bj25krkxla","megatron/model/glu_activations.py":"bafkr4iewdvm6t2i5rnzvicf3zk43ejtnjolgdrh4qluc3zeyyqmorq4kza","megatron/model/gpt_model.py":"bafkr4ihg4k6toqmdfviq46apbfv7ixamzwijmmwez4e2yakgkumfj6763y","megatron/model/language_model.py":"bafkr4ieqkybwaudvj7xc2dzhfywvaww7mmgvgg3v55qdfwkcyx6yvbsnsq","megatron/model/llama_model.py":"bafkr4idjknvcxulssq5jdtshdtu22x4bvqoiwxwh6nmehgfs2d72ak7lmi","megatron/model/mistral_model.py":"bafkr4icurzbqtx2aihqidp7nqhrhohquq6ccetyfnvc2wdawvyghnnld6u","megatron/model/module.py":"bafkr4iby2niclsoawpnss7felfxkggmd55mvoymcomvceq67dgr2bkqoq4","megatron/model/multiple_choice.py":"bafkr4ie4fr277llgssmhz5lnlxzq7uqlgx4pn4cglbz6w67u2t6vttcfvq","megatron/model/positional_embeddings.py":"bafkr4ig2jeadpwpudwkunuw5p6mrn5xeaudv4dpgnqz2cveyy7jjgrz4xy","megatron/model/t5_model.py":"bafkr4ic22bnt6wzo2ogokhergoiw6vvuupknflmsrjnxqa3u4zpjh6luya","megatron/model/transformer.py":"bafkr4idbvr2i5auxecdrucx2i6xemlqajqxl662jvtuzq5afrp5jxc5yi4","megatron/model/utils.py":"bafkr4ibsepqdtgq7gyyirsa2wuqss47jpcaijinq2utky54ulzpqlvjgsm","megatron/mpu/tests/__init__.py":"bafkr4ifpcne3t5pzugtkaqcn5i3nzskjtpfslsnnyejlpte2spfoihzsmi","megatron/mpu/tests/commons.py":"bafkr4ig5eg7zczpppicmxkjy7xwfzqebwcq77vfodxkxyc6zuqemr6ob4u","megatron/mpu/tests/test_cross_entropy.py":"bafkr4ifp4cp3glfrsahqb5zdnap3yr3w7n2go5itcskecueocg63ercqke","megatron/mpu/tests/test_data.py":"bafkr4icvyofvovvkcish2z7k7ixolm66w35gi35tnrur2h4j4puo24k42m","megatron/mpu/tests/test_initialize.py":"bafkr4iax5btesyody2ftvfxp776vumhtjy4jm63ndhhpdsziloxqmu7xhm","megatron/mpu/tests/test_layers.py":"bafkr4ibngqqgowclygtc2hf76xawkl6dniffafmtiiy4h7qlnpj65z2eb4","megatron/mpu/tests/test_random.py":"bafkr4idbzodgjsc5przr2kdxpjh56jyybiso2rlirx6ojgr7la7l6jvuu4","megatron/optimizer/__init__.py":"bafkr4ic22qookq4xt54jlixikrqhyg7v7653oyrj6zsleyp5dqiptwd224","megatron/optimizer/clip_grads.py":"bafkr4ib2mmyzatcv6rgbkc2fxzdvceq2nkiwmbj6o22pityztmmhy6nmue","megatron/optimizer/distrib_optimizer.py":"bafkr4ialtg4x7letfuqhposok53xeqpng44xrwet4a3o7sheydeco2kmpa","megatron/optimizer/grad_scaler.py":"bafkr4iallaykq3xgrmv7kifusjn7betskigotzug3ifmvmxxdsejrhnj2e","megatron/optimizer/optimizer.py":"bafkr4ifscocrx4t2j6sbf7z4gbqs6mvbaccxrnjgsehaw3dd54joay3v2i","megatron/optimizer_param_scheduler.py":"bafkr4iffya24yedufc4bd6rfzfqscnawvlaty5bddqvakw2ivf2magw5ei","megatron/p2p_communication.py":"bafkr4idlmel225p5qrq4naz37yh6kzex57ihvdzubxpiu6kyb7lv2thave","megatron/schedules.py":"bafkr4ifwsss22dmxchh6lb44txcydhyuo2n555lpssyi2vz6v5zprchcrm","megatron/static/index.html":"bafkr4iaxlgaaanteugznsokgnstxsbouytxlors337uruk6ktnj7c2vgf4","megatron/text_generation/__init__.py":"bafkr4ia6k7g5nrbseoo3i6t7vgxkirnoqnikhk3jtsicriednrukpxivb4","megatron/text_generation/api.py":"bafkr4ige6fxv526j4d6g5kxrmbi2udsw4knz65xypxxgilt5dzp67xbu7y","megatron/text_generation/beam_utils.py":"bafkr4iai5wdtpymcuhugjypt2rpvy3deislnzmm7wz4wshcwy2ucovbn4u","megatron/text_generation/communication.py":"bafkr4ient5al7eg5g63jswiakfhv2pct2mj5etcbpq4lazqjrvc2fymzgm","megatron/text_generation/forward_step.py":"bafkr4igze2xhsuwwcra7c6yjr4rogkzxisdxpaero4fp6qt6wsl2bhppjm","megatron/text_generation/generation.py":"bafkr4ihzahqxndqeehfrcu4ddmdy7l7z5o2jdvyxrsa3srmr477erg3gly","megatron/text_generation/sampling.py":"bafkr4ibaph5zwuclpvpk5gyyyoytl42ixpamgksueye45a6ullar3k4n6e","megatron/text_generation/tokenization.py":"bafkr4ieuxeuilhwyr2ytpob4x2bkge77yo6rpr7cinzmnlu6hmal2xw5ae","megatron/text_generation_server.py":"bafkr4ice2dbcaew3v7kjs7oiziwydtkso6wihqxwxojeqb4hbxbjhy6dum","megatron/timers.py":"bafkr4igjxp7ddf5xx4ko6hfk7oltmaus56yak5dqjbyiwow4zxfskvpkwq","megatron/tokenizer/__init__.py":"bafkr4idwhuzos4ggpuh3xdwf5mavwh2v4gpbvxas2vtuakywjbx3tfrdnu","megatron/tokenizer/bert_tokenization.py":"bafkr4if6ccjfeluvozuxqbmvwyimuvkz42jqbmauzq62z4xnjecgqdevve","megatron/tokenizer/gpt2_tokenization.py":"bafkr4id46iuy4ejuavadapp5vgpdp5yvcrwda4rubwvrhgmdsvrhczteei","megatron/tokenizer/tokenizer.py":"bafkr4idl3ugcuapbomibjztfps5osiuapapojzzjynrd5zocxwgw37e7hm","megatron/training.py":"bafkr4ibdy32kwryq66vkf4qgi2tg5efav3eycna6h5475oqyyfmdqniemu","megatron/utils.py":"bafkr4icdjcejxfd5aagx6anana5he4v2myg7cdnpvzl2i6rm4cf65cf3cu","megatron/wandb_logger.py":"bafkr4ig72julyu5rzenphllggpbd6oz6zfebvgj34xwrjab327mog4mbwe","pretrain_bert.py":"bafkr4idwyih47aqpvsplulz2td27zhpdqoxtrusch43ndjzzctnwzm3yo4","pretrain_ict.py":"bafkr4icr54szvd2qfplw6656ch2unyxuhquig2tstqi74d2temj2xt7d6a","pretrain_t5.py":"bafkr4ifmvgfewn4oa4vs4enn5wubolc7okje2rracojmxrlw7gptilvjh4","requirements.txt":"bafkr4igxf35kaa2psknhybmjzvzolx7kxzuvrzuc7gnhl4uvhrwigawzlu","setup.py":"bafkr4if6qjfbm2dvk7cc6qjyzuly6kfyupc266dympeymwtbwueei6kxea","tasks/data_utils.py":"bafkr4ighsssbf3ut4zqcvoalfotp7f6krj2p7laflalfw4kbhnipwyfbl4","tasks/eval_utils.py":"bafkr4igqsmtakumugnptujbqh63olp4ese3qs3bnu44ca7lqrmq7ogihqi","tasks/finetune_utils.py":"bafkr4iblfn4pvm7td6sskxrzbp45c4vrbsix43ki3k26hsvus4ffueb2di","tasks/glue/data.py":"bafkr4ibpbrxkgysnuileqmgystiplvl2q6gtbj346jn5qvmxjoebrgxvpi","tasks/glue/finetune.py":"bafkr4ib57wqqoqgo5oswx65bypcqcgmlr6m7kn77wfcthugq5lg3dynqim","tasks/glue/mnli.py":"bafkr4iha4semgnsibtbuzcyjjb4btxziaiurcgffvhbrrlhbvtgdqz2pqq","tasks/glue/qqp.py":"bafkr4ieuvyr627lgyztxoludrgotrfc6qvjovcxn6mg53muo7saiamitii","tasks/main.py":"bafkr4iay7z7dni4qvh6os7fouqhr4buog7illfpvg264s3uhgnrnehiwpa","tasks/msdp/README.md":"bafkr4id5gu2hvj7h2ipwlefwbubuxk52ieqateih4lsbfyqxf55hd6v4ye","tasks/msdp/evaluate.py":"bafkr4iaul3uwf4m5uimg7gcxamaqwvwmwfkmgv6iaffjkmyywy4mp3ymku","tasks/msdp/main.py":"bafkr4iecmumc7mtvcgwaafetwy2bzisc6g5jhg3xrokn4xiltnmd6ls3ey","tasks/msdp/metrics.py":"bafkr4igspizwhpali75q2zzx36o3mnxpgiieqpztfi5lsdp5fsmrqhv42y","tasks/msdp/preprocessing.py":"bafkr4ieeje6yxtzatdwy6e6javp6rpzftob6coqkphc2xhejmnw4z2df6e","tasks/msdp/prompt.py":"bafkr4iaaqqfsvxyuiwaaxnkppiwjuqepyo2hn4sqqnjrna27lxq57funqi","tasks/orqa/README.md":"bafkr4igrnpfx5sq3xdqxodl3h2qqzj745fu7pq2jszxf7yrsc6lxd2ctha","tasks/orqa/evaluate_orqa.py":"bafkr4ifyxbiwu6o6mrocj77s323glnjlgrzlotmpyqtj7cwlwb4f5jy35a","tasks/orqa/evaluate_utils.py":"bafkr4ibj26cuhoazrdgycbls36f25pef24ijo5mdzybblsoect5pzlu2ju","tasks/orqa/supervised/data.py":"bafkr4ihxzir6wr3p5ws23p2j6dwnwgoo7g4lgaj42shxobn2gwo5i7ueiu","tasks/orqa/supervised/eval_utils.py":"bafkr4ifgctzao5anbkmmptizbhkgha5vekmuhuk6txh2clmk2vy2okc2ue","tasks/orqa/supervised/finetune.py":"bafkr4ibthbawu7vibdfbdmq7mq745zetepkmi7hsyigt2g7cgoislaaxki","tasks/orqa/unsupervised/nq.py":"bafkr4ibqenaaukusjbdyz5xrmyjpi37zsfujfev66nzikalcth7y4nqame","tasks/orqa/unsupervised/qa_utils.py":"bafkr4icjfoolyoo2fda5rr4f36ii2es2i7xzpi76nqqjdnaiitobe4vsva","tasks/orqa/unsupervised/tokenizers.py":"bafkr4ihru2z2q4rhkyxvubhupg5sxi4dh3mgpgp5ddl2hiiw2gzlaq4wvq","tasks/race/data.py":"bafkr4iclkbubgqrcopvfmllusj74k5ftcalvqaeui2twnglr3tkpv3gqsu","tasks/race/finetune.py":"bafkr4idnhhq7vb3ikafpmkrepdpq726r7tmwmz3pxlv4ito4j7rjwjnsxy","tasks/zeroshot_gpt/datasets.py":"bafkr4igv3htl444cfp7ek3fnwirzqhovyhtvlser55gcrhj3xjbt27ffgy","tasks/zeroshot_gpt/detokenizer.py":"bafkr4iceji76nxln6r4jkn4zorkzvgykb5s4ymfajzmrmi46clfj2qehri","tasks/zeroshot_gpt/evaluate.py":"bafkr4idj4zusotl2ao3t24mqsvjpcuah6y6fgrmfsgc7bjdqq54ept34tu","tests/__init__.py":"bafkr4ifpcne3t5pzugtkaqcn5i3nzskjtpfslsnnyejlpte2spfoihzsmi","tests/conftest.py":"bafkr4icpqbjjmasqtlbwgqaqn7qysmexaxjeabmzxcp4lps2wrg2zd6ws4","tests/pytest.ini":"bafkr4ihdse24mnybtoyzct7nu7feik6ipesj77hem7rfqdlhlzz5amk5su","tests/tensor_parallel/test_cross_entropy.py":"bafkr4iatffa64rs63hyxcq3x7ybeisn6rwnjoe62rp6w2hlnbgl4omoyoi","tests/tensor_parallel/test_data.py":"bafkr4igond2dzro2vditaxxiqcmndgr3x4kfvpyde3yo4gu4ocl276ivq4","tests/tensor_parallel/test_mappings.py":"bafkr4ig6fpsotbfvtff6t67nzvrxfhemaraxi2mgzzhqf2vvqhnyahahba","tests/tensor_parallel/test_random.py":"bafkr4ietwhj5kfqom34wgfjop4gthvh2ta6pyiunpbvkyxzwzezqpqt4bq","tests/tensor_parallel/test_tensor_parallel_utils.py":"bafkr4iakztjohka27s5sde2ambjfyfc576odjuh63a3qhd7lxmjj7zjnsm","tests/test_activations.py":"bafkr4ic4k4n2pihp6kjgzyn4qmahpgocktu647fa7cywrpfe37brsyksnm","tests/test_basic.py":"bafkr4ibnklfphrllf77m3prqa446zx667trbrsgvszlfwkkmzm72sqysvi","tests/test_layernorm_order.py":"bafkr4ibzftkcwvotwn3cnm4oamyel7zi4witz7y7jtaw5ohi4rpybnrvga","tests/test_llama_weights.py":"bafkr4ihixur2xayihdesg5vjr6j2lqwkklieid3u2v3h7cf66c7z2n2xam","tests/test_parallel_state.py":"bafkr4igympi2llmos6x7pk2uqni7tc4mwkzhu7q3q2mxhoybyipgoegjbm","tests/test_utilities.py":"bafkr4ieqaniglv3nrvuhwld7wvlg2evtehhnjldtw3dhwvv5vkz2kzpjai","tests/test_utils.py":"bafkr4ico5hgy6spy3m3ny2nwithgmnfagh5ofpal4hpsd32alb3ymgivbq","tests/test_wandb.py":"bafkr4ichkknqqh3vt7pciakzt2trw6h6fhvec4owd2w2v3zz7envnnnjoy","tools/checkpoint_loader_megatron.py":"bafkr4if2w2xyddq2vbyfbw6whzn6kcu33zzmdowvvhbcqnhcephpb762ie","tools/checkpoint_saver_megatron.py":"bafkr4icxcb2afvs4k2zypy3ubryzzxtxrkgz6lpcgzw3ygooegvaij76ea","tools/checkpoint_util.py":"bafkr4igezvds7ud3hgnzqmc2aamny4k2cstkwyhf47cpho7qmkcdnbsfc4","tools/linter.py":"bafkr4ibt2ygdwakfpy7e3dsylihdbsnotscxinvk4ciojtdd4jwsmzjuma","tools/merge_datasets.py":"bafkr4ihcmtxhprin24uyq3csgo3lkmeyezijilccdcs55dafwh54grhmfy","tools/openwebtext/README.md":"bafkr4ifkxqziifjgteiynfz3jcj5egsjmrtjmnb6a2n5pmjwh3lonesqlu","tools/openwebtext/add_id.py":"bafkr4ifvimn5xv2z5w5xoq3rfn6ng3i2ymvwe63dwntu6j2qpta2jspxhm","tools/openwebtext/blacklist_urls.py":"bafkr4ictvnrojkedjj5hd22wj7shho22iyq6efbihtzzn6xr3ke2f4yb4u","tools/openwebtext/cleanup_dataset.py":"bafkr4igvxcri62iaql32vmlrzf6jirsmfvrm7a5zif72fqpqpoupdkgkdm","tools/openwebtext/cleanup_fix_dataset.py":"bafkr4ifozgfvdr4ob4fsashd4pk23mtzoe3miklqkthn2jgtmmhxkjm2cy","tools/openwebtext/filter_ngrams.py":"bafkr4ibqr5ubfusg3o7bcbm4ndgfalpvqj2qmkdcfxhhvilyksdt7a7ujq","tools/openwebtext/find_duplicates.py":"bafkr4ifjattzomvhxvpywffrbeyp7fv6xwla4wevuemcoytkjnjikhnlye","tools/openwebtext/group_duplicate_url.py":"bafkr4igp5lpuawji6ujs5tr4rtoecz4vnaikjyfclntzgehjkk6worjyem","tools/openwebtext/merge_jsons.py":"bafkr4iap657rnoy6ukc3bftyu5rvmuzajgs3vmz5cwl2b4j3jg6yfno2ay","tools/openwebtext/remove_group_duplicates.py":"bafkr4ige73e627bfdxeqlkw72giavynl75wclkaobk6uz7r736kungxd2q","tools/preprocess_data.py":"bafkr4ia5qq5let6slhvtoidvqku7vedpqsfftngebgfh6sps3fr7nsaohu","tools/preprocess_instruct_data.py":"bafkr4ic6woe4xp6siycqsxbawvehmnwpbolatdms2ffv6qyr6uhn7lgu3i","tools/push_to_hub.py":"bafkr4ih5awzqkygbnsaycl3vywsqvfz4oax72vuceeljibluf7lqzmb45e","tools/run_text_generation_server.py":"bafkr4idmeqsxxvmjsiigvjyp2qn4evgr7brngzfrp6arrid3qshxgnhc5q","tools/text_generation_cli.py":"bafkr4ict6iluxwcya7xzzn3g37jujnkbc54f6m5mq7dqu764kqafzap77m","verify_correctness.py":"bafkr4ifj6bmaq3hg6xnmltz2hp54ea4243sccf3l23edq3hlv5lwyolutm","weights_conversion/hf_to_megatron.py":"bafkr4iepkfzdpgj3y3s3intw73scw3nqaaxzq4m6im7ggpbfg5m3yjgjbq","weights_conversion/megatron_to_hf.py":"bafkr4ifrhamb4aiklkj7swrv36l6uxx3lbdmg7pzdq56qzyhgatuglrlfa","weights_conversion/utils/__init__.py":"bafkr4ibdybzb7al37nxkxwzvpbuimpuw2tvvik7esyrul3mp5mbg4hjpta","weights_conversion/utils/merge_llama.py":"bafkr4ig2jl4f7wsutb34irephanu4nglalzgge4kp4lmmbmjriskx553l4","weights_conversion/utils/permute_qkv.py":"bafkr4idkoo6b2kw7oo5paxfpplywqc3qqyif67cjemixalh77ry7upx5me"} |