diff --git "a/ndarray-cache.json" "b/ndarray-cache.json" new file mode 100644--- /dev/null +++ "b/ndarray-cache.json" @@ -0,0 +1,4067 @@ +{ + "metadata": { + "ParamSize": 327 + }, + "records": [ + { + "dataPath": "params_shard_0.bin", + "format": "raw-shard", + "nbytes": 40960000, + "records": [ + { + "name": "param_0", + "shape": [ + 32000, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 40960000, + "byteOffset": 0 + } + ], + "md5sum": "38a5852e50166528e5b7f0ea135045bf" + }, + { + "dataPath": "params_shard_1.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_6", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "dbd608b0ba9d0839a9a388efae021a98" + }, + { + "dataPath": "params_shard_2.bin", + "format": "raw-shard", + "nbytes": 32040960, + "records": [ + { + "name": "param_1", + "shape": [ + 32000, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120000, + "byteOffset": 0 + }, + { + "name": "param_2", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 5120000 + }, + { + "name": "param_3", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 14950400 + }, + { + "name": "param_4", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 16179200 + }, + { + "name": "param_5", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 19456000 + }, + { + "name": "param_7", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 19865600 + }, + { + "name": "param_8", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 22077440 + }, + { + "name": "param_9", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 30924800 + }, + { + "name": "param_10", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 32030720 + }, + { + "name": "param_11", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 32035840 + } + ], + "md5sum": "fa3a360bc9528aef158882dfeee04184" + }, + { + "dataPath": "params_shard_3.bin", + "format": "raw-shard", + "nbytes": 32440320, + "records": [ + { + "name": "param_12", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 0 + }, + { + "name": "param_13", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 9830400 + }, + { + "name": "param_14", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 11059200 + }, + { + "name": "param_15", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 14336000 + }, + { + "name": "param_16", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 14745600 + } + ], + "md5sum": "e0681a5ff19de3529216af6238dce9e1" + }, + { + "dataPath": "params_shard_4.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_26", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "63af423be9eebcc68604abacaa7eb5fc" + }, + { + "dataPath": "params_shard_5.bin", + "format": "raw-shard", + "nbytes": 29132800, + "records": [ + { + "name": "param_17", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 0 + }, + { + "name": "param_18", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 2211840 + }, + { + "name": "param_19", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 11059200 + }, + { + "name": "param_20", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 12165120 + }, + { + "name": "param_21", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 12170240 + }, + { + "name": "param_22", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 12175360 + }, + { + "name": "param_23", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 22005760 + }, + { + "name": "param_24", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 23234560 + }, + { + "name": "param_25", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 26511360 + }, + { + "name": "param_27", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 26920960 + } + ], + "md5sum": "17e00e28d96b73067d6e8fd90299774a" + }, + { + "dataPath": "params_shard_6.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_36", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "821b777cc10f8d623547235510e7b903" + }, + { + "dataPath": "params_shard_7.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_28", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_29", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_30", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_31", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_32", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_33", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_34", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_35", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_37", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "d7e2a2c3c2e60269f40b65e2ace80fa5" + }, + { + "dataPath": "params_shard_8.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_46", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "b8a24449dba8fd0840ee3be024c2eb71" + }, + { + "dataPath": "params_shard_9.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_38", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_39", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_40", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_41", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_42", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_43", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_44", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_45", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_47", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "e4bace3710532b9642dda05904391d97" + }, + { + "dataPath": "params_shard_10.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_56", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "bcd80e4f9834b6940bee42a9dcab9737" + }, + { + "dataPath": "params_shard_11.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_48", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_49", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_50", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_51", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_52", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_53", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_54", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_55", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_57", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "aa8e60f169ac5ed4b3ee7e2b667a0478" + }, + { + "dataPath": "params_shard_12.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_66", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "68e958a0a04b1b14301ed6a52a9ae25a" + }, + { + "dataPath": "params_shard_13.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_58", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_59", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_60", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_61", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_62", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_63", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_64", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_65", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_67", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "c3e33356ddc72685b6fc52e4226f408c" + }, + { + "dataPath": "params_shard_14.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_76", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "fcdb1c0d91b15c32c0df808639a49634" + }, + { + "dataPath": "params_shard_15.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_68", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_69", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_70", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_71", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_72", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_73", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_74", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_75", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_77", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "028e9b790770fc970a15a6c9830eafa0" + }, + { + "dataPath": "params_shard_16.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_86", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "74a7b1eaa0f44d1d13280ca48de50b5f" + }, + { + "dataPath": "params_shard_17.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_78", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_79", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_80", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_81", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_82", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_83", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_84", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_85", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_87", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "f790b29f4f2fe1f2d76fd3699c3c6a90" + }, + { + "dataPath": "params_shard_18.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_96", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "0c5e3dc5d5abe8dc07bcf854df2abe8f" + }, + { + "dataPath": "params_shard_19.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_88", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_89", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_90", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_91", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_92", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_93", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_94", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_95", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_97", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "22046b0690f4ca44bbb585ff4f3da3b5" + }, + { + "dataPath": "params_shard_20.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_106", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "0660425b174dbaf3b50aa192e68646e1" + }, + { + "dataPath": "params_shard_21.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_98", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_99", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_100", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_101", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_102", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_103", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_104", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_105", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_107", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "46cf8c19d2817540ba3d72f62c7b6d29" + }, + { + "dataPath": "params_shard_22.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_116", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "15bca81e45385438bed5124850c72717" + }, + { + "dataPath": "params_shard_23.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_108", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_109", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_110", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_111", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_112", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_113", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_114", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_115", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_117", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "c5650fdc0087f8b28ce5ebe4e73cc074" + }, + { + "dataPath": "params_shard_24.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_126", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "5b9026a5a6a133f7d969e91dab31fdcb" + }, + { + "dataPath": "params_shard_25.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_118", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_119", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_120", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_121", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_122", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_123", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_124", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_125", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_127", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "fc0c57eb40f78c1183b015d835539573" + }, + { + "dataPath": "params_shard_26.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_136", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "8146e0c15432e54b013aa84a7f7a66ed" + }, + { + "dataPath": "params_shard_27.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_128", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_129", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_130", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_131", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_132", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_133", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_134", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_135", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_137", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "c5d52d43cafde79b652540e86dc05f7d" + }, + { + "dataPath": "params_shard_28.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_146", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "aecbc1e69c928488822f18cf1b99fdb9" + }, + { + "dataPath": "params_shard_29.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_138", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_139", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_140", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_141", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_142", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_143", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_144", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_145", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_147", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "1586ed0ba8ba0e4c5e689c654e96191c" + }, + { + "dataPath": "params_shard_30.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_156", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "ab3a1039b873a8e41815f9b3b78e4e7c" + }, + { + "dataPath": "params_shard_31.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_148", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_149", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_150", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_151", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_152", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_153", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_154", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_155", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_157", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "e768a69a215097660537f441b9f8763b" + }, + { + "dataPath": "params_shard_32.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_166", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "c20162e6b341d1013f4a87d31a1fcc06" + }, + { + "dataPath": "params_shard_33.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_158", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_159", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_160", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_161", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_162", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_163", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_164", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_165", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_167", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "dd1a14e603278c4fafe9833f8ecd2cfc" + }, + { + "dataPath": "params_shard_34.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_176", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "0b5d75176cd9fb0a1511f42625fcb541" + }, + { + "dataPath": "params_shard_35.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_168", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_169", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_170", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_171", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_172", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_173", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_174", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_175", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_177", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "4d084f06d880bbb1a0c61a4d5ed2dc3c" + }, + { + "dataPath": "params_shard_36.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_186", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "ef25801bc5e2a64941ad0916209a4b81" + }, + { + "dataPath": "params_shard_37.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_178", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_179", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_180", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_181", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_182", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_183", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_184", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_185", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_187", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "3033c678913a1fced2b88a913377b961" + }, + { + "dataPath": "params_shard_38.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_196", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "879702f8e1effbde71ec852699b75e16" + }, + { + "dataPath": "params_shard_39.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_188", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_189", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_190", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_191", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_192", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_193", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_194", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_195", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_197", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "5a16678a0feeba1b2d68a53689657915" + }, + { + "dataPath": "params_shard_40.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_206", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "87827ef77be01a0e0b8a38a24f956990" + }, + { + "dataPath": "params_shard_41.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_198", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_199", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_200", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_201", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_202", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_203", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_204", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_205", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_207", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "5937f0f8c3000aeeb4806d136f02b1b1" + }, + { + "dataPath": "params_shard_42.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_216", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "00a1278e1865f929ccd56eb1c0332d13" + }, + { + "dataPath": "params_shard_43.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_208", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_209", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_210", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_211", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_212", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_213", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_214", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_215", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_217", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "15a4c5e02fadb8219500d7de2122cf45" + }, + { + "dataPath": "params_shard_44.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_226", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "f406f2438f445c007a3e0f23c729b024" + }, + { + "dataPath": "params_shard_45.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_218", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_219", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_220", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_221", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_222", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_223", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_224", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_225", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_227", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "3635830a67021725ce0d679a6c1bc36a" + }, + { + "dataPath": "params_shard_46.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_236", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "0adb68805b52a3059298bece193b268f" + }, + { + "dataPath": "params_shard_47.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_228", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_229", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_230", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_231", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_232", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_233", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_234", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_235", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_237", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "1a5269a47838514eb797b00cdabfac96" + }, + { + "dataPath": "params_shard_48.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_246", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "215987c7b753497cb75e5c80c7055daa" + }, + { + "dataPath": "params_shard_49.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_238", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_239", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_240", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_241", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_242", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_243", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_244", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_245", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_247", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "fd0c8aed5bbc35ed94e21b68e55a9a46" + }, + { + "dataPath": "params_shard_50.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_256", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "f17f8e52c6b6bc8e713324389d8c05c2" + }, + { + "dataPath": "params_shard_51.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_248", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_249", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_250", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_251", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_252", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_253", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_254", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_255", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_257", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "8948b22ec3fc09e97a1e8ad8de8767ea" + }, + { + "dataPath": "params_shard_52.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_266", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "39b85a82364429daaed853a4a72d8ccb" + }, + { + "dataPath": "params_shard_53.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_258", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_259", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_260", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_261", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_262", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_263", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_264", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_265", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_267", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "1b58b2bcfcd8c2a242a593b148f32250" + }, + { + "dataPath": "params_shard_54.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_276", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "d2674e52f3ba70fb7a8c09bcc8df24db" + }, + { + "dataPath": "params_shard_55.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_268", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_269", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_270", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_271", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_272", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_273", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_274", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_275", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_277", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "4fd6eb3abc9789bafade311355d9c8ff" + }, + { + "dataPath": "params_shard_56.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_286", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "45a9d94413252c5bdf653b0088199e25" + }, + { + "dataPath": "params_shard_57.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_278", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_279", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_280", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_281", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_282", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_283", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_284", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_285", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_287", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "a3dabd752dce695c37122c3715d4485b" + }, + { + "dataPath": "params_shard_58.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_296", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "8973a98d0e1a32e174fc4340687a11b1" + }, + { + "dataPath": "params_shard_59.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_288", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_289", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_290", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_291", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_292", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_293", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_294", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_295", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_297", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "0d17c2e04112f9696a4ee0e5d718dcfd" + }, + { + "dataPath": "params_shard_60.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_306", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "d2b5fd048176f535961b1e6c161f4637" + }, + { + "dataPath": "params_shard_61.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_298", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_299", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_300", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_301", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_302", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_303", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_304", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_305", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_307", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "506d2eb25ae626e8b5d36473eb96b669" + }, + { + "dataPath": "params_shard_62.bin", + "format": "raw-shard", + "nbytes": 17694720, + "records": [ + { + "name": "param_316", + "shape": [ + 13824, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 0 + } + ], + "md5sum": "ae13aa3c333abb1715b8a1f559a6e383" + }, + { + "dataPath": "params_shard_63.bin", + "format": "raw-shard", + "nbytes": 26920960, + "records": [ + { + "name": "param_308", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_309", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_310", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_311", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_312", + "shape": [ + 7680, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9830400, + "byteOffset": 9963520 + }, + { + "name": "param_313", + "shape": [ + 7680, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19793920 + }, + { + "name": "param_314", + "shape": [ + 2560, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 3276800, + "byteOffset": 21022720 + }, + { + "name": "param_315", + "shape": [ + 2560, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 24299520 + }, + { + "name": "param_317", + "shape": [ + 13824, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 24709120 + } + ], + "md5sum": "33a93a79323cc8dd018950322315950b" + }, + { + "dataPath": "params_shard_64.bin", + "format": "raw-shard", + "nbytes": 40960000, + "records": [ + { + "name": "param_323", + "shape": [ + 32000, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 40960000, + "byteOffset": 0 + } + ], + "md5sum": "b1bc9c20f7ad3559cf5df4c7dbfa6195" + }, + { + "dataPath": "params_shard_65.bin", + "format": "raw-shard", + "nbytes": 16137216, + "records": [ + { + "name": "param_318", + "shape": [ + 2560, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8847360, + "byteOffset": 0 + }, + { + "name": "param_319", + "shape": [ + 2560, + 216 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 8847360 + }, + { + "name": "param_320", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9953280 + }, + { + "name": "param_321", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9958400 + }, + { + "name": "param_322", + "shape": [ + 2560 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120, + "byteOffset": 9963520 + }, + { + "name": "param_324", + "shape": [ + 32000, + 80 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5120000, + "byteOffset": 9968640 + }, + { + "name": "param_325", + "shape": [ + 2048, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 524288, + "byteOffset": 15088640 + }, + { + "name": "param_326", + "shape": [ + 2048, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 524288, + "byteOffset": 15612928 + } + ], + "md5sum": "2ae8dcb02075e37ae3d98ce072e13283" + } + ] +} \ No newline at end of file