diff --git "a/ndarray-cache.json" "b/ndarray-cache.json" new file mode 100644--- /dev/null +++ "b/ndarray-cache.json" @@ -0,0 +1,4395 @@ +{ + "metadata": { + "ParamSize": 327 + }, + "records": [ + { + "dataPath": "params_shard_0.bin", + "format": "raw-shard", + "nbytes": 65540096, + "records": [ + { + "name": "param_0", + "shape": [ + 32002, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 65540096, + "byteOffset": 0 + } + ], + "md5sum": "9cb124d2f411408db1bcde6d8e976343" + }, + { + "dataPath": "params_shard_1.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_6", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "0e9c3348ca4b7cae07a8a758ce8eb124" + }, + { + "dataPath": "params_shard_2.bin", + "format": "raw-shard", + "nbytes": 31785472, + "records": [ + { + "name": "param_1", + "shape": [ + 32002, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192512, + "byteOffset": 0 + }, + { + "name": "param_2", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 8192512 + }, + { + "name": "param_3", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 20775424 + }, + { + "name": "param_4", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 22348288 + }, + { + "name": "param_5", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 30736896 + } + ], + "md5sum": "b48c498d282a3c2c085ea04623e4686e" + }, + { + "dataPath": "params_shard_3.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_8", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "7c8550330f43255911b0c3450283b33e" + }, + { + "dataPath": "params_shard_4.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_7", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_9", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_10", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_11", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_12", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_13", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "db1264ae307213b6f71ef5510bd17d1c" + }, + { + "dataPath": "params_shard_5.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_16", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "9740dd25a0815e16953bbc3b2abd4d08" + }, + { + "dataPath": "params_shard_6.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_18", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "305f70a5502c75841d21ccf83040ff40" + }, + { + "dataPath": "params_shard_7.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_14", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_15", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_17", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_19", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_20", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_21", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_22", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "16f341f2f6e96610de6c4ef04befd3e3" + }, + { + "dataPath": "params_shard_8.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_26", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "0e6aa1f5b82445b8c229fa395aa1b45e" + }, + { + "dataPath": "params_shard_9.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_28", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "7d10f8bd8b7cd84b3ae3d1e86ae97359" + }, + { + "dataPath": "params_shard_10.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_23", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_24", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_25", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_27", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_29", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_30", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_31", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "1b085e9527880d83af99aeb0d00045dc" + }, + { + "dataPath": "params_shard_11.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_36", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "1e80f79c72a1a6be5d8e19bd00b67d50" + }, + { + "dataPath": "params_shard_12.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_38", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "18184ab1071248dc87f15abd82be3118" + }, + { + "dataPath": "params_shard_13.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_32", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_33", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_34", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_35", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_37", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "aa26ef1f115aeec2de28c878077bc5b7" + }, + { + "dataPath": "params_shard_14.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_46", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "6fe3fc0d11cc3959ce751795d4c29812" + }, + { + "dataPath": "params_shard_15.bin", + "format": "raw-shard", + "nbytes": 27279360, + "records": [ + { + "name": "param_39", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_40", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_41", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_42", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3686400 + }, + { + "name": "param_43", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 16269312 + }, + { + "name": "param_44", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 17842176 + }, + { + "name": "param_45", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 26230784 + } + ], + "md5sum": "09df7bf839582d262a70872f0a84cbd3" + }, + { + "dataPath": "params_shard_16.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_48", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "736720c518fa0367d045c2767e8a4683" + }, + { + "dataPath": "params_shard_17.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_47", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_49", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_50", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_51", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_52", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_53", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "4ddc112aa10d8692a4383445b604f59a" + }, + { + "dataPath": "params_shard_18.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_56", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "19e5441268075c7650825b58e2c9f63f" + }, + { + "dataPath": "params_shard_19.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_58", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "4299858dfd39b1f89799a4ec553295eb" + }, + { + "dataPath": "params_shard_20.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_54", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_55", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_57", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_59", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_60", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_61", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_62", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "dcee462247d4382e8fbc3e401d6dc630" + }, + { + "dataPath": "params_shard_21.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_66", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "fb9ce814bc270c29ae501070ea524a91" + }, + { + "dataPath": "params_shard_22.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_68", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "40b4b65a9de98901476f5bf673966919" + }, + { + "dataPath": "params_shard_23.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_63", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_64", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_65", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_67", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_69", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_70", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_71", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "4052237d6b8b4531d253a9f58c316af4" + }, + { + "dataPath": "params_shard_24.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_76", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "094e36c38eb538482be8e4c764445f57" + }, + { + "dataPath": "params_shard_25.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_78", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "a95eb560378a1772a56d78ca85c14c4a" + }, + { + "dataPath": "params_shard_26.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_72", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_73", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_74", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_75", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_77", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "8d70c88ce458a63693c7f3a965703108" + }, + { + "dataPath": "params_shard_27.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_86", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "2759512e4d0613cc47a283fe51f527ce" + }, + { + "dataPath": "params_shard_28.bin", + "format": "raw-shard", + "nbytes": 27279360, + "records": [ + { + "name": "param_79", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_80", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_81", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_82", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3686400 + }, + { + "name": "param_83", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 16269312 + }, + { + "name": "param_84", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 17842176 + }, + { + "name": "param_85", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 26230784 + } + ], + "md5sum": "148b0720015cd5ab50c36585473f2c05" + }, + { + "dataPath": "params_shard_29.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_88", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "5a622149cc008f9351a62916bf1dd289" + }, + { + "dataPath": "params_shard_30.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_87", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_89", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_90", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_91", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_92", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_93", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "5b882c04fcadc69b29643bdebc685f7d" + }, + { + "dataPath": "params_shard_31.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_96", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "b663f439b6ef98852cc3d564d41f6ba8" + }, + { + "dataPath": "params_shard_32.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_98", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "5cd007fa4bfe5f4d89740e4b93cdc2c2" + }, + { + "dataPath": "params_shard_33.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_94", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_95", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_97", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_99", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_100", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_101", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_102", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "adecca24262606b45a884516414cde2e" + }, + { + "dataPath": "params_shard_34.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_106", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "a4e5299cf23cc1cd54b21b81b65d061e" + }, + { + "dataPath": "params_shard_35.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_108", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "3cc54f6c59c608343e6570142951cd35" + }, + { + "dataPath": "params_shard_36.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_103", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_104", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_105", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_107", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_109", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_110", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_111", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "9e4de1056c50a94d16e50da1e5cbe93d" + }, + { + "dataPath": "params_shard_37.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_116", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "61bde840b4f09b2a7b2922a269abcced" + }, + { + "dataPath": "params_shard_38.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_118", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "a3fa0310a63bc22e5c7f383ee5e3ccce" + }, + { + "dataPath": "params_shard_39.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_112", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_113", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_114", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_115", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_117", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "87897611d687eb67b76a98551aa0953d" + }, + { + "dataPath": "params_shard_40.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_126", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "7fb7ca15dc3e38dbb2101aede90a7631" + }, + { + "dataPath": "params_shard_41.bin", + "format": "raw-shard", + "nbytes": 27279360, + "records": [ + { + "name": "param_119", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_120", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_121", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_122", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3686400 + }, + { + "name": "param_123", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 16269312 + }, + { + "name": "param_124", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 17842176 + }, + { + "name": "param_125", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 26230784 + } + ], + "md5sum": "7b23fda77ff197b3504c116cbc292a6b" + }, + { + "dataPath": "params_shard_42.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_128", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "7d7687340087c775bdd20ea0655a175e" + }, + { + "dataPath": "params_shard_43.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_127", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_129", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_130", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_131", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_132", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_133", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "1dba0980ab28c5c5b84fdc9471eb88c0" + }, + { + "dataPath": "params_shard_44.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_136", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "7a5dec5d6d01f0aa564dd1a8cca4fd5b" + }, + { + "dataPath": "params_shard_45.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_138", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "8530953ed3c4382426ce280c9c0b13fb" + }, + { + "dataPath": "params_shard_46.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_134", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_135", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_137", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_139", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_140", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_141", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_142", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "b6fa8ad9f876cabfb0260b3d656c4dff" + }, + { + "dataPath": "params_shard_47.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_146", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "5708875f36bafc8f8a9ceb97028536fa" + }, + { + "dataPath": "params_shard_48.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_148", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "58257a67a9c5e3ec993feeaefb4aa15b" + }, + { + "dataPath": "params_shard_49.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_143", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_144", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_145", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_147", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_149", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_150", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_151", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "e1c25011cde1d5b42c41eb69c6f02929" + }, + { + "dataPath": "params_shard_50.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_156", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "e7f0e515b5e7fb729c6ac968f67925bc" + }, + { + "dataPath": "params_shard_51.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_158", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "a3f8fb33768f60baa9b3538f38988801" + }, + { + "dataPath": "params_shard_52.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_152", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_153", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_154", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_155", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_157", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "34deacb7105d44bb4db5152d773a1778" + }, + { + "dataPath": "params_shard_53.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_166", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "5f0af83070c36fb565b6b7a109a6fed7" + }, + { + "dataPath": "params_shard_54.bin", + "format": "raw-shard", + "nbytes": 27279360, + "records": [ + { + "name": "param_159", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_160", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_161", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_162", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3686400 + }, + { + "name": "param_163", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 16269312 + }, + { + "name": "param_164", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 17842176 + }, + { + "name": "param_165", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 26230784 + } + ], + "md5sum": "fad1cfcf3bae22a7baa558bb5d870bdb" + }, + { + "dataPath": "params_shard_55.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_168", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "97bedfc8b7967195275942fa4cb9015b" + }, + { + "dataPath": "params_shard_56.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_167", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_169", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_170", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_171", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_172", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_173", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "8f79db5e6d8df284de7e8c9d93a002c4" + }, + { + "dataPath": "params_shard_57.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_176", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "d4ae67b906e7bc646830290f19bc3d11" + }, + { + "dataPath": "params_shard_58.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_178", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "3359112c2f91be7cf555218516ad48bc" + }, + { + "dataPath": "params_shard_59.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_174", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_175", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_177", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_179", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_180", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_181", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_182", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "bbe7975390a7dadb8d43bd301b8a8217" + }, + { + "dataPath": "params_shard_60.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_186", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "7520df3e10bb80b426ce4e6891b30414" + }, + { + "dataPath": "params_shard_61.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_188", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "5e6c80b9329e5afb9e721e6f5036f3e0" + }, + { + "dataPath": "params_shard_62.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_183", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_184", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_185", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_187", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_189", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_190", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_191", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "0fabc664cc1166daae3e2a43fc7b97d7" + }, + { + "dataPath": "params_shard_63.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_196", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "936494032516fe9bee746695f59dcc34" + }, + { + "dataPath": "params_shard_64.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_198", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "e65163e1d106f1100adfd0940d13a683" + }, + { + "dataPath": "params_shard_65.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_192", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_193", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_194", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_195", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_197", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "19451e8d54cb2ca12944b9f7f4d07f37" + }, + { + "dataPath": "params_shard_66.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_206", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "54dcece12c1826e2de4b6f8bdf8deec4" + }, + { + "dataPath": "params_shard_67.bin", + "format": "raw-shard", + "nbytes": 27279360, + "records": [ + { + "name": "param_199", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_200", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_201", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_202", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3686400 + }, + { + "name": "param_203", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 16269312 + }, + { + "name": "param_204", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 17842176 + }, + { + "name": "param_205", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 26230784 + } + ], + "md5sum": "67cb1870927aa1bb5700d11f9dde17d7" + }, + { + "dataPath": "params_shard_68.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_208", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "0cb66ce6a866f22e4d1de016503d2839" + }, + { + "dataPath": "params_shard_69.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_207", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_209", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_210", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_211", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_212", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_213", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "feca57ee646e76c824006a7babf9a2fa" + }, + { + "dataPath": "params_shard_70.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_216", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "d2e0b0256b53c5c69bf0db9ec24e0006" + }, + { + "dataPath": "params_shard_71.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_218", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "8491a1eb962ed93f5f7ebf6e8f379aaf" + }, + { + "dataPath": "params_shard_72.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_214", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_215", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_217", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_219", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_220", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_221", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_222", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "f18596b1e20e979b7c0e97261ea92005" + }, + { + "dataPath": "params_shard_73.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_226", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "fee2729a6f4221d4ec631324f67af7bb" + }, + { + "dataPath": "params_shard_74.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_228", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "775bb83c49fbe8af37142fac934bcfb0" + }, + { + "dataPath": "params_shard_75.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_223", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_224", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_225", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_227", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_229", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_230", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_231", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "4e2db4f23dc12607857bc806903890c6" + }, + { + "dataPath": "params_shard_76.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_236", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "560538c6a3b4a58adec4328fa630a59f" + }, + { + "dataPath": "params_shard_77.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_238", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "e8ce889174324e263b190269656ad186" + }, + { + "dataPath": "params_shard_78.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_232", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_233", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_234", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_235", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_237", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "6bbf6e1d1a13684c79e86058cd81e705" + }, + { + "dataPath": "params_shard_79.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_246", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "336f76e0078e087bfa3986f4d68a450a" + }, + { + "dataPath": "params_shard_80.bin", + "format": "raw-shard", + "nbytes": 27279360, + "records": [ + { + "name": "param_239", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_240", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_241", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_242", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3686400 + }, + { + "name": "param_243", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 16269312 + }, + { + "name": "param_244", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 17842176 + }, + { + "name": "param_245", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 26230784 + } + ], + "md5sum": "06d2ca33cb135c902d70e58445dd3105" + }, + { + "dataPath": "params_shard_81.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_248", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "02fd190c2708e174624956cf47906fdd" + }, + { + "dataPath": "params_shard_82.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_247", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_249", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_250", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_251", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_252", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_253", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "c291d4f8447b43714f489866bf028365" + }, + { + "dataPath": "params_shard_83.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_256", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "803fb5cb4606cc7596b9fa24dabbc6ea" + }, + { + "dataPath": "params_shard_84.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_258", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "20be2eb8ea53a7fbc3e5dcb92f72ff0b" + }, + { + "dataPath": "params_shard_85.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_254", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_255", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_257", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_259", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_260", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_261", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_262", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "d8f196260a3b8281dd5bb352896912b3" + }, + { + "dataPath": "params_shard_86.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_266", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "6910f775df5a7abef2858fd744d60fc4" + }, + { + "dataPath": "params_shard_87.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_268", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "0ea4e4176e883846a93f85957e928b3b" + }, + { + "dataPath": "params_shard_88.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_263", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_264", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_265", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_267", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_269", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_270", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_271", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "0a6fad40ecb25e06f23a1e7fbc14fe23" + }, + { + "dataPath": "params_shard_89.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_276", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "49ed553f4836d6570e9c219166e104f7" + }, + { + "dataPath": "params_shard_90.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_278", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "61c640f8e5c854575f8d065116603150" + }, + { + "dataPath": "params_shard_91.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_272", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_273", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_274", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_275", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_277", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "cd463253683d7536b0ade494342f73ba" + }, + { + "dataPath": "params_shard_92.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_286", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "8e3c881aa0d9530f58b31699466f12f9" + }, + { + "dataPath": "params_shard_93.bin", + "format": "raw-shard", + "nbytes": 27279360, + "records": [ + { + "name": "param_279", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_280", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_281", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_282", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3686400 + }, + { + "name": "param_283", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 16269312 + }, + { + "name": "param_284", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 17842176 + }, + { + "name": "param_285", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 26230784 + } + ], + "md5sum": "271f67fb2edff453e237cbe41fc2b12e" + }, + { + "dataPath": "params_shard_94.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_288", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "8776eea0f0afe5ad79762129c9b2b422" + }, + { + "dataPath": "params_shard_95.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_287", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_289", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_290", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_291", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_292", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_293", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "92953f132e54392c259df45de3e43dac" + }, + { + "dataPath": "params_shard_96.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_296", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "4dcd16f4b31ed6eeb907c628b26abd97" + }, + { + "dataPath": "params_shard_97.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_298", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "03825eead2c958cae247927551f952bf" + }, + { + "dataPath": "params_shard_98.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_294", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_295", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_297", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_299", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_300", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_301", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_302", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "5d8a3b3485885d2a1f1e6481ca27adcb" + }, + { + "dataPath": "params_shard_99.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_306", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "046b3f2a4c0e9b0d5a8b925aa4e496a4" + }, + { + "dataPath": "params_shard_100.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_308", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "f862f87c2f8a6c31e2e4a7542b18cc9b" + }, + { + "dataPath": "params_shard_101.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_303", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_304", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_305", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_307", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_309", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_310", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_311", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "dca32b3a5b70fca0462226b926d8d80b" + }, + { + "dataPath": "params_shard_102.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_316", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "e68339a5857c5b7ceb1ebef1ac4909ad" + }, + { + "dataPath": "params_shard_103.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_318", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "e6a7d4b33558414adfbec9afa29fd74e" + }, + { + "dataPath": "params_shard_104.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_312", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_313", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_314", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_315", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_317", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "e20b3eb4e15e42087e67e1d2d87472ba" + }, + { + "dataPath": "params_shard_105.bin", + "format": "raw-shard", + "nbytes": 65540096, + "records": [ + { + "name": "param_323", + "shape": [ + 32002, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 65540096, + "byteOffset": 0 + } + ], + "md5sum": "ae1eefc895d92cc5e72dcf32a494dcb1" + }, + { + "dataPath": "params_shard_106.bin", + "format": "raw-shard", + "nbytes": 12935680, + "records": [ + { + "name": "param_319", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_320", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_321", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_322", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3686400 + }, + { + "name": "param_324", + "shape": [ + 32002, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192512, + "byteOffset": 3694592 + }, + { + "name": "param_325", + "shape": [ + 2048, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 524288, + "byteOffset": 11887104 + }, + { + "name": "param_326", + "shape": [ + 2048, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 524288, + "byteOffset": 12411392 + } + ], + "md5sum": "c70632be0058e30292fa0f7f2e3b8a07" + } + ] +} \ No newline at end of file