diff --git a/mlc-chat-config.json b/mlc-chat-config.json new file mode 100644 index 0000000000000000000000000000000000000000..6af70a4ca7582a6598d95f2f705b513cca0db42a --- /dev/null +++ b/mlc-chat-config.json @@ -0,0 +1,22 @@ +{ + "model_lib": "SOLAR-10.7B-Instruct-v1.0-q4f16_1", + "local_id": "SOLAR-10.7B-Instruct-v1.0-q4f16_1", + "conv_template": "llama_default", + "temperature": 0.7, + "repetition_penalty": 1.0, + "top_p": 0.95, + "mean_gen_len": 128, + "max_gen_len": 4096, + "num_shards": 1, + "use_presharded_weights": false, + "shift_fill_factor": 0.3, + "tokenizer_files": [ + "tokenizer.json", + "tokenizer.model" + ], + "model_category": "llama", + "model_name": "SOLAR-10.7B-Instruct-v1.0", + "vocab_size": 32000, + "prefill_chunk_size": -1, + "max_window_size": 4096 +} \ No newline at end of file diff --git a/ndarray-cache.json b/ndarray-cache.json new file mode 100644 index 0000000000000000000000000000000000000000..f3ba1174576622a0217a40a005e9314185f00c38 --- /dev/null +++ b/ndarray-cache.json @@ -0,0 +1,6539 @@ +{ + "metadata": { + "ParamSize": 487 + }, + "records": [ + { + "dataPath": "params_shard_0.bin", + "format": "raw-shard", + "nbytes": 65536000, + "records": [ + { + "name": "param_0", + "shape": [ + 32000, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 65536000, + "byteOffset": 0 + } + ], + "md5sum": "938f4378ebd23ac35f8cc0f687da6104" + }, + { + "dataPath": "params_shard_1.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_6", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "01312e179fbb9199cb5ee56f475ba271" + }, + { + "dataPath": "params_shard_2.bin", + "format": "raw-shard", + "nbytes": 31784960, + "records": [ + { + "name": "param_1", + "shape": [ + 32000, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192000, + "byteOffset": 0 + }, + { + "name": "param_2", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 8192000 + }, + { + "name": "param_3", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 20774912 + }, + { + "name": "param_4", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 22347776 + }, + { + "name": "param_5", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 30736384 + } + ], + "md5sum": "d3eda9a4cad70dadda8214a3caeaa1ab" + }, + { + "dataPath": "params_shard_3.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_8", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "7045a0461a12d13d5a4398c97849d617" + }, + { + "dataPath": "params_shard_4.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_7", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_9", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_10", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_11", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_12", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_13", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "26ca1c0995190e5acb6dd6b2009cdc66" + }, + { + "dataPath": "params_shard_5.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_16", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "5efd9651e33c8aab5384e52b5d367ff8" + }, + { + "dataPath": "params_shard_6.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_18", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "294ca7574dc91748eb571c48fa9c4c20" + }, + { + "dataPath": "params_shard_7.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_14", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_15", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_17", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_19", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_20", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_21", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_22", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "2db206e74e2af7482fcc684bb395498b" + }, + { + "dataPath": "params_shard_8.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_26", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "41fb027e9d334e0e6396fc8483468e16" + }, + { + "dataPath": "params_shard_9.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_28", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "07b08673fed56394497c081ee705eb94" + }, + { + "dataPath": "params_shard_10.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_23", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_24", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_25", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_27", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_29", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_30", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_31", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "6001e192f8a8b042b0de66ff6809d969" + }, + { + "dataPath": "params_shard_11.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_36", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "7a27ecffcc5ece9a816b98b389c96674" + }, + { + "dataPath": "params_shard_12.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_38", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "63de686a9f097b8e0491ca196871a1f7" + }, + { + "dataPath": "params_shard_13.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_32", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_33", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_34", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_35", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_37", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "baf54489afd2f9b8c4c7abf16d11c96d" + }, + { + "dataPath": "params_shard_14.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_46", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "9a399d1c4d6e42af48598e71dc3c8b55" + }, + { + "dataPath": "params_shard_15.bin", + "format": "raw-shard", + "nbytes": 27279360, + "records": [ + { + "name": "param_39", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_40", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_41", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_42", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3686400 + }, + { + "name": "param_43", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 16269312 + }, + { + "name": "param_44", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 17842176 + }, + { + "name": "param_45", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 26230784 + } + ], + "md5sum": "edc06e26931a23183c7bf47f9fd94137" + }, + { + "dataPath": "params_shard_16.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_48", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "3d140be0ca4bf3635d21b6c8971227f5" + }, + { + "dataPath": "params_shard_17.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_47", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_49", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_50", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_51", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_52", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_53", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "90469ba6b013f3b309787d6f67e8662f" + }, + { + "dataPath": "params_shard_18.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_56", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "39a6437fe795f3e84d849660dbc88ec1" + }, + { + "dataPath": "params_shard_19.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_58", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "f535493354569dc3a074c514473c2c2f" + }, + { + "dataPath": "params_shard_20.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_54", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_55", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_57", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_59", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_60", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_61", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_62", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "b5d3d22c989e8806a9b9fcbd37021d25" + }, + { + "dataPath": "params_shard_21.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_66", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "90b7628f0f01ae98663b575477bf96b6" + }, + { + "dataPath": "params_shard_22.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_68", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "4974ad9536ee570b811d4ef13140e5d6" + }, + { + "dataPath": "params_shard_23.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_63", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_64", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_65", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_67", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_69", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_70", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_71", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "07b39dd0f0deb4f6f88705b05e291805" + }, + { + "dataPath": "params_shard_24.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_76", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "9f06d2a89423ab9e614679798eafcb2a" + }, + { + "dataPath": "params_shard_25.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_78", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "280eccfb8b0fbbfc9184d604fda7fa0a" + }, + { + "dataPath": "params_shard_26.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_72", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_73", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_74", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_75", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_77", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "7c3c588acdf9412240114a1fc4762fa8" + }, + { + "dataPath": "params_shard_27.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_86", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "948435c0378cc278617ab85773ac08b3" + }, + { + "dataPath": "params_shard_28.bin", + "format": "raw-shard", + "nbytes": 27279360, + "records": [ + { + "name": "param_79", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_80", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_81", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_82", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3686400 + }, + { + "name": "param_83", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 16269312 + }, + { + "name": "param_84", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 17842176 + }, + { + "name": "param_85", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 26230784 + } + ], + "md5sum": "70e8651085a5efdef27ec9503ca079d4" + }, + { + "dataPath": "params_shard_29.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_88", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "dfb7a5029eb9c83676d284f46fbbe06c" + }, + { + "dataPath": "params_shard_30.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_87", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_89", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_90", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_91", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_92", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_93", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "22d6d6e847218fdd3c546dbf7307fe26" + }, + { + "dataPath": "params_shard_31.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_96", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "6d251e56b1943cb0e4e7ef1a1791a1b7" + }, + { + "dataPath": "params_shard_32.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_98", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "04be030b1359b2c8108940ea1fe76043" + }, + { + "dataPath": "params_shard_33.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_94", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_95", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_97", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_99", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_100", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_101", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_102", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "f1b1e8c268415196e92949147a9d1618" + }, + { + "dataPath": "params_shard_34.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_106", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "eb88df0eea8a14c4bcc89554be2cebd3" + }, + { + "dataPath": "params_shard_35.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_108", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "dcfe96de25853178ce0199ab39e45253" + }, + { + "dataPath": "params_shard_36.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_103", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_104", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_105", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_107", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_109", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_110", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_111", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "7dfb8eeac1bc463a0ee184d4be2bf041" + }, + { + "dataPath": "params_shard_37.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_116", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "39197811b17f2006ec1cc00924aaaca0" + }, + { + "dataPath": "params_shard_38.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_118", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "6547e83901f045868c5cdb79c6a24fa4" + }, + { + "dataPath": "params_shard_39.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_112", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_113", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_114", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_115", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_117", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "9597a62b88692f969709c838131f3c6b" + }, + { + "dataPath": "params_shard_40.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_126", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "fb2948b4b2d42039739c063e843fbfc9" + }, + { + "dataPath": "params_shard_41.bin", + "format": "raw-shard", + "nbytes": 27279360, + "records": [ + { + "name": "param_119", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_120", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_121", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_122", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3686400 + }, + { + "name": "param_123", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 16269312 + }, + { + "name": "param_124", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 17842176 + }, + { + "name": "param_125", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 26230784 + } + ], + "md5sum": "c8646c9edec45e04753743076c8ee446" + }, + { + "dataPath": "params_shard_42.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_128", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "d271cf618b7f131d0ed01ff5b24519dc" + }, + { + "dataPath": "params_shard_43.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_127", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_129", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_130", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_131", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_132", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_133", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "28bf8de1aa94bcf5f173791ff2d8ac1a" + }, + { + "dataPath": "params_shard_44.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_136", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "e9e70235b5f9980946ba2293e20bcaad" + }, + { + "dataPath": "params_shard_45.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_138", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "32bfd23c26154035fb4661b79801b12b" + }, + { + "dataPath": "params_shard_46.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_134", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_135", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_137", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_139", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_140", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_141", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_142", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "916fdbdd3119938d5cd5fc18f68a0edb" + }, + { + "dataPath": "params_shard_47.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_146", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "da1a635bbf735dd480cc9d608589c768" + }, + { + "dataPath": "params_shard_48.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_148", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "42c52ffc7ed735860986e2b3ecaab9cd" + }, + { + "dataPath": "params_shard_49.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_143", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_144", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_145", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_147", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_149", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_150", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_151", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "b67aa86e63c0223516f8f2cf74e17397" + }, + { + "dataPath": "params_shard_50.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_156", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "7b9eeba472b9eb27620767640ebeafc0" + }, + { + "dataPath": "params_shard_51.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_158", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "4675a3313d2dc686fd367f469b8f9822" + }, + { + "dataPath": "params_shard_52.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_152", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_153", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_154", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_155", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_157", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "84e316d8ed25ea45493e4c54b052c3b0" + }, + { + "dataPath": "params_shard_53.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_166", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "8751ae46aacc6e0e9909a06b0e5edbfa" + }, + { + "dataPath": "params_shard_54.bin", + "format": "raw-shard", + "nbytes": 27279360, + "records": [ + { + "name": "param_159", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_160", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_161", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_162", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3686400 + }, + { + "name": "param_163", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 16269312 + }, + { + "name": "param_164", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 17842176 + }, + { + "name": "param_165", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 26230784 + } + ], + "md5sum": "f990636ec0bbe80ae4bf40d711d0db32" + }, + { + "dataPath": "params_shard_55.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_168", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "f5ea4f216f6dbc5c0c04600f4e07ea7f" + }, + { + "dataPath": "params_shard_56.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_167", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_169", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_170", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_171", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_172", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_173", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "cd050be4afd23eb71712c01c756b15e4" + }, + { + "dataPath": "params_shard_57.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_176", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "1b75cd9aff6131a508247eda6793c5fc" + }, + { + "dataPath": "params_shard_58.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_178", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "d0266177305aaa582fe9ac125e2ebffb" + }, + { + "dataPath": "params_shard_59.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_174", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_175", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_177", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_179", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_180", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_181", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_182", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "c2a65dc134c5b4336285cbe89e8f56df" + }, + { + "dataPath": "params_shard_60.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_186", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "cbc61fd129ac538f4b9da858a5d124a3" + }, + { + "dataPath": "params_shard_61.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_188", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "a2ca62dd158fbac49cce218cfa1efbe3" + }, + { + "dataPath": "params_shard_62.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_183", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_184", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_185", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_187", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_189", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_190", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_191", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "eb1f26d2e73adb772fdb693a77e4369e" + }, + { + "dataPath": "params_shard_63.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_196", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "1cd5cc8112643fcab37c25e19ab92cbe" + }, + { + "dataPath": "params_shard_64.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_198", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "0109fe146033ea558e4757bf87a6f25b" + }, + { + "dataPath": "params_shard_65.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_192", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_193", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_194", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_195", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_197", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "3e0e4c020dd4b85e4274823ae0deef80" + }, + { + "dataPath": "params_shard_66.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_206", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "e1d31e63ad062f33a412297d15cb4cbf" + }, + { + "dataPath": "params_shard_67.bin", + "format": "raw-shard", + "nbytes": 27279360, + "records": [ + { + "name": "param_199", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_200", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_201", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_202", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3686400 + }, + { + "name": "param_203", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 16269312 + }, + { + "name": "param_204", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 17842176 + }, + { + "name": "param_205", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 26230784 + } + ], + "md5sum": "425144cab1d0275428383960e8342b09" + }, + { + "dataPath": "params_shard_68.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_208", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "6de5935a9f5339143627bd8b6cfe697f" + }, + { + "dataPath": "params_shard_69.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_207", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_209", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_210", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_211", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_212", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_213", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "9a83474bd80337428ef29d6b32c30abf" + }, + { + "dataPath": "params_shard_70.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_216", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "994dd0d86913e7a07d8861fd939739ea" + }, + { + "dataPath": "params_shard_71.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_218", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "629d668977e2821cb206b48591f83b03" + }, + { + "dataPath": "params_shard_72.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_214", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_215", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_217", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_219", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_220", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_221", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_222", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "75773b0dd6648dcffdb83a839fa0a20e" + }, + { + "dataPath": "params_shard_73.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_226", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "1b2f471cbf7240f8c15a314a182694fb" + }, + { + "dataPath": "params_shard_74.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_228", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "80817f8029a48ece1e9745a2add1d290" + }, + { + "dataPath": "params_shard_75.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_223", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_224", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_225", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_227", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_229", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_230", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_231", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "5308de88e0ebdd87514f013eeadcb164" + }, + { + "dataPath": "params_shard_76.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_236", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "2146fe524afd8064f0c4d02aa1c96cb5" + }, + { + "dataPath": "params_shard_77.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_238", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "f8363a7b8e11b1b141046e342c58e8a5" + }, + { + "dataPath": "params_shard_78.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_232", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_233", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_234", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_235", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_237", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "868c7293895b9b5ef0dd725cad995824" + }, + { + "dataPath": "params_shard_79.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_246", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "992f197c5a82a9bb6a655bfdc167ff5f" + }, + { + "dataPath": "params_shard_80.bin", + "format": "raw-shard", + "nbytes": 27279360, + "records": [ + { + "name": "param_239", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_240", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_241", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_242", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3686400 + }, + { + "name": "param_243", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 16269312 + }, + { + "name": "param_244", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 17842176 + }, + { + "name": "param_245", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 26230784 + } + ], + "md5sum": "fc379773bdff162abd59721c9e865fcc" + }, + { + "dataPath": "params_shard_81.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_248", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "a6c1c7749bd20b56a63091c9e0078350" + }, + { + "dataPath": "params_shard_82.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_247", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_249", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_250", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_251", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_252", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_253", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "0da1249d6200f994d2ec5b31b44b2579" + }, + { + "dataPath": "params_shard_83.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_256", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "18988c044bf216d4e5cb6162e47d4d8b" + }, + { + "dataPath": "params_shard_84.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_258", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "699842304638e22bba9c7b37e2bb6101" + }, + { + "dataPath": "params_shard_85.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_254", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_255", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_257", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_259", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_260", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_261", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_262", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "f8989f811c21548026b169a545904015" + }, + { + "dataPath": "params_shard_86.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_266", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "e4665e136d25fc7de491e803c5bff9ea" + }, + { + "dataPath": "params_shard_87.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_268", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "51cb77252e7913210e30bb67d9ebea3a" + }, + { + "dataPath": "params_shard_88.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_263", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_264", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_265", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_267", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_269", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_270", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_271", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "6e1d1e77b2e8a246b5659807ddfae3ba" + }, + { + "dataPath": "params_shard_89.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_276", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "f37d6995ea9ca9444c6e69bbc8001dc0" + }, + { + "dataPath": "params_shard_90.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_278", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "40788b0c43d74270ea0ba68ac8363550" + }, + { + "dataPath": "params_shard_91.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_272", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_273", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_274", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_275", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_277", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "ea323f8fb26460b46d7fd808cb0f0092" + }, + { + "dataPath": "params_shard_92.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_286", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "1fd86ac22140255e9c40b4ea1b421827" + }, + { + "dataPath": "params_shard_93.bin", + "format": "raw-shard", + "nbytes": 27279360, + "records": [ + { + "name": "param_279", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_280", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_281", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_282", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3686400 + }, + { + "name": "param_283", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 16269312 + }, + { + "name": "param_284", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 17842176 + }, + { + "name": "param_285", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 26230784 + } + ], + "md5sum": "d311dfae73c84c7111da3d28c824cc4d" + }, + { + "dataPath": "params_shard_94.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_288", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "e56ae4570a547f60ae0ffff769efb3e1" + }, + { + "dataPath": "params_shard_95.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_287", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_289", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_290", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_291", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_292", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_293", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "8649f16ff113c92b6d323a416e04465e" + }, + { + "dataPath": "params_shard_96.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_296", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "ec5693b9808470488ed7dd0eba8ec65b" + }, + { + "dataPath": "params_shard_97.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_298", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "6706b59fd62e2a04f40ba0dc3e2712b3" + }, + { + "dataPath": "params_shard_98.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_294", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_295", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_297", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_299", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_300", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_301", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_302", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "769aaeca11caab032f7c8a5bb57e6f0e" + }, + { + "dataPath": "params_shard_99.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_306", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "c1066062abdbbd26a9ad327e6e7ab2c3" + }, + { + "dataPath": "params_shard_100.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_308", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "8f4d36ae59affff8029fe98cb33119f9" + }, + { + "dataPath": "params_shard_101.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_303", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_304", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_305", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_307", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_309", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_310", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_311", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "6e3d7dd70df0c9229616d98a2a00237b" + }, + { + "dataPath": "params_shard_102.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_316", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "2fa7c5bd24f478c7c3ad432e36f6fcd1" + }, + { + "dataPath": "params_shard_103.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_318", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "a713b72d1ee6c495c9c5019942912742" + }, + { + "dataPath": "params_shard_104.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_312", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_313", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_314", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_315", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_317", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "2b41548a3453d0436c9a2c55ef633935" + }, + { + "dataPath": "params_shard_105.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_326", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "7df64f369005bfac7875e8de87a231fc" + }, + { + "dataPath": "params_shard_106.bin", + "format": "raw-shard", + "nbytes": 27279360, + "records": [ + { + "name": "param_319", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_320", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_321", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_322", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3686400 + }, + { + "name": "param_323", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 16269312 + }, + { + "name": "param_324", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 17842176 + }, + { + "name": "param_325", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 26230784 + } + ], + "md5sum": "92b04f0d3d53a5abab047665e6df6e2a" + }, + { + "dataPath": "params_shard_107.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_328", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "d72a7f78763de00c32a57531a8cb10ab" + }, + { + "dataPath": "params_shard_108.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_327", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_329", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_330", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_331", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_332", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_333", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "e8d6037e3cbabdf4c3550fa1c1653d6c" + }, + { + "dataPath": "params_shard_109.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_336", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "3b5ed9091d16eeb316d63e9b14521934" + }, + { + "dataPath": "params_shard_110.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_338", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "965d224410e5dde1d6a8a6b4632cdb87" + }, + { + "dataPath": "params_shard_111.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_334", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_335", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_337", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_339", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_340", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_341", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_342", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "fa3b7be03e2dfc92224ba8c8045a0814" + }, + { + "dataPath": "params_shard_112.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_346", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "df3fcfc12b8942c6491edfd2dc117e68" + }, + { + "dataPath": "params_shard_113.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_348", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "478bd416228d5fcd5e61ae5ff56c0826" + }, + { + "dataPath": "params_shard_114.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_343", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_344", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_345", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_347", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_349", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_350", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_351", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "9171ff8178b4805825d7f418bd624007" + }, + { + "dataPath": "params_shard_115.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_356", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "ec27bd0992d1c96f5507f72062aefd7a" + }, + { + "dataPath": "params_shard_116.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_358", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "073ee51bab6863d3f6ecd5e81d275764" + }, + { + "dataPath": "params_shard_117.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_352", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_353", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_354", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_355", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_357", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "8b033cd809b25aa1b517839eb602c942" + }, + { + "dataPath": "params_shard_118.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_366", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "240d7159b453bbf463bfb0690af6027f" + }, + { + "dataPath": "params_shard_119.bin", + "format": "raw-shard", + "nbytes": 27279360, + "records": [ + { + "name": "param_359", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_360", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_361", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_362", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3686400 + }, + { + "name": "param_363", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 16269312 + }, + { + "name": "param_364", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 17842176 + }, + { + "name": "param_365", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 26230784 + } + ], + "md5sum": "35f2c59986e2e7d446848785bc4cb5eb" + }, + { + "dataPath": "params_shard_120.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_368", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "431b77b5a4c49d50d319515ca34ba6d3" + }, + { + "dataPath": "params_shard_121.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_367", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_369", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_370", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_371", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_372", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_373", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "eaeaf8ce164b3421651074c3891f799e" + }, + { + "dataPath": "params_shard_122.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_376", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "c23ec5d3dd754ab38d5f5c4fb6c81765" + }, + { + "dataPath": "params_shard_123.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_378", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "324ee9c85465f35658f249cefa232b15" + }, + { + "dataPath": "params_shard_124.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_374", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_375", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_377", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_379", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_380", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_381", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_382", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "8d13c23d27690ceef47cc7eeb9a74539" + }, + { + "dataPath": "params_shard_125.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_386", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "043b342842744b29ecb78713f82eae9d" + }, + { + "dataPath": "params_shard_126.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_388", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "df3b76b992b67c5cc6832cb9cc8ed204" + }, + { + "dataPath": "params_shard_127.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_383", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_384", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_385", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_387", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_389", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_390", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_391", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "dece9e3455ac475edc03c471f3be24ef" + }, + { + "dataPath": "params_shard_128.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_396", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "c5ee04a8105c9302fdbf8f71683b1c66" + }, + { + "dataPath": "params_shard_129.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_398", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "9c7248cdc5a26999e3f5765967596024" + }, + { + "dataPath": "params_shard_130.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_392", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_393", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_394", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_395", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_397", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "a66a43b6b38f6274dbea808b459e83d5" + }, + { + "dataPath": "params_shard_131.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_406", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "55fc8eefc0fa8a14c46865a498ecdf42" + }, + { + "dataPath": "params_shard_132.bin", + "format": "raw-shard", + "nbytes": 27279360, + "records": [ + { + "name": "param_399", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_400", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_401", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_402", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3686400 + }, + { + "name": "param_403", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 16269312 + }, + { + "name": "param_404", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 17842176 + }, + { + "name": "param_405", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 26230784 + } + ], + "md5sum": "13c857577c679c33439f453b44bb0f69" + }, + { + "dataPath": "params_shard_133.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_408", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "9ae601a69c5f8be6bff42dd40df00d40" + }, + { + "dataPath": "params_shard_134.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_407", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_409", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_410", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_411", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_412", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_413", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "ce2bc4e0695a4b1bb2fdfb0dd341040a" + }, + { + "dataPath": "params_shard_135.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_416", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "e704f1525599a8c7b10a90efd659c90c" + }, + { + "dataPath": "params_shard_136.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_418", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "9ab0bc6e5519bb7006c6736d611e1ed4" + }, + { + "dataPath": "params_shard_137.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_414", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_415", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_417", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_419", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_420", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_421", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_422", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "df2daca16475e1ad320eb7c9e4f486b4" + }, + { + "dataPath": "params_shard_138.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_426", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "9670d462edf97d34f91249203e7068e7" + }, + { + "dataPath": "params_shard_139.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_428", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "be3f985f205cc04336354ef3ca9a0a59" + }, + { + "dataPath": "params_shard_140.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_423", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_424", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_425", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_427", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_429", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_430", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_431", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "00a603fd2fa0319933ee3ea249579ef2" + }, + { + "dataPath": "params_shard_141.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_436", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "86bfe5497f17b33e4cb1c343ed4e03f6" + }, + { + "dataPath": "params_shard_142.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_438", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "ca1f67f11a19c231014dcdf1e065d35e" + }, + { + "dataPath": "params_shard_143.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_432", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_433", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_434", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_435", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_437", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "cab4f0afa210e82840f6204cee299912" + }, + { + "dataPath": "params_shard_144.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_446", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "01297c0f241c3de0f009f302368db897" + }, + { + "dataPath": "params_shard_145.bin", + "format": "raw-shard", + "nbytes": 27279360, + "records": [ + { + "name": "param_439", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_440", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_441", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_442", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3686400 + }, + { + "name": "param_443", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 16269312 + }, + { + "name": "param_444", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 17842176 + }, + { + "name": "param_445", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 26230784 + } + ], + "md5sum": "e40127726e75be550a88b90d92f70a23" + }, + { + "dataPath": "params_shard_146.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_448", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "4eba8642fd3b615a6c572c51af0164a9" + }, + { + "dataPath": "params_shard_147.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_447", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_449", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_450", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_451", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_452", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_453", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "7a1722e61a8863bf8616f7cd639fd4b3" + }, + { + "dataPath": "params_shard_148.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_456", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "9cd3f408558e42134009e6df6a17507b" + }, + { + "dataPath": "params_shard_149.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_458", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "80e7e891cdd67197b7f32d966d85a77a" + }, + { + "dataPath": "params_shard_150.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_454", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_455", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_457", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_459", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_460", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_461", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_462", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "18f45d3446a5c720c5802771d810eb51" + }, + { + "dataPath": "params_shard_151.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_466", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "68565e805825d245210166fa46bf9832" + }, + { + "dataPath": "params_shard_152.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_468", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "3d50f8df560b1e49a270b6e05bf0e3d5" + }, + { + "dataPath": "params_shard_153.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_463", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_464", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_465", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_467", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_469", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_470", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_471", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "d5ed6de1eaf3c5fc8241dcc31b1d9b24" + }, + { + "dataPath": "params_shard_154.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_476", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "f32b479635bb045dc9cf6b290376f485" + }, + { + "dataPath": "params_shard_155.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_478", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "28c2ae03577e284e92e97aa65818402b" + }, + { + "dataPath": "params_shard_156.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_472", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_473", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_474", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_475", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_477", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "be926de1743f90d8b55b7beb760cce1e" + }, + { + "dataPath": "params_shard_157.bin", + "format": "raw-shard", + "nbytes": 65536000, + "records": [ + { + "name": "param_483", + "shape": [ + 32000, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 65536000, + "byteOffset": 0 + } + ], + "md5sum": "3f2e13a0dfec472408edc2ebc696f84d" + }, + { + "dataPath": "params_shard_158.bin", + "format": "raw-shard", + "nbytes": 12935168, + "records": [ + { + "name": "param_479", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_480", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_481", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_482", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3686400 + }, + { + "name": "param_484", + "shape": [ + 32000, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192000, + "byteOffset": 3694592 + }, + { + "name": "param_485", + "shape": [ + 2048, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 524288, + "byteOffset": 11886592 + }, + { + "name": "param_486", + "shape": [ + 2048, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 524288, + "byteOffset": 12410880 + } + ], + "md5sum": "48e8aa65f05fba337318ffb71eae4214" + } + ] +} \ No newline at end of file diff --git a/params_shard_0.bin b/params_shard_0.bin new file mode 100644 index 0000000000000000000000000000000000000000..da2f8a02bcd8458eff255c82aa6473e8f9d156ef --- /dev/null +++ b/params_shard_0.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31a83663d1a2fabef35cfd0e563b2b9d3d9d47b514c085da9f680a81bb35bd60 +size 65536000 diff --git a/params_shard_1.bin b/params_shard_1.bin new file mode 100644 index 0000000000000000000000000000000000000000..0f0db7f28c817b52119f3667a754b239b9d36e1f --- /dev/null +++ b/params_shard_1.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bb9be68f13444bd5e69c8e13cbbcd56e023b756fc49092788d5f0a95e053650 +size 58720256 diff --git a/params_shard_10.bin b/params_shard_10.bin new file mode 100644 index 0000000000000000000000000000000000000000..a50b7d23a20375e068d5bbf60598740fbe301133 --- /dev/null +++ b/params_shard_10.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6f8183d2c9796bb2874ba114ec6e1e18e6ce4c39e5aacdc6ae17865b42f5512 +size 22036480 diff --git a/params_shard_11.bin b/params_shard_11.bin new file mode 100644 index 0000000000000000000000000000000000000000..f002ab37315a99c2e74f53d7fdd47e3abe2d8af1 --- /dev/null +++ b/params_shard_11.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:913b89bacf1dc87aa542f30b7a93d6d6a3c8d40c2e11e80a514f63e1dc773d64 +size 58720256 diff --git a/params_shard_12.bin b/params_shard_12.bin new file mode 100644 index 0000000000000000000000000000000000000000..e3f3a78f744e13c442706f589c3d337a226b8c9c --- /dev/null +++ b/params_shard_12.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95abb140f603aafa30592288dc07b45bb07a070e88f75ef930547b7f1d96b573 +size 29360128 diff --git a/params_shard_13.bin b/params_shard_13.bin new file mode 100644 index 0000000000000000000000000000000000000000..92ac99b37a10006f6671f2c3dac5184c19af2974 --- /dev/null +++ b/params_shard_13.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80208a58fd57ac0a824b0c90837ac716c1aecdc2bbc7127a227325f214f5b7ac +size 30932992 diff --git a/params_shard_14.bin b/params_shard_14.bin new file mode 100644 index 0000000000000000000000000000000000000000..c91d37f79f77b7ce43843b0ccfc11ed8e5ebd3d5 --- /dev/null +++ b/params_shard_14.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4564d25bd71062be8b4e20d4718219c89afaf1068378598fba50b70e3e75c751 +size 58720256 diff --git a/params_shard_15.bin b/params_shard_15.bin new file mode 100644 index 0000000000000000000000000000000000000000..e69b656ec13c681001e96bb705527f1d8c291ba1 --- /dev/null +++ b/params_shard_15.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4673b9ef974c999e43d31d91b77f6b511ab371fadb535f2ca1904cc1f05832e +size 27279360 diff --git a/params_shard_16.bin b/params_shard_16.bin new file mode 100644 index 0000000000000000000000000000000000000000..f7646d2f281da399f92abb7307cf9c2bd2b7687e --- /dev/null +++ b/params_shard_16.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:930028d9219c6a09bc207729b095bebd59a99d0520c56e7435376e778da16a55 +size 29360128 diff --git a/params_shard_17.bin b/params_shard_17.bin new file mode 100644 index 0000000000000000000000000000000000000000..3e33130a1ae82da2036f48686246974427b3b033 --- /dev/null +++ b/params_shard_17.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f20075ccdb4291ea3fe4d19cf3ef967b4b86aeb35907441c1687c0d5adbb899c +size 25182208 diff --git a/params_shard_18.bin b/params_shard_18.bin new file mode 100644 index 0000000000000000000000000000000000000000..0e066a8026e296c7c64ca1ab728e656954c81f2f --- /dev/null +++ b/params_shard_18.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6164f0426de91065fdff37392845c5087bf80bc6a8927cdde32cfa5238686776 +size 58720256 diff --git a/params_shard_19.bin b/params_shard_19.bin new file mode 100644 index 0000000000000000000000000000000000000000..3ee5114e8e30ad9a94e06e16bc3dbbe91fb4523e --- /dev/null +++ b/params_shard_19.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27ddbd35a99c5cfd1c937f0014aca208074a220f77f1fdc0eec68a0073216047 +size 29360128 diff --git a/params_shard_2.bin b/params_shard_2.bin new file mode 100644 index 0000000000000000000000000000000000000000..a3bb83875b5c521f3cba5deccd1a96270bf24850 --- /dev/null +++ b/params_shard_2.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3184ebbf7b9c135c822106307572315d8a3bdf4b8787dc9a97975394f7acab30 +size 31784960 diff --git a/params_shard_20.bin b/params_shard_20.bin new file mode 100644 index 0000000000000000000000000000000000000000..576f284a5c3e94bc62a51a7151eee565d448a144 --- /dev/null +++ b/params_shard_20.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f45a47ec6fbec0eb883518f340be9bb1f4f4f3e6eb13425a3d9d554e2d167ff3 +size 33046528 diff --git a/params_shard_21.bin b/params_shard_21.bin new file mode 100644 index 0000000000000000000000000000000000000000..e421e9f3464623daf0dc93b0eb98c69de4a1efba --- /dev/null +++ b/params_shard_21.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a29b2e4898aafac119408d14a3b76d9f00b0357c8a8aca482a90a66710f136d0 +size 58720256 diff --git a/params_shard_22.bin b/params_shard_22.bin new file mode 100644 index 0000000000000000000000000000000000000000..4a6d01d9ae923f57e2cf328841997fadc5cf4367 --- /dev/null +++ b/params_shard_22.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a330be5fbe77ba6751bdc53d70cb28c079cf9b22a82b5f7f142979551731adca +size 29360128 diff --git a/params_shard_23.bin b/params_shard_23.bin new file mode 100644 index 0000000000000000000000000000000000000000..23a1796ca3bf6307b8fb6a57fced09cc1b17de64 --- /dev/null +++ b/params_shard_23.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:771bebb1b9dcf4491db49420a9cc5cb0952c5edfb6ee5341f6ed9843fbf88a23 +size 22036480 diff --git a/params_shard_24.bin b/params_shard_24.bin new file mode 100644 index 0000000000000000000000000000000000000000..c475db72eba17827e252c5a3cb4a535008b65ba1 --- /dev/null +++ b/params_shard_24.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dce9a3f2f16f2565f59fc621fe9a1db1c0793aa85816e0f5d675af0ff53109e5 +size 58720256 diff --git a/params_shard_25.bin b/params_shard_25.bin new file mode 100644 index 0000000000000000000000000000000000000000..c24300ceb6b4ce69b1a9cf6591e2072b2c768620 --- /dev/null +++ b/params_shard_25.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:938cd665c8e184ae553d88795de968cf736c9b73e34c1bef60d280139995e39e +size 29360128 diff --git a/params_shard_26.bin b/params_shard_26.bin new file mode 100644 index 0000000000000000000000000000000000000000..b4aa178e27c004e62d67a02759da9c50112022b5 --- /dev/null +++ b/params_shard_26.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4b77b1076fa63201380d18323795aab7dc3d8931fffe8fbb4ff40104300fcdf +size 30932992 diff --git a/params_shard_27.bin b/params_shard_27.bin new file mode 100644 index 0000000000000000000000000000000000000000..c264499d2d2a17b828b03b2b534deaa1ce85b8b2 --- /dev/null +++ b/params_shard_27.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:796612f912c320bbb0d950cc336277393da6bb7e190d642071d03d0bfd1b8c1d +size 58720256 diff --git a/params_shard_28.bin b/params_shard_28.bin new file mode 100644 index 0000000000000000000000000000000000000000..3bd68275cb84a6c60254f418484782b85b089b2d --- /dev/null +++ b/params_shard_28.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a41a7ad8a8c2f70f7ae4f8161d8146c5e1401d180fe31716d1d6e7d7bf31c8e +size 27279360 diff --git a/params_shard_29.bin b/params_shard_29.bin new file mode 100644 index 0000000000000000000000000000000000000000..8d93bebf9acaa495866ec29a4eefe6992d470b59 --- /dev/null +++ b/params_shard_29.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63e543bfc02236a21aec4abd11abfc0277094671185177007036e1bee90847ee +size 29360128 diff --git a/params_shard_3.bin b/params_shard_3.bin new file mode 100644 index 0000000000000000000000000000000000000000..198652851acbbc89ee1a46be9d7b32b193b23d01 --- /dev/null +++ b/params_shard_3.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a58f415e3405213975be6461c138d0985288bfd727dc680385da1715909b7764 +size 29360128 diff --git a/params_shard_30.bin b/params_shard_30.bin new file mode 100644 index 0000000000000000000000000000000000000000..e3fa6de128fcf45b7e624e8d6a6b15088f1b5637 --- /dev/null +++ b/params_shard_30.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7af9ed8a710349194c24d32b176dbc0ceebc04e9ed4b5ab08246475c4a92e1c4 +size 25182208 diff --git a/params_shard_31.bin b/params_shard_31.bin new file mode 100644 index 0000000000000000000000000000000000000000..b1dcdb550afa5c9dfee8c4e7812b06fb30b25248 --- /dev/null +++ b/params_shard_31.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36d15389886873e58ae552817e074ea2104d79ceacaebc294452cee2af884f01 +size 58720256 diff --git a/params_shard_32.bin b/params_shard_32.bin new file mode 100644 index 0000000000000000000000000000000000000000..18db17f91f674d9cb16660743c29b65008defcf4 --- /dev/null +++ b/params_shard_32.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cadcb580078a5b232b276c1110c2d902e60e446e5d2dd50d31c1157a8024a0e +size 29360128 diff --git a/params_shard_33.bin b/params_shard_33.bin new file mode 100644 index 0000000000000000000000000000000000000000..1efcea7ae9c1b103e8ce35b1ffd0b673648ac61d --- /dev/null +++ b/params_shard_33.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c24c5543d95139ca3e0b8276d55a1693dd58cfb376e6ac164df0cd440ce388e4 +size 33046528 diff --git a/params_shard_34.bin b/params_shard_34.bin new file mode 100644 index 0000000000000000000000000000000000000000..53166bbf32a6654f4ffe13d302dae48476d786e0 --- /dev/null +++ b/params_shard_34.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f542cbca557c5e5eff64c6a45934169bd3de428ffe09f10bcd4d638fef41966d +size 58720256 diff --git a/params_shard_35.bin b/params_shard_35.bin new file mode 100644 index 0000000000000000000000000000000000000000..de571ea32ec2940f7f91aa0cb81b7e2f30f6fc3c --- /dev/null +++ b/params_shard_35.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4794272d49984aef9a5d0712f3038195fe56ae492c0815d22bdf6d5ab11f7c56 +size 29360128 diff --git a/params_shard_36.bin b/params_shard_36.bin new file mode 100644 index 0000000000000000000000000000000000000000..f91bafe55cd6a7bb29185cbcf0c5baa0d608c424 --- /dev/null +++ b/params_shard_36.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b4b78155bdca1ac80e82378380c95437f528f1bc1dd12d8d4b74707a257967c +size 22036480 diff --git a/params_shard_37.bin b/params_shard_37.bin new file mode 100644 index 0000000000000000000000000000000000000000..af5c3ab92b9cae6e97eb301b1cec1801b406001a --- /dev/null +++ b/params_shard_37.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae960560e0d614bb986cd7c3402bcdd76adc769da0aa4c61847df3e71657ce93 +size 58720256 diff --git a/params_shard_38.bin b/params_shard_38.bin new file mode 100644 index 0000000000000000000000000000000000000000..b2836758ede8940f8056a0b78bdc5b886e7e3578 --- /dev/null +++ b/params_shard_38.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75b0e22d9f49f8f143b1b5c148c398fd3aef5b59b71ab1b0981bd1fb123f5a9d +size 29360128 diff --git a/params_shard_39.bin b/params_shard_39.bin new file mode 100644 index 0000000000000000000000000000000000000000..eeef5c1aebcf29cc21aadda5e78ea38785ba238b --- /dev/null +++ b/params_shard_39.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5f3d96d0f764c48313a4b98e8b1e13b95e0657a43cd306d13fb4903852d02c7 +size 30932992 diff --git a/params_shard_4.bin b/params_shard_4.bin new file mode 100644 index 0000000000000000000000000000000000000000..ab29cee76ab4106d1619fbe1c3a6c9a58328c07f --- /dev/null +++ b/params_shard_4.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ede13aba3eadb2b65f8ebf1be8524c49c1af034d844cd1aba1c554f98bbfc186 +size 25182208 diff --git a/params_shard_40.bin b/params_shard_40.bin new file mode 100644 index 0000000000000000000000000000000000000000..305ed69c803b58f5ae6a5a39d3208e4d20c1168a --- /dev/null +++ b/params_shard_40.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17407b5f7450c64707d78d4c731c0c9810a8371e8c93d5f94db5e3757137c65f +size 58720256 diff --git a/params_shard_41.bin b/params_shard_41.bin new file mode 100644 index 0000000000000000000000000000000000000000..6839a682c072f186d0bf66d5dbfee0033d7e1c6d --- /dev/null +++ b/params_shard_41.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19d5eb180c59c18a4a3b58c24e833717037454f71946fada5d3f949360456d09 +size 27279360 diff --git a/params_shard_42.bin b/params_shard_42.bin new file mode 100644 index 0000000000000000000000000000000000000000..a7d6a7d20315a478ee173a6eb9a288d9076f12a4 --- /dev/null +++ b/params_shard_42.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be33045ea44ecf54b7b3be83b4455e43aa169800c7d1404b4fcb082931df3d78 +size 29360128 diff --git a/params_shard_43.bin b/params_shard_43.bin new file mode 100644 index 0000000000000000000000000000000000000000..a50ecd04f76e34a4b1a04fbee0ef7c9717a3bee2 --- /dev/null +++ b/params_shard_43.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:142f8ecd047129e2f251bf55d9368ecee5d048dab2ec7bd8bec38f3aa5bad41f +size 25182208 diff --git a/params_shard_44.bin b/params_shard_44.bin new file mode 100644 index 0000000000000000000000000000000000000000..8f4b146ff177ec74e681431af283ba32196eb880 --- /dev/null +++ b/params_shard_44.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b41a424db691671f5941d2c28e093b28c6b1d4478fa34a63bd9347ca97c445db +size 58720256 diff --git a/params_shard_45.bin b/params_shard_45.bin new file mode 100644 index 0000000000000000000000000000000000000000..006c1cc567db8a3f8bd2d0305e9bcfb22908381e --- /dev/null +++ b/params_shard_45.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faf585e0b84a1e15f20191ad9ce97276fbdbc9603d1d3f4a5433bf4f3500b1aa +size 29360128 diff --git a/params_shard_46.bin b/params_shard_46.bin new file mode 100644 index 0000000000000000000000000000000000000000..b7f01f1cfd3020eb529fd97b90e6a3c04799931c --- /dev/null +++ b/params_shard_46.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a909e277acbbc413dd60db2893229fcba60dd18c7d8427b16a5b83c6c92c0aa0 +size 33046528 diff --git a/params_shard_47.bin b/params_shard_47.bin new file mode 100644 index 0000000000000000000000000000000000000000..04196e5503b58700229bc90f8c4bed42e2e7e8fa --- /dev/null +++ b/params_shard_47.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a51f505e7318f73b549652acd16365318a25e0ca62a993b88df071e7a0a5fc18 +size 58720256 diff --git a/params_shard_48.bin b/params_shard_48.bin new file mode 100644 index 0000000000000000000000000000000000000000..4e9d1346bdb1e40f1757861616dab6caae4143f2 --- /dev/null +++ b/params_shard_48.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd9888ea338a2ce69d06451a2ffc180b626a4707a9cf447b721010b941f7c34d +size 29360128 diff --git a/params_shard_49.bin b/params_shard_49.bin new file mode 100644 index 0000000000000000000000000000000000000000..37bb776d1117a38ebffd8ce02311d0d08dae6cb8 --- /dev/null +++ b/params_shard_49.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9160b2c3571da852efa4f9034e66b8be9ec54f846a7da6e1b74584eeac736a5 +size 22036480 diff --git a/params_shard_5.bin b/params_shard_5.bin new file mode 100644 index 0000000000000000000000000000000000000000..74188ffaf28bf24e22266ad6c21a6f71d84d6666 --- /dev/null +++ b/params_shard_5.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7f3dfbababc17bc9a523363bbd57a4a63db992824577ec91af222ac698570ae +size 58720256 diff --git a/params_shard_50.bin b/params_shard_50.bin new file mode 100644 index 0000000000000000000000000000000000000000..4bda0650ea179e21eeb5fdb6b734a7f3c966df5f --- /dev/null +++ b/params_shard_50.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b6a8dd7b32ebc987801efbd77b40030e0268f27418f0b662f78849451d9f670 +size 58720256 diff --git a/params_shard_51.bin b/params_shard_51.bin new file mode 100644 index 0000000000000000000000000000000000000000..d08f32eeea9ef495050596915db5b47b84e9a9fd --- /dev/null +++ b/params_shard_51.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20be7b08170ee077e8394f9a0ae8a5403e7bbf19f95db08a136cc4e27b8f2e52 +size 29360128 diff --git a/params_shard_6.bin b/params_shard_6.bin new file mode 100644 index 0000000000000000000000000000000000000000..1864c9f2944b8e5d5d6325cc9dc93ea7d4dcb4b2 --- /dev/null +++ b/params_shard_6.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b90b232642611b2163635d1cdbddfa7fbcb1a28a5e39c4c511207eab76685982 +size 29360128 diff --git a/params_shard_7.bin b/params_shard_7.bin new file mode 100644 index 0000000000000000000000000000000000000000..ee3ab9b8845632f9003b73195fa8224c092366cb --- /dev/null +++ b/params_shard_7.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1008e62d94dd6a5cefed9ce132a6178509030c5376e2b9528183ae4a80ab6964 +size 33046528 diff --git a/params_shard_8.bin b/params_shard_8.bin new file mode 100644 index 0000000000000000000000000000000000000000..de6b3b06f16f18db17df7f5b2ffa78d866e4f78e --- /dev/null +++ b/params_shard_8.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdf0a287b07e1b32836b453d9f41b25e123ee55b24cf1fbca844b84502010870 +size 58720256 diff --git a/params_shard_9.bin b/params_shard_9.bin new file mode 100644 index 0000000000000000000000000000000000000000..402f073e98e6d0e316383be1d39fec8014402f99 --- /dev/null +++ b/params_shard_9.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6e75e3428e23e16911062187ec55bc4747ff7e5a2bc4ac524ac99902a255e13 +size 29360128