diff --git a/mlc-chat-config.json b/mlc-chat-config.json new file mode 100644 index 0000000000000000000000000000000000000000..4a0d4acd410f6e24fae9652b0d402193dd13a405 --- /dev/null +++ b/mlc-chat-config.json @@ -0,0 +1,16 @@ +{ + "model_lib": "Llama-2-13b-chat-omniquant-w2a16g128asym", + "local_id": "Llama-2-13b-chat-omniquant-w2a16g128asym", + "conv_template": "llama-2", + "temperature": 0.7, + "repetition_penalty": 1.0, + "top_p": 0.95, + "mean_gen_len": 128, + "max_gen_len": 512, + "shift_fill_factor": 0.3, + "tokenizer_files": [ + "tokenizer.model" + ], + "model_category": "llama", + "model_name": "Llama-2-13b-chat-omniquant" +} \ No newline at end of file diff --git a/ndarray-cache.json b/ndarray-cache.json new file mode 100644 index 0000000000000000000000000000000000000000..fa13f8c0dd3e0567f5d873e3e705c93c3d124bf2 --- /dev/null +++ b/ndarray-cache.json @@ -0,0 +1,6995 @@ +{ + "metadata": { + "ParamSize": 565 + }, + "records": [ + { + "dataPath": "params_shard_0.bin", + "format": "raw-shard", + "nbytes": 327680000, + "records": [ + { + "name": "param_0", + "shape": [ + 32000, + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 327680000, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_1.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_7", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_2.bin", + "format": "raw-shard", + "nbytes": 31703040, + "records": [ + { + "name": "param_1", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + }, + { + "name": "param_2", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 19660800 + }, + { + "name": "param_3", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20889600 + }, + { + "name": "param_4", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 22118400 + }, + { + "name": "param_5", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 28672000 + }, + { + "name": "param_6", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 29081600 + }, + { + "name": "param_8", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 29491200 + } + ] + }, + { + "dataPath": "params_shard_3.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_15", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_4.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_21", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_5.bin", + "format": "raw-shard", + "nbytes": 31969280, + "records": [ + { + "name": "param_9", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 0 + }, + { + "name": "param_10", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 2211840 + }, + { + "name": "param_11", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19906560 + }, + { + "name": "param_12", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 21012480 + }, + { + "name": "param_13", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 22118400 + }, + { + "name": "param_14", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 22128640 + }, + { + "name": "param_16", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 22138880 + }, + { + "name": "param_17", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 23367680 + }, + { + "name": "param_18", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 24596480 + }, + { + "name": "param_19", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 31150080 + }, + { + "name": "param_20", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 31559680 + } + ] + }, + { + "dataPath": "params_shard_6.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_29", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_7.bin", + "format": "raw-shard", + "nbytes": 33361920, + "records": [ + { + "name": "param_22", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 0 + }, + { + "name": "param_23", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 2211840 + }, + { + "name": "param_24", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 4423680 + }, + { + "name": "param_25", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 22118400 + }, + { + "name": "param_26", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 23224320 + }, + { + "name": "param_27", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 24330240 + }, + { + "name": "param_28", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 24340480 + }, + { + "name": "param_30", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 24350720 + }, + { + "name": "param_31", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 25579520 + }, + { + "name": "param_32", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 26808320 + } + ] + }, + { + "dataPath": "params_shard_8.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_35", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_9.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_43", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_10.bin", + "format": "raw-shard", + "nbytes": 27627520, + "records": [ + { + "name": "param_33", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 0 + }, + { + "name": "param_34", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 409600 + }, + { + "name": "param_36", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 819200 + }, + { + "name": "param_37", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 3031040 + }, + { + "name": "param_38", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 5242880 + }, + { + "name": "param_39", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 22937600 + }, + { + "name": "param_40", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 24043520 + }, + { + "name": "param_41", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 25149440 + }, + { + "name": "param_42", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 25159680 + }, + { + "name": "param_44", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 25169920 + }, + { + "name": "param_45", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 26398720 + } + ] + }, + { + "dataPath": "params_shard_11.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_49", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_12.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_57", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_13.bin", + "format": "raw-shard", + "nbytes": 32952320, + "records": [ + { + "name": "param_46", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 0 + }, + { + "name": "param_47", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 6553600 + }, + { + "name": "param_48", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 6963200 + }, + { + "name": "param_50", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 7372800 + }, + { + "name": "param_51", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 9584640 + }, + { + "name": "param_52", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 11796480 + }, + { + "name": "param_53", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 29491200 + }, + { + "name": "param_54", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 30597120 + }, + { + "name": "param_55", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 31703040 + }, + { + "name": "param_56", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 31713280 + }, + { + "name": "param_58", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 31723520 + } + ] + }, + { + "dataPath": "params_shard_14.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_63", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_15.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_71", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_16.bin", + "format": "raw-shard", + "nbytes": 32952320, + "records": [ + { + "name": "param_59", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 0 + }, + { + "name": "param_60", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 1228800 + }, + { + "name": "param_61", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 7782400 + }, + { + "name": "param_62", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 8192000 + }, + { + "name": "param_64", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 8601600 + }, + { + "name": "param_65", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 10813440 + }, + { + "name": "param_66", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 13025280 + }, + { + "name": "param_67", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 30720000 + }, + { + "name": "param_68", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 31825920 + }, + { + "name": "param_69", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 32931840 + }, + { + "name": "param_70", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 32942080 + } + ] + }, + { + "dataPath": "params_shard_17.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_77", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_18.bin", + "format": "raw-shard", + "nbytes": 33054720, + "records": [ + { + "name": "param_72", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 0 + }, + { + "name": "param_73", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 1228800 + }, + { + "name": "param_74", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 2457600 + }, + { + "name": "param_75", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 9011200 + }, + { + "name": "param_76", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 9420800 + }, + { + "name": "param_78", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 9830400 + }, + { + "name": "param_79", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 12042240 + }, + { + "name": "param_80", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 14254080 + }, + { + "name": "param_81", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 31948800 + } + ] + }, + { + "dataPath": "params_shard_19.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_91", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_20.bin", + "format": "raw-shard", + "nbytes": 32829440, + "records": [ + { + "name": "param_82", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 0 + }, + { + "name": "param_83", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 1105920 + }, + { + "name": "param_84", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 1116160 + }, + { + "name": "param_85", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 1126400 + }, + { + "name": "param_86", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20787200 + }, + { + "name": "param_87", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 22016000 + }, + { + "name": "param_88", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 23244800 + }, + { + "name": "param_89", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 29798400 + }, + { + "name": "param_90", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 30208000 + }, + { + "name": "param_92", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 30617600 + } + ] + }, + { + "dataPath": "params_shard_21.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_99", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_22.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_105", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_23.bin", + "format": "raw-shard", + "nbytes": 31969280, + "records": [ + { + "name": "param_93", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 0 + }, + { + "name": "param_94", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 2211840 + }, + { + "name": "param_95", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19906560 + }, + { + "name": "param_96", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 21012480 + }, + { + "name": "param_97", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 22118400 + }, + { + "name": "param_98", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 22128640 + }, + { + "name": "param_100", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 22138880 + }, + { + "name": "param_101", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 23367680 + }, + { + "name": "param_102", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 24596480 + }, + { + "name": "param_103", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 31150080 + }, + { + "name": "param_104", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 31559680 + } + ] + }, + { + "dataPath": "params_shard_24.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_113", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_25.bin", + "format": "raw-shard", + "nbytes": 33361920, + "records": [ + { + "name": "param_106", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 0 + }, + { + "name": "param_107", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 2211840 + }, + { + "name": "param_108", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 4423680 + }, + { + "name": "param_109", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 22118400 + }, + { + "name": "param_110", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 23224320 + }, + { + "name": "param_111", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 24330240 + }, + { + "name": "param_112", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 24340480 + }, + { + "name": "param_114", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 24350720 + }, + { + "name": "param_115", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 25579520 + }, + { + "name": "param_116", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 26808320 + } + ] + }, + { + "dataPath": "params_shard_26.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_119", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_27.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_127", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_28.bin", + "format": "raw-shard", + "nbytes": 27627520, + "records": [ + { + "name": "param_117", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 0 + }, + { + "name": "param_118", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 409600 + }, + { + "name": "param_120", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 819200 + }, + { + "name": "param_121", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 3031040 + }, + { + "name": "param_122", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 5242880 + }, + { + "name": "param_123", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 22937600 + }, + { + "name": "param_124", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 24043520 + }, + { + "name": "param_125", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 25149440 + }, + { + "name": "param_126", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 25159680 + }, + { + "name": "param_128", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 25169920 + }, + { + "name": "param_129", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 26398720 + } + ] + }, + { + "dataPath": "params_shard_29.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_133", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_30.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_141", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_31.bin", + "format": "raw-shard", + "nbytes": 32952320, + "records": [ + { + "name": "param_130", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 0 + }, + { + "name": "param_131", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 6553600 + }, + { + "name": "param_132", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 6963200 + }, + { + "name": "param_134", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 7372800 + }, + { + "name": "param_135", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 9584640 + }, + { + "name": "param_136", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 11796480 + }, + { + "name": "param_137", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 29491200 + }, + { + "name": "param_138", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 30597120 + }, + { + "name": "param_139", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 31703040 + }, + { + "name": "param_140", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 31713280 + }, + { + "name": "param_142", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 31723520 + } + ] + }, + { + "dataPath": "params_shard_32.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_147", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_33.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_155", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_34.bin", + "format": "raw-shard", + "nbytes": 32952320, + "records": [ + { + "name": "param_143", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 0 + }, + { + "name": "param_144", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 1228800 + }, + { + "name": "param_145", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 7782400 + }, + { + "name": "param_146", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 8192000 + }, + { + "name": "param_148", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 8601600 + }, + { + "name": "param_149", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 10813440 + }, + { + "name": "param_150", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 13025280 + }, + { + "name": "param_151", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 30720000 + }, + { + "name": "param_152", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 31825920 + }, + { + "name": "param_153", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 32931840 + }, + { + "name": "param_154", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 32942080 + } + ] + }, + { + "dataPath": "params_shard_35.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_161", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_36.bin", + "format": "raw-shard", + "nbytes": 33054720, + "records": [ + { + "name": "param_156", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 0 + }, + { + "name": "param_157", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 1228800 + }, + { + "name": "param_158", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 2457600 + }, + { + "name": "param_159", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 9011200 + }, + { + "name": "param_160", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 9420800 + }, + { + "name": "param_162", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 9830400 + }, + { + "name": "param_163", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 12042240 + }, + { + "name": "param_164", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 14254080 + }, + { + "name": "param_165", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 31948800 + } + ] + }, + { + "dataPath": "params_shard_37.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_175", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_38.bin", + "format": "raw-shard", + "nbytes": 32829440, + "records": [ + { + "name": "param_166", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 0 + }, + { + "name": "param_167", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 1105920 + }, + { + "name": "param_168", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 1116160 + }, + { + "name": "param_169", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 1126400 + }, + { + "name": "param_170", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20787200 + }, + { + "name": "param_171", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 22016000 + }, + { + "name": "param_172", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 23244800 + }, + { + "name": "param_173", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 29798400 + }, + { + "name": "param_174", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 30208000 + }, + { + "name": "param_176", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 30617600 + } + ] + }, + { + "dataPath": "params_shard_39.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_183", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_40.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_189", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_41.bin", + "format": "raw-shard", + "nbytes": 31969280, + "records": [ + { + "name": "param_177", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 0 + }, + { + "name": "param_178", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 2211840 + }, + { + "name": "param_179", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19906560 + }, + { + "name": "param_180", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 21012480 + }, + { + "name": "param_181", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 22118400 + }, + { + "name": "param_182", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 22128640 + }, + { + "name": "param_184", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 22138880 + }, + { + "name": "param_185", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 23367680 + }, + { + "name": "param_186", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 24596480 + }, + { + "name": "param_187", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 31150080 + }, + { + "name": "param_188", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 31559680 + } + ] + }, + { + "dataPath": "params_shard_42.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_197", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_43.bin", + "format": "raw-shard", + "nbytes": 33361920, + "records": [ + { + "name": "param_190", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 0 + }, + { + "name": "param_191", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 2211840 + }, + { + "name": "param_192", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 4423680 + }, + { + "name": "param_193", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 22118400 + }, + { + "name": "param_194", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 23224320 + }, + { + "name": "param_195", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 24330240 + }, + { + "name": "param_196", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 24340480 + }, + { + "name": "param_198", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 24350720 + }, + { + "name": "param_199", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 25579520 + }, + { + "name": "param_200", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 26808320 + } + ] + }, + { + "dataPath": "params_shard_44.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_203", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_45.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_211", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_46.bin", + "format": "raw-shard", + "nbytes": 27627520, + "records": [ + { + "name": "param_201", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 0 + }, + { + "name": "param_202", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 409600 + }, + { + "name": "param_204", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 819200 + }, + { + "name": "param_205", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 3031040 + }, + { + "name": "param_206", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 5242880 + }, + { + "name": "param_207", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 22937600 + }, + { + "name": "param_208", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 24043520 + }, + { + "name": "param_209", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 25149440 + }, + { + "name": "param_210", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 25159680 + }, + { + "name": "param_212", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 25169920 + }, + { + "name": "param_213", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 26398720 + } + ] + }, + { + "dataPath": "params_shard_47.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_217", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_48.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_225", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_49.bin", + "format": "raw-shard", + "nbytes": 32952320, + "records": [ + { + "name": "param_214", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 0 + }, + { + "name": "param_215", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 6553600 + }, + { + "name": "param_216", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 6963200 + }, + { + "name": "param_218", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 7372800 + }, + { + "name": "param_219", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 9584640 + }, + { + "name": "param_220", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 11796480 + }, + { + "name": "param_221", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 29491200 + }, + { + "name": "param_222", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 30597120 + }, + { + "name": "param_223", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 31703040 + }, + { + "name": "param_224", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 31713280 + }, + { + "name": "param_226", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 31723520 + } + ] + }, + { + "dataPath": "params_shard_50.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_231", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_51.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_239", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_52.bin", + "format": "raw-shard", + "nbytes": 32952320, + "records": [ + { + "name": "param_227", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 0 + }, + { + "name": "param_228", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 1228800 + }, + { + "name": "param_229", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 7782400 + }, + { + "name": "param_230", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 8192000 + }, + { + "name": "param_232", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 8601600 + }, + { + "name": "param_233", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 10813440 + }, + { + "name": "param_234", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 13025280 + }, + { + "name": "param_235", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 30720000 + }, + { + "name": "param_236", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 31825920 + }, + { + "name": "param_237", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 32931840 + }, + { + "name": "param_238", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 32942080 + } + ] + }, + { + "dataPath": "params_shard_53.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_245", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_54.bin", + "format": "raw-shard", + "nbytes": 33054720, + "records": [ + { + "name": "param_240", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 0 + }, + { + "name": "param_241", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 1228800 + }, + { + "name": "param_242", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 2457600 + }, + { + "name": "param_243", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 9011200 + }, + { + "name": "param_244", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 9420800 + }, + { + "name": "param_246", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 9830400 + }, + { + "name": "param_247", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 12042240 + }, + { + "name": "param_248", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 14254080 + }, + { + "name": "param_249", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 31948800 + } + ] + }, + { + "dataPath": "params_shard_55.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_259", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_56.bin", + "format": "raw-shard", + "nbytes": 32829440, + "records": [ + { + "name": "param_250", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 0 + }, + { + "name": "param_251", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 1105920 + }, + { + "name": "param_252", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 1116160 + }, + { + "name": "param_253", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 1126400 + }, + { + "name": "param_254", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20787200 + }, + { + "name": "param_255", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 22016000 + }, + { + "name": "param_256", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 23244800 + }, + { + "name": "param_257", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 29798400 + }, + { + "name": "param_258", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 30208000 + }, + { + "name": "param_260", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 30617600 + } + ] + }, + { + "dataPath": "params_shard_57.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_267", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_58.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_273", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_59.bin", + "format": "raw-shard", + "nbytes": 31969280, + "records": [ + { + "name": "param_261", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 0 + }, + { + "name": "param_262", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 2211840 + }, + { + "name": "param_263", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19906560 + }, + { + "name": "param_264", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 21012480 + }, + { + "name": "param_265", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 22118400 + }, + { + "name": "param_266", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 22128640 + }, + { + "name": "param_268", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 22138880 + }, + { + "name": "param_269", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 23367680 + }, + { + "name": "param_270", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 24596480 + }, + { + "name": "param_271", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 31150080 + }, + { + "name": "param_272", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 31559680 + } + ] + }, + { + "dataPath": "params_shard_60.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_281", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_61.bin", + "format": "raw-shard", + "nbytes": 33361920, + "records": [ + { + "name": "param_274", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 0 + }, + { + "name": "param_275", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 2211840 + }, + { + "name": "param_276", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 4423680 + }, + { + "name": "param_277", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 22118400 + }, + { + "name": "param_278", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 23224320 + }, + { + "name": "param_279", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 24330240 + }, + { + "name": "param_280", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 24340480 + }, + { + "name": "param_282", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 24350720 + }, + { + "name": "param_283", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 25579520 + }, + { + "name": "param_284", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 26808320 + } + ] + }, + { + "dataPath": "params_shard_62.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_287", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_63.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_295", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_64.bin", + "format": "raw-shard", + "nbytes": 27627520, + "records": [ + { + "name": "param_285", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 0 + }, + { + "name": "param_286", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 409600 + }, + { + "name": "param_288", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 819200 + }, + { + "name": "param_289", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 3031040 + }, + { + "name": "param_290", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 5242880 + }, + { + "name": "param_291", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 22937600 + }, + { + "name": "param_292", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 24043520 + }, + { + "name": "param_293", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 25149440 + }, + { + "name": "param_294", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 25159680 + }, + { + "name": "param_296", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 25169920 + }, + { + "name": "param_297", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 26398720 + } + ] + }, + { + "dataPath": "params_shard_65.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_301", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_66.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_309", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_67.bin", + "format": "raw-shard", + "nbytes": 32952320, + "records": [ + { + "name": "param_298", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 0 + }, + { + "name": "param_299", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 6553600 + }, + { + "name": "param_300", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 6963200 + }, + { + "name": "param_302", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 7372800 + }, + { + "name": "param_303", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 9584640 + }, + { + "name": "param_304", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 11796480 + }, + { + "name": "param_305", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 29491200 + }, + { + "name": "param_306", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 30597120 + }, + { + "name": "param_307", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 31703040 + }, + { + "name": "param_308", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 31713280 + }, + { + "name": "param_310", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 31723520 + } + ] + }, + { + "dataPath": "params_shard_68.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_315", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_69.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_323", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_70.bin", + "format": "raw-shard", + "nbytes": 32952320, + "records": [ + { + "name": "param_311", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 0 + }, + { + "name": "param_312", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 1228800 + }, + { + "name": "param_313", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 7782400 + }, + { + "name": "param_314", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 8192000 + }, + { + "name": "param_316", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 8601600 + }, + { + "name": "param_317", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 10813440 + }, + { + "name": "param_318", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 13025280 + }, + { + "name": "param_319", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 30720000 + }, + { + "name": "param_320", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 31825920 + }, + { + "name": "param_321", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 32931840 + }, + { + "name": "param_322", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 32942080 + } + ] + }, + { + "dataPath": "params_shard_71.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_329", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_72.bin", + "format": "raw-shard", + "nbytes": 33054720, + "records": [ + { + "name": "param_324", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 0 + }, + { + "name": "param_325", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 1228800 + }, + { + "name": "param_326", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 2457600 + }, + { + "name": "param_327", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 9011200 + }, + { + "name": "param_328", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 9420800 + }, + { + "name": "param_330", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 9830400 + }, + { + "name": "param_331", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 12042240 + }, + { + "name": "param_332", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 14254080 + }, + { + "name": "param_333", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 31948800 + } + ] + }, + { + "dataPath": "params_shard_73.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_343", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_74.bin", + "format": "raw-shard", + "nbytes": 32829440, + "records": [ + { + "name": "param_334", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 0 + }, + { + "name": "param_335", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 1105920 + }, + { + "name": "param_336", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 1116160 + }, + { + "name": "param_337", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 1126400 + }, + { + "name": "param_338", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20787200 + }, + { + "name": "param_339", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 22016000 + }, + { + "name": "param_340", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 23244800 + }, + { + "name": "param_341", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 29798400 + }, + { + "name": "param_342", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 30208000 + }, + { + "name": "param_344", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 30617600 + } + ] + }, + { + "dataPath": "params_shard_75.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_351", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_76.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_357", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_77.bin", + "format": "raw-shard", + "nbytes": 31969280, + "records": [ + { + "name": "param_345", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 0 + }, + { + "name": "param_346", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 2211840 + }, + { + "name": "param_347", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19906560 + }, + { + "name": "param_348", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 21012480 + }, + { + "name": "param_349", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 22118400 + }, + { + "name": "param_350", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 22128640 + }, + { + "name": "param_352", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 22138880 + }, + { + "name": "param_353", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 23367680 + }, + { + "name": "param_354", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 24596480 + }, + { + "name": "param_355", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 31150080 + }, + { + "name": "param_356", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 31559680 + } + ] + }, + { + "dataPath": "params_shard_78.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_365", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_79.bin", + "format": "raw-shard", + "nbytes": 33361920, + "records": [ + { + "name": "param_358", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 0 + }, + { + "name": "param_359", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 2211840 + }, + { + "name": "param_360", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 4423680 + }, + { + "name": "param_361", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 22118400 + }, + { + "name": "param_362", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 23224320 + }, + { + "name": "param_363", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 24330240 + }, + { + "name": "param_364", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 24340480 + }, + { + "name": "param_366", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 24350720 + }, + { + "name": "param_367", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 25579520 + }, + { + "name": "param_368", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 26808320 + } + ] + }, + { + "dataPath": "params_shard_80.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_371", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_81.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_379", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_82.bin", + "format": "raw-shard", + "nbytes": 27627520, + "records": [ + { + "name": "param_369", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 0 + }, + { + "name": "param_370", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 409600 + }, + { + "name": "param_372", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 819200 + }, + { + "name": "param_373", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 3031040 + }, + { + "name": "param_374", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 5242880 + }, + { + "name": "param_375", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 22937600 + }, + { + "name": "param_376", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 24043520 + }, + { + "name": "param_377", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 25149440 + }, + { + "name": "param_378", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 25159680 + }, + { + "name": "param_380", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 25169920 + }, + { + "name": "param_381", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 26398720 + } + ] + }, + { + "dataPath": "params_shard_83.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_385", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_84.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_393", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_85.bin", + "format": "raw-shard", + "nbytes": 32952320, + "records": [ + { + "name": "param_382", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 0 + }, + { + "name": "param_383", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 6553600 + }, + { + "name": "param_384", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 6963200 + }, + { + "name": "param_386", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 7372800 + }, + { + "name": "param_387", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 9584640 + }, + { + "name": "param_388", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 11796480 + }, + { + "name": "param_389", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 29491200 + }, + { + "name": "param_390", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 30597120 + }, + { + "name": "param_391", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 31703040 + }, + { + "name": "param_392", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 31713280 + }, + { + "name": "param_394", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 31723520 + } + ] + }, + { + "dataPath": "params_shard_86.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_399", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_87.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_407", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_88.bin", + "format": "raw-shard", + "nbytes": 32952320, + "records": [ + { + "name": "param_395", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 0 + }, + { + "name": "param_396", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 1228800 + }, + { + "name": "param_397", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 7782400 + }, + { + "name": "param_398", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 8192000 + }, + { + "name": "param_400", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 8601600 + }, + { + "name": "param_401", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 10813440 + }, + { + "name": "param_402", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 13025280 + }, + { + "name": "param_403", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 30720000 + }, + { + "name": "param_404", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 31825920 + }, + { + "name": "param_405", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 32931840 + }, + { + "name": "param_406", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 32942080 + } + ] + }, + { + "dataPath": "params_shard_89.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_413", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_90.bin", + "format": "raw-shard", + "nbytes": 33054720, + "records": [ + { + "name": "param_408", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 0 + }, + { + "name": "param_409", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 1228800 + }, + { + "name": "param_410", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 2457600 + }, + { + "name": "param_411", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 9011200 + }, + { + "name": "param_412", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 9420800 + }, + { + "name": "param_414", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 9830400 + }, + { + "name": "param_415", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 12042240 + }, + { + "name": "param_416", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 14254080 + }, + { + "name": "param_417", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 31948800 + } + ] + }, + { + "dataPath": "params_shard_91.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_427", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_92.bin", + "format": "raw-shard", + "nbytes": 32829440, + "records": [ + { + "name": "param_418", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 0 + }, + { + "name": "param_419", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 1105920 + }, + { + "name": "param_420", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 1116160 + }, + { + "name": "param_421", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 1126400 + }, + { + "name": "param_422", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20787200 + }, + { + "name": "param_423", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 22016000 + }, + { + "name": "param_424", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 23244800 + }, + { + "name": "param_425", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 29798400 + }, + { + "name": "param_426", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 30208000 + }, + { + "name": "param_428", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 30617600 + } + ] + }, + { + "dataPath": "params_shard_93.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_435", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_94.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_441", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_95.bin", + "format": "raw-shard", + "nbytes": 31969280, + "records": [ + { + "name": "param_429", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 0 + }, + { + "name": "param_430", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 2211840 + }, + { + "name": "param_431", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19906560 + }, + { + "name": "param_432", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 21012480 + }, + { + "name": "param_433", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 22118400 + }, + { + "name": "param_434", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 22128640 + }, + { + "name": "param_436", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 22138880 + }, + { + "name": "param_437", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 23367680 + }, + { + "name": "param_438", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 24596480 + }, + { + "name": "param_439", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 31150080 + }, + { + "name": "param_440", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 31559680 + } + ] + }, + { + "dataPath": "params_shard_96.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_449", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_97.bin", + "format": "raw-shard", + "nbytes": 33361920, + "records": [ + { + "name": "param_442", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 0 + }, + { + "name": "param_443", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 2211840 + }, + { + "name": "param_444", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 4423680 + }, + { + "name": "param_445", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 22118400 + }, + { + "name": "param_446", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 23224320 + }, + { + "name": "param_447", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 24330240 + }, + { + "name": "param_448", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 24340480 + }, + { + "name": "param_450", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 24350720 + }, + { + "name": "param_451", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 25579520 + }, + { + "name": "param_452", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 26808320 + } + ] + }, + { + "dataPath": "params_shard_98.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_455", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_99.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_463", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_100.bin", + "format": "raw-shard", + "nbytes": 27627520, + "records": [ + { + "name": "param_453", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 0 + }, + { + "name": "param_454", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 409600 + }, + { + "name": "param_456", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 819200 + }, + { + "name": "param_457", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 3031040 + }, + { + "name": "param_458", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 5242880 + }, + { + "name": "param_459", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 22937600 + }, + { + "name": "param_460", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 24043520 + }, + { + "name": "param_461", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 25149440 + }, + { + "name": "param_462", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 25159680 + }, + { + "name": "param_464", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 25169920 + }, + { + "name": "param_465", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 26398720 + } + ] + }, + { + "dataPath": "params_shard_101.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_469", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_102.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_477", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_103.bin", + "format": "raw-shard", + "nbytes": 32952320, + "records": [ + { + "name": "param_466", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 0 + }, + { + "name": "param_467", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 6553600 + }, + { + "name": "param_468", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 6963200 + }, + { + "name": "param_470", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 7372800 + }, + { + "name": "param_471", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 9584640 + }, + { + "name": "param_472", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 11796480 + }, + { + "name": "param_473", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 29491200 + }, + { + "name": "param_474", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 30597120 + }, + { + "name": "param_475", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 31703040 + }, + { + "name": "param_476", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 31713280 + }, + { + "name": "param_478", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 31723520 + } + ] + }, + { + "dataPath": "params_shard_104.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_483", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_105.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_491", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_106.bin", + "format": "raw-shard", + "nbytes": 32952320, + "records": [ + { + "name": "param_479", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 0 + }, + { + "name": "param_480", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 1228800 + }, + { + "name": "param_481", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 7782400 + }, + { + "name": "param_482", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 8192000 + }, + { + "name": "param_484", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 8601600 + }, + { + "name": "param_485", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 10813440 + }, + { + "name": "param_486", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 13025280 + }, + { + "name": "param_487", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 30720000 + }, + { + "name": "param_488", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 31825920 + }, + { + "name": "param_489", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 32931840 + }, + { + "name": "param_490", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 32942080 + } + ] + }, + { + "dataPath": "params_shard_107.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_497", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_108.bin", + "format": "raw-shard", + "nbytes": 33054720, + "records": [ + { + "name": "param_492", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 0 + }, + { + "name": "param_493", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 1228800 + }, + { + "name": "param_494", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 2457600 + }, + { + "name": "param_495", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 9011200 + }, + { + "name": "param_496", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 9420800 + }, + { + "name": "param_498", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 9830400 + }, + { + "name": "param_499", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 12042240 + }, + { + "name": "param_500", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 14254080 + }, + { + "name": "param_501", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 31948800 + } + ] + }, + { + "dataPath": "params_shard_109.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_511", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_110.bin", + "format": "raw-shard", + "nbytes": 32829440, + "records": [ + { + "name": "param_502", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 0 + }, + { + "name": "param_503", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 1105920 + }, + { + "name": "param_504", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 1116160 + }, + { + "name": "param_505", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 1126400 + }, + { + "name": "param_506", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20787200 + }, + { + "name": "param_507", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 22016000 + }, + { + "name": "param_508", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 23244800 + }, + { + "name": "param_509", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 29798400 + }, + { + "name": "param_510", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 30208000 + }, + { + "name": "param_512", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 30617600 + } + ] + }, + { + "dataPath": "params_shard_111.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_519", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_112.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_525", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_113.bin", + "format": "raw-shard", + "nbytes": 31969280, + "records": [ + { + "name": "param_513", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 0 + }, + { + "name": "param_514", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 2211840 + }, + { + "name": "param_515", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19906560 + }, + { + "name": "param_516", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 21012480 + }, + { + "name": "param_517", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 22118400 + }, + { + "name": "param_518", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 22128640 + }, + { + "name": "param_520", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 22138880 + }, + { + "name": "param_521", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 23367680 + }, + { + "name": "param_522", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 24596480 + }, + { + "name": "param_523", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 31150080 + }, + { + "name": "param_524", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 31559680 + } + ] + }, + { + "dataPath": "params_shard_114.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_533", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_115.bin", + "format": "raw-shard", + "nbytes": 33361920, + "records": [ + { + "name": "param_526", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 0 + }, + { + "name": "param_527", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 2211840 + }, + { + "name": "param_528", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 4423680 + }, + { + "name": "param_529", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 22118400 + }, + { + "name": "param_530", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 23224320 + }, + { + "name": "param_531", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 24330240 + }, + { + "name": "param_532", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 24340480 + }, + { + "name": "param_534", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 24350720 + }, + { + "name": "param_535", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 25579520 + }, + { + "name": "param_536", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 26808320 + } + ] + }, + { + "dataPath": "params_shard_116.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_539", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_117.bin", + "format": "raw-shard", + "nbytes": 19660800, + "records": [ + { + "name": "param_547", + "shape": [ + 15360, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 19660800, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_118.bin", + "format": "raw-shard", + "nbytes": 27627520, + "records": [ + { + "name": "param_537", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 0 + }, + { + "name": "param_538", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 409600 + }, + { + "name": "param_540", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 819200 + }, + { + "name": "param_541", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 3031040 + }, + { + "name": "param_542", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 5242880 + }, + { + "name": "param_543", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 22937600 + }, + { + "name": "param_544", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 24043520 + }, + { + "name": "param_545", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 25149440 + }, + { + "name": "param_546", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 25159680 + }, + { + "name": "param_548", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 25169920 + }, + { + "name": "param_549", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 26398720 + } + ] + }, + { + "dataPath": "params_shard_119.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_553", + "shape": [ + 27648, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_120.bin", + "format": "raw-shard", + "nbytes": 327680000, + "records": [ + { + "name": "param_562", + "shape": [ + 32000, + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 327680000, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_121.bin", + "format": "raw-shard", + "nbytes": 32782336, + "records": [ + { + "name": "param_550", + "shape": [ + 5120, + 320 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 6553600, + "byteOffset": 0 + }, + { + "name": "param_551", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 6553600 + }, + { + "name": "param_552", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 6963200 + }, + { + "name": "param_554", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 7372800 + }, + { + "name": "param_555", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 9584640 + }, + { + "name": "param_556", + "shape": [ + 5120, + 864 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 17694720, + "byteOffset": 11796480 + }, + { + "name": "param_557", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 29491200 + }, + { + "name": "param_558", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 30597120 + }, + { + "name": "param_559", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 31703040 + }, + { + "name": "param_560", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 31713280 + }, + { + "name": "param_561", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 31723520 + }, + { + "name": "param_563", + "shape": [ + 2048, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 524288, + "byteOffset": 31733760 + }, + { + "name": "param_564", + "shape": [ + 2048, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 524288, + "byteOffset": 32258048 + } + ] + } + ] +} \ No newline at end of file diff --git a/params_shard_0.bin b/params_shard_0.bin new file mode 100644 index 0000000000000000000000000000000000000000..5c88e85e65bad524119bfa0f2fae156b044dc45d --- /dev/null +++ b/params_shard_0.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eeb8c2d8a4ba799831bc7f2feed6bac6fb242a6d26632fa2502a091e83596e44 +size 327680000 diff --git a/params_shard_1.bin b/params_shard_1.bin new file mode 100644 index 0000000000000000000000000000000000000000..439a84d04a8d7f2266a97a6d822902a30d2d5f6d --- /dev/null +++ b/params_shard_1.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ac8c327c61e3d94e00043992ae989a7ef8f59be7d96a85049193bd34cbb56b4 +size 35389440 diff --git a/params_shard_10.bin b/params_shard_10.bin new file mode 100644 index 0000000000000000000000000000000000000000..986ff9913eb98153f87fa6a29eb7c27617c1a45a --- /dev/null +++ b/params_shard_10.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db89f9eee3e37020a4611f2d43c1ed1f3ae460c358b86a8e29236cb5882e7adc +size 27627520 diff --git a/params_shard_100.bin b/params_shard_100.bin new file mode 100644 index 0000000000000000000000000000000000000000..0c6754d6640b6c7ecf5abb028dd1faa87105ccc4 --- /dev/null +++ b/params_shard_100.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a98d18f9c731d2fac3d7faf12393365e375612b123fefae1254f1c54e190e9d +size 27627520 diff --git a/params_shard_101.bin b/params_shard_101.bin new file mode 100644 index 0000000000000000000000000000000000000000..1bda6bfc2ed2ad93ce30e486427c4ea4574297a5 --- /dev/null +++ b/params_shard_101.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b95cd9b54285e79ecda038fc53e544ddcf1909228dc0172689a133e23436d615 +size 35389440 diff --git a/params_shard_102.bin b/params_shard_102.bin new file mode 100644 index 0000000000000000000000000000000000000000..194ecda1c13a04e94589384a4e86394671a5941c --- /dev/null +++ b/params_shard_102.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:413279fe8f15743a1a5e422940b7fcb9db4c6e13b097a7e5f8813d45b6b2a961 +size 19660800 diff --git a/params_shard_103.bin b/params_shard_103.bin new file mode 100644 index 0000000000000000000000000000000000000000..17ddaa67fa38b5d435f79e2277980b1777d8879a --- /dev/null +++ b/params_shard_103.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a145b719098199bab55ee35810a8d033d210e491a6be359cece622f2ace2bef4 +size 32952320 diff --git a/params_shard_104.bin b/params_shard_104.bin new file mode 100644 index 0000000000000000000000000000000000000000..a674ce911c433ef8f842d926b92279feea46c5d1 --- /dev/null +++ b/params_shard_104.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38d643aba418fe452bc2edd9eefdd82b95b81fea9d9d0dff9f9d1b8c6bfceae8 +size 35389440 diff --git a/params_shard_105.bin b/params_shard_105.bin new file mode 100644 index 0000000000000000000000000000000000000000..2df8caf8077b259acabef8c16a64fb5a330a597a --- /dev/null +++ b/params_shard_105.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e621849b9e6af299206a3345d0c63c1e40ace2b0c545a7874be3325d335a0daf +size 19660800 diff --git a/params_shard_106.bin b/params_shard_106.bin new file mode 100644 index 0000000000000000000000000000000000000000..7381638719a5b70eb65f52fd62b997a6c0a85dc7 --- /dev/null +++ b/params_shard_106.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1575233467df54e91274a46273a15d7d6e5f422c3d14b87c77553d8539f4e5fd +size 32952320 diff --git a/params_shard_107.bin b/params_shard_107.bin new file mode 100644 index 0000000000000000000000000000000000000000..676815c7859687845aba6ddccbcd168ffcd4a678 --- /dev/null +++ b/params_shard_107.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79aa1a2c8fb2230dd3b4a12d1503a9f53d43a5b2596aa82a70a781cc0793a7af +size 35389440 diff --git a/params_shard_108.bin b/params_shard_108.bin new file mode 100644 index 0000000000000000000000000000000000000000..af5d00769f247dbcf9016e92e6ac2c88141266de --- /dev/null +++ b/params_shard_108.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5a35f7cf31b5fabbfc55d4782990caa43d79d8a75746b17d77319b497df4a76 +size 33054720 diff --git a/params_shard_109.bin b/params_shard_109.bin new file mode 100644 index 0000000000000000000000000000000000000000..07c74c5d0a68d44d10cb27f36f694f0988d9b9e0 --- /dev/null +++ b/params_shard_109.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a160a4e496d851bbb053c6272529fcb37a03fa4d5ca7792aa8205b274a1635b7 +size 35389440 diff --git a/params_shard_11.bin b/params_shard_11.bin new file mode 100644 index 0000000000000000000000000000000000000000..79bdbe8b0710f90bb4902746b8ede919f183d780 --- /dev/null +++ b/params_shard_11.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02d1ba3f2a1f36bf890f44ab1aa1e3e66d0b22a15c6cb2114c32a6396d9666bb +size 35389440 diff --git a/params_shard_110.bin b/params_shard_110.bin new file mode 100644 index 0000000000000000000000000000000000000000..0479d2edc8b58517f773e0844487cc75dc83871b --- /dev/null +++ b/params_shard_110.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:349abcaa9364f868d983a0f1d9c551bd58f1ebd08859ee3746b7966bcaa44506 +size 32829440 diff --git a/params_shard_111.bin b/params_shard_111.bin new file mode 100644 index 0000000000000000000000000000000000000000..a39912b5797c97db9d748a5bb75effc16296d718 --- /dev/null +++ b/params_shard_111.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af251bd824ba072897c4dee30476f7f01e37ddf46b06f2e0f9ad165089b018c4 +size 19660800 diff --git a/params_shard_112.bin b/params_shard_112.bin new file mode 100644 index 0000000000000000000000000000000000000000..6a813d719f06eca1b7394e521bd942e312af4f7f --- /dev/null +++ b/params_shard_112.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3f92e9f9676fd161522f4909417b7f75ee3d8da0f845048924a37219fcd84b9 +size 35389440 diff --git a/params_shard_113.bin b/params_shard_113.bin new file mode 100644 index 0000000000000000000000000000000000000000..06dacddbe21859cbc4dcc65f192fb4bec528eaa0 --- /dev/null +++ b/params_shard_113.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdb5c679e9574a51f2946fce92992dc86aef0c395f3ecdb10d3c33403a21a58a +size 31969280 diff --git a/params_shard_114.bin b/params_shard_114.bin new file mode 100644 index 0000000000000000000000000000000000000000..7946f899927dd908a104aac29418952fc2ad5759 --- /dev/null +++ b/params_shard_114.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e78253c9b9e62725b8f5a9da67390e3da859642fbb9cd85f40b86d31cde01f6 +size 19660800 diff --git a/params_shard_115.bin b/params_shard_115.bin new file mode 100644 index 0000000000000000000000000000000000000000..8d35ba0054c14a81191fd0664e6b66dec58911cc --- /dev/null +++ b/params_shard_115.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da42af6430e48a1d851a2c415d4e75a7c18fc1fa33eef61a80afb633ff1a8c36 +size 33361920 diff --git a/params_shard_116.bin b/params_shard_116.bin new file mode 100644 index 0000000000000000000000000000000000000000..6246e5ef5313b4fad35ea7da104aae03270988a5 --- /dev/null +++ b/params_shard_116.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59a7df6e22ad1a16c9b929a64842bc95f6fc76cf4165376fecc28956f5b1cb92 +size 35389440 diff --git a/params_shard_117.bin b/params_shard_117.bin new file mode 100644 index 0000000000000000000000000000000000000000..6d9e3e02b3a3e22e462905d48109846fb12f4818 --- /dev/null +++ b/params_shard_117.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f9a5ba28f751defcfeba086d224e894d8e50f1f5657db284fe8141a9f3bfe85 +size 19660800 diff --git a/params_shard_118.bin b/params_shard_118.bin new file mode 100644 index 0000000000000000000000000000000000000000..41e69b254449f510c661d6b4f2bf047cf53e4b40 --- /dev/null +++ b/params_shard_118.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24de112da564e66d4941555d8de617dec61ae3e5cd2a2e59b2b2271212bd1e85 +size 27627520 diff --git a/params_shard_119.bin b/params_shard_119.bin new file mode 100644 index 0000000000000000000000000000000000000000..9d27ea628b33f1455b898387d4827e084f597e2b --- /dev/null +++ b/params_shard_119.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9330c7e823446d7bbfec8ec8bf2b5edd6ef13c83b81e467dbd48fb954bca9f48 +size 35389440 diff --git a/params_shard_12.bin b/params_shard_12.bin new file mode 100644 index 0000000000000000000000000000000000000000..0afe1f9f2a4b2b609f30f6b85321ce5a84b962a0 --- /dev/null +++ b/params_shard_12.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c7b937ef4dc7df8a8a1796951972fe994b5b8798f9dccac0444f02829a7ef67 +size 19660800 diff --git a/params_shard_120.bin b/params_shard_120.bin new file mode 100644 index 0000000000000000000000000000000000000000..9aa5e1fa75b01bbfad295e607e70f1a7597ba12e --- /dev/null +++ b/params_shard_120.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fccdfe5f59afdb742bc2a8fba7155f0578ecf599ad9018ae27b806ac73cfadc +size 327680000 diff --git a/params_shard_121.bin b/params_shard_121.bin new file mode 100644 index 0000000000000000000000000000000000000000..da4eeb082b07c8ae67f65f6f5bad800308928b95 --- /dev/null +++ b/params_shard_121.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25366520631d9263b1ebc0d729662006865328c779c340d27cb58b0da856a045 +size 32782336 diff --git a/params_shard_13.bin b/params_shard_13.bin new file mode 100644 index 0000000000000000000000000000000000000000..d62678a091753f1e0a747ca7950d03c443b1fc52 --- /dev/null +++ b/params_shard_13.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:502e1d666207b2491fa413bb1208dd9a4fe95bba0328d38c0c842fd8cd6dea53 +size 32952320 diff --git a/params_shard_14.bin b/params_shard_14.bin new file mode 100644 index 0000000000000000000000000000000000000000..132f386de2cd60ab239d674a6ca249e29b8c218b --- /dev/null +++ b/params_shard_14.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f181886a4fb52b833d137cf2848c25601e3c90373b499cb38c30f5510bb459d0 +size 35389440 diff --git a/params_shard_15.bin b/params_shard_15.bin new file mode 100644 index 0000000000000000000000000000000000000000..21733ea975c1cb13682c7658c053feb18f8547e9 --- /dev/null +++ b/params_shard_15.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ee05bbe9093001b50cd3d364ef97918c68c176bc02d981d77ad26b84a454957 +size 19660800 diff --git a/params_shard_16.bin b/params_shard_16.bin new file mode 100644 index 0000000000000000000000000000000000000000..535e4de40a46a53f3dd67435475aaa7815586e80 --- /dev/null +++ b/params_shard_16.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa03113ad71233c9766b2a4f3678ffbb180596dbd3570e7403c754eb9e33958f +size 32952320 diff --git a/params_shard_17.bin b/params_shard_17.bin new file mode 100644 index 0000000000000000000000000000000000000000..645367cc48cd2bb9440b07fa3489c36346e867cf --- /dev/null +++ b/params_shard_17.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48a6d9f56b191966691dda22a097a6eb912c7a3ec0b8df1d04af02ee71666c66 +size 35389440 diff --git a/params_shard_18.bin b/params_shard_18.bin new file mode 100644 index 0000000000000000000000000000000000000000..ea31754e8c05a9d35d867dec83cd996ccccd131d --- /dev/null +++ b/params_shard_18.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd4daed8b62c77af401bc843be2115e7e749e2d441f06e2a0a438669723f516e +size 33054720 diff --git a/params_shard_19.bin b/params_shard_19.bin new file mode 100644 index 0000000000000000000000000000000000000000..65230547ac36945bc9817296d4f24ea96d30fd17 --- /dev/null +++ b/params_shard_19.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:868f9a6da81a37b2949c3598a3ce86fadc758c6d8041676bf8745361a26a57c6 +size 35389440 diff --git a/params_shard_2.bin b/params_shard_2.bin new file mode 100644 index 0000000000000000000000000000000000000000..3d01f5bb2a2474982f5481d78aebfb56fbe6f528 --- /dev/null +++ b/params_shard_2.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2f9f7d043fee7af88e324e93278fdb7f9da11daf5528749fd643ea82e3c07bd +size 31703040 diff --git a/params_shard_20.bin b/params_shard_20.bin new file mode 100644 index 0000000000000000000000000000000000000000..c8bcf113468a677a4059dc88fe50bb0f399a5246 --- /dev/null +++ b/params_shard_20.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b99f4d106a985463b476c82dd6c8c2f00c9221ced85f4bf79ee5184c4dfefcf5 +size 32829440 diff --git a/params_shard_21.bin b/params_shard_21.bin new file mode 100644 index 0000000000000000000000000000000000000000..e6ee3ae6906e039690252d272808d6c7f9ac66e6 --- /dev/null +++ b/params_shard_21.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dacc0b3974573913bf3b1615858345448e05fb8c239f862a71b66898c7920d4 +size 19660800 diff --git a/params_shard_22.bin b/params_shard_22.bin new file mode 100644 index 0000000000000000000000000000000000000000..056d3b53b348a0b0fc760783feddd7b0ee686727 --- /dev/null +++ b/params_shard_22.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e2f1cf79397b7b1ade4b0b12b41ffa7d4b629f0c4f49c38f9aaddb30062f5cd +size 35389440 diff --git a/params_shard_23.bin b/params_shard_23.bin new file mode 100644 index 0000000000000000000000000000000000000000..7f6cc6ae626cab9db4a0d801ed3879f33ab1eb24 --- /dev/null +++ b/params_shard_23.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b995fed61c185bfe7ed0a8e833236915b7eea20e690b9467f26ace1fe25da65 +size 31969280 diff --git a/params_shard_24.bin b/params_shard_24.bin new file mode 100644 index 0000000000000000000000000000000000000000..02f14be23efbceb0cb26b2844b2366c7ab317f9d --- /dev/null +++ b/params_shard_24.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1c237c11d522f14930280a4104124348100873296c334c43f8e4d78665affd1 +size 19660800 diff --git a/params_shard_25.bin b/params_shard_25.bin new file mode 100644 index 0000000000000000000000000000000000000000..c52060ae1c6f5ed228ec38e89a6cfce2d6d19d6a --- /dev/null +++ b/params_shard_25.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c00168f50d7c83e538cbdb20ac18cb41cbdabb4cea1a2ed415e147a09dcd8460 +size 33361920 diff --git a/params_shard_26.bin b/params_shard_26.bin new file mode 100644 index 0000000000000000000000000000000000000000..3086d55fad3485c6f77ee2be165c46a8ab03943d --- /dev/null +++ b/params_shard_26.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cedefcbb94226f7c46e74cfff311882ff5b8f859c86b1f51745ad8e9185cbef1 +size 35389440 diff --git a/params_shard_27.bin b/params_shard_27.bin new file mode 100644 index 0000000000000000000000000000000000000000..11d184ae277fc208321f62f48ed0f081634b8bd6 --- /dev/null +++ b/params_shard_27.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fdf1c3645eafa41c961f60ee201ae90d5d0a849991735416abc3bce3318d12d +size 19660800 diff --git a/params_shard_28.bin b/params_shard_28.bin new file mode 100644 index 0000000000000000000000000000000000000000..1fcfe5a0244c3cbfcba63ad65cb51e01a804295a --- /dev/null +++ b/params_shard_28.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5853ff1490c25b863d01d0e1a3783c98b10b9a54e6e4f82c968bcae61b485ba5 +size 27627520 diff --git a/params_shard_29.bin b/params_shard_29.bin new file mode 100644 index 0000000000000000000000000000000000000000..3cb0f073f341728840c3a6a47718f52594169980 --- /dev/null +++ b/params_shard_29.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcdc51ae053e6722b9fe5e0b1da42f2b184bad3983af411b3b0ab02a7448f530 +size 35389440 diff --git a/params_shard_3.bin b/params_shard_3.bin new file mode 100644 index 0000000000000000000000000000000000000000..86c171eba792ce077f225cbe22aa8449ca7f92bd --- /dev/null +++ b/params_shard_3.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1b3ee827e25005820f62a2b96ee5a67bacae92aa7e3cdec92fbe800de75374e +size 19660800 diff --git a/params_shard_30.bin b/params_shard_30.bin new file mode 100644 index 0000000000000000000000000000000000000000..b173f785367f0e6b0d4862ccdce92a6956966692 --- /dev/null +++ b/params_shard_30.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a95887328ef643f843da5f44248ca62ec2469c650fa3a44f7f59101b095a9f4 +size 19660800 diff --git a/params_shard_31.bin b/params_shard_31.bin new file mode 100644 index 0000000000000000000000000000000000000000..8cc4b38c574d2317eac685318d27e1f86eb5b14d --- /dev/null +++ b/params_shard_31.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10ca6a69d14e9c7c992966aa125f6b219e588bfdd2c12673d2269558c45a3521 +size 32952320 diff --git a/params_shard_32.bin b/params_shard_32.bin new file mode 100644 index 0000000000000000000000000000000000000000..7bc685236ae25e74fa3805e593549ce45b39d785 --- /dev/null +++ b/params_shard_32.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc135640ebf2cf0cb124be70d5d9713a6a8dd5049c9680ab0cb8b0843e8a090c +size 35389440 diff --git a/params_shard_33.bin b/params_shard_33.bin new file mode 100644 index 0000000000000000000000000000000000000000..cdec5cae6e2641aa8071a1290e5e1217d3090b78 --- /dev/null +++ b/params_shard_33.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c46bb7f775296430aee65878abd140781efdda85d03b7c42b1dd6c7de0474b66 +size 19660800 diff --git a/params_shard_34.bin b/params_shard_34.bin new file mode 100644 index 0000000000000000000000000000000000000000..ce19595f4b1d493a689a2aca47f52839ab291786 --- /dev/null +++ b/params_shard_34.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84db2953c7510b045e629ad8545fc590390f8dedffd57a571bf62654a1cdf481 +size 32952320 diff --git a/params_shard_35.bin b/params_shard_35.bin new file mode 100644 index 0000000000000000000000000000000000000000..a51b3e7124b3a9a4ecff5120ace82e4613b83fad --- /dev/null +++ b/params_shard_35.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f552c36a607b83f5ef7a0f034eea6f9420600d92c7d6ae9eed4ce3403aee7ac1 +size 35389440 diff --git a/params_shard_36.bin b/params_shard_36.bin new file mode 100644 index 0000000000000000000000000000000000000000..3197a62e6f912af3d48daa4c1f457c2b95ea3372 --- /dev/null +++ b/params_shard_36.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34a8ed64804eea58f2c8291f639a33abe24bcd78065fc958d6856d888d5b4ce5 +size 33054720 diff --git a/params_shard_37.bin b/params_shard_37.bin new file mode 100644 index 0000000000000000000000000000000000000000..6c950cc4aee742cdd026b8e8f82388e63d0dc1ff --- /dev/null +++ b/params_shard_37.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d1db73ae64509eb549c962b9bc1adfc5b32a6e3ff5a647d4bb20a5b3a2e0558 +size 35389440 diff --git a/params_shard_38.bin b/params_shard_38.bin new file mode 100644 index 0000000000000000000000000000000000000000..c5f9aaa7550295bfbd3c9d68525515739d7dbc00 --- /dev/null +++ b/params_shard_38.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6530ffd7fb55e991eb62d8695f6308afd63a7950eb6e3bb7fc7316fea5205151 +size 32829440 diff --git a/params_shard_39.bin b/params_shard_39.bin new file mode 100644 index 0000000000000000000000000000000000000000..eac0a1c9699297fe21f3b4b900fce846b65a7cf3 --- /dev/null +++ b/params_shard_39.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33026b8bbaa5318683bc3a1595fed474868fcc9d4bf289ed73520ab2f884759d +size 19660800 diff --git a/params_shard_4.bin b/params_shard_4.bin new file mode 100644 index 0000000000000000000000000000000000000000..c208bd517d299adb402c8eb3e34c08415598b23c --- /dev/null +++ b/params_shard_4.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d500302656dfe904c1489509289111a7a5840409c62439a5dfe5075b52ed9ede +size 35389440 diff --git a/params_shard_40.bin b/params_shard_40.bin new file mode 100644 index 0000000000000000000000000000000000000000..0e0f26b966f267f96124310756d54dc78a541c0f --- /dev/null +++ b/params_shard_40.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f183c24120bccef14176cf41e5bd5b91ccfd5b519d776adb4252d3856cf699a +size 35389440 diff --git a/params_shard_41.bin b/params_shard_41.bin new file mode 100644 index 0000000000000000000000000000000000000000..a6ad4a82fecb06cb9523c5bb0dd08c97da5d986d --- /dev/null +++ b/params_shard_41.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7eb60a545fa02f95fff6d0692b268525b6805f98ce7b414353ff9b0e9f818ef2 +size 31969280 diff --git a/params_shard_42.bin b/params_shard_42.bin new file mode 100644 index 0000000000000000000000000000000000000000..a7bd570aa1db3698f2b946dbb1366ec01b412ab1 --- /dev/null +++ b/params_shard_42.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6568fcd74deefccf8fd5ae049b5dc531eecf4476407b0966af2f6592ba39674d +size 19660800 diff --git a/params_shard_43.bin b/params_shard_43.bin new file mode 100644 index 0000000000000000000000000000000000000000..64d2b173c55ac9dbc00ca1ffc9a8a275398debbe --- /dev/null +++ b/params_shard_43.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ebd222ad260589702ab9843a5ef0866c730e0e36c30ad36aaa9ee9d3c168f9e +size 33361920 diff --git a/params_shard_44.bin b/params_shard_44.bin new file mode 100644 index 0000000000000000000000000000000000000000..46cc4f685e9f33fa5ed0dc213c98d86012f63984 --- /dev/null +++ b/params_shard_44.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2225db773d767da886e0dbd6c3d7f681b9dc64aea92dfd7a907ce77f7ab25236 +size 35389440 diff --git a/params_shard_45.bin b/params_shard_45.bin new file mode 100644 index 0000000000000000000000000000000000000000..3ffa010464c252831ecd81c367af4bf06100deff --- /dev/null +++ b/params_shard_45.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:975b9694d7d4f70986388f3355dae34cddd9a8c70163634412346419e1c4729c +size 19660800 diff --git a/params_shard_46.bin b/params_shard_46.bin new file mode 100644 index 0000000000000000000000000000000000000000..e36bb1b6e16db0061cfc2ba0da8f884e6782dd1d --- /dev/null +++ b/params_shard_46.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e63e0683ab8b75a70c7bcf572ca2de7038d543e3b38ba594fa484bbca4e0b0b +size 27627520 diff --git a/params_shard_47.bin b/params_shard_47.bin new file mode 100644 index 0000000000000000000000000000000000000000..491f913dc135240002b1afe8ab97d64e01a7558d --- /dev/null +++ b/params_shard_47.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:663083f6ce9912a3997b259ccf541a8b21a1caadf61d723594711caae92b83ab +size 35389440 diff --git a/params_shard_48.bin b/params_shard_48.bin new file mode 100644 index 0000000000000000000000000000000000000000..6bd7011a588d22fe8034656e84a08ca53fc5935e --- /dev/null +++ b/params_shard_48.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba2dedf013f21cec82f2cb962964a9d7c0f4f5424b603d4ac52d3c24dab98e22 +size 19660800 diff --git a/params_shard_49.bin b/params_shard_49.bin new file mode 100644 index 0000000000000000000000000000000000000000..8097e994e9b592f5d2d4d949d56841986f9a036d --- /dev/null +++ b/params_shard_49.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc539b5b021ab940a65b3eb9c8fca6fcd472f81ac2557828a4d0690f2c85767a +size 32952320 diff --git a/params_shard_5.bin b/params_shard_5.bin new file mode 100644 index 0000000000000000000000000000000000000000..e3d864072798abfd7438f113d0db0900f3d8aa33 --- /dev/null +++ b/params_shard_5.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:060aec9e7bba5efe97fd753cfa6fcc5a18ee4fe50b1da4717fe1517ba350a604 +size 31969280 diff --git a/params_shard_50.bin b/params_shard_50.bin new file mode 100644 index 0000000000000000000000000000000000000000..ef6c59108962186dca84ed8d43b73ab44e11208a --- /dev/null +++ b/params_shard_50.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5306fb3377985fa19aaf25b97bbb6868f0849cdf6f282dc1e032b7510e20efc2 +size 35389440 diff --git a/params_shard_51.bin b/params_shard_51.bin new file mode 100644 index 0000000000000000000000000000000000000000..c0301b34b0c8505ccb6b1c99aebe3b4ed917b730 --- /dev/null +++ b/params_shard_51.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c5c20519e48356a1bd8c4ebe8f07aade79f4e81273301a30d91cd8be5f73cdd +size 19660800 diff --git a/params_shard_52.bin b/params_shard_52.bin new file mode 100644 index 0000000000000000000000000000000000000000..24627c2754592974575f5abef52c051b01dce5b4 --- /dev/null +++ b/params_shard_52.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f7e230a693d5148871d68d2b6e91570fcc28022472589754c76a45f55c16c04 +size 32952320 diff --git a/params_shard_53.bin b/params_shard_53.bin new file mode 100644 index 0000000000000000000000000000000000000000..cc82e442c00cf7ff2c3d289bcf0d0d7e19ae41e6 --- /dev/null +++ b/params_shard_53.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0dfa245bc85528045d59cacee4f40f90b6655ccf54e7bd61975bb2078dfc81f +size 35389440 diff --git a/params_shard_54.bin b/params_shard_54.bin new file mode 100644 index 0000000000000000000000000000000000000000..680fb3bbb3c392279771f04ea197a03d27ae19b6 --- /dev/null +++ b/params_shard_54.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:894a62caec46b1a0e6e10d5a890dbb66e0bf38d2c62da304a4bd2d36fa8dbb86 +size 33054720 diff --git a/params_shard_55.bin b/params_shard_55.bin new file mode 100644 index 0000000000000000000000000000000000000000..e85643ffcaa910b7ccd35e02ffb5590894f28c9a --- /dev/null +++ b/params_shard_55.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ada895550592ba1d08bbca7702ec18441b4dfc5493249a7671205cd50f138e6e +size 35389440 diff --git a/params_shard_56.bin b/params_shard_56.bin new file mode 100644 index 0000000000000000000000000000000000000000..1ad59833c8a54473c4de91f3442267e2d3069eed --- /dev/null +++ b/params_shard_56.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3161339e7108560deaddc41accc681d4ef3d5956c4801cb0217958061e422034 +size 32829440 diff --git a/params_shard_57.bin b/params_shard_57.bin new file mode 100644 index 0000000000000000000000000000000000000000..23812ebe90e4a81bea961315442e1b288a04a116 --- /dev/null +++ b/params_shard_57.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07301ded33b03a1b5d18c18f895565c350577d560c5b474bb391fd7518391ef0 +size 19660800 diff --git a/params_shard_58.bin b/params_shard_58.bin new file mode 100644 index 0000000000000000000000000000000000000000..00c901457b1c0d1c1995f38581959656449b4bde --- /dev/null +++ b/params_shard_58.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03ed24b97286bdbe7dd810aed7582ab8b0c3f65dfdb5f411ec3d38beb7a437b5 +size 35389440 diff --git a/params_shard_59.bin b/params_shard_59.bin new file mode 100644 index 0000000000000000000000000000000000000000..0035deb820e9b3f6bab0d2459abf3c4ab44028df --- /dev/null +++ b/params_shard_59.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7770ab69427d876012d107ad8153b3cfa53e8e6f9bfd552f9af2ecd5485d47d +size 31969280 diff --git a/params_shard_6.bin b/params_shard_6.bin new file mode 100644 index 0000000000000000000000000000000000000000..a2d792373b97cf1d4c38427542637abe0d377dc2 --- /dev/null +++ b/params_shard_6.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6175668fad52e7599ffb4ba7dd1dda527559e295d5314879551bbd446603165a +size 19660800 diff --git a/params_shard_60.bin b/params_shard_60.bin new file mode 100644 index 0000000000000000000000000000000000000000..1eb87940cb327349ccc5be3fa0498e1846503e9d --- /dev/null +++ b/params_shard_60.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ece0d74d39401e5fc372dd6ad3897f7fb14565bcacced4d02f5586b466ceffb +size 19660800 diff --git a/params_shard_61.bin b/params_shard_61.bin new file mode 100644 index 0000000000000000000000000000000000000000..37c5846b6ff4b96060875adfe2aa7b2a4e988f49 --- /dev/null +++ b/params_shard_61.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c43965ac785a406e0abec2b34a10f469e03bdf4940874ff32549b4d4567cc8d9 +size 33361920 diff --git a/params_shard_62.bin b/params_shard_62.bin new file mode 100644 index 0000000000000000000000000000000000000000..0365b560898626fa5775dc95b224cb71b871bcd4 --- /dev/null +++ b/params_shard_62.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c79fecebebf0147c0c584b3912009ee4c17231d5aada551cf184a5edfde8293e +size 35389440 diff --git a/params_shard_63.bin b/params_shard_63.bin new file mode 100644 index 0000000000000000000000000000000000000000..eae7caddbcb112e5684be5bf0f9f1f0a1da09670 --- /dev/null +++ b/params_shard_63.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47db701c14bf1a8f91645757f346a60256711769723daa9c1f527e8737889161 +size 19660800 diff --git a/params_shard_64.bin b/params_shard_64.bin new file mode 100644 index 0000000000000000000000000000000000000000..23d02e45eaed7a04e8d5c631da70c82362b0930c --- /dev/null +++ b/params_shard_64.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69399b5eb62897140af8bcf00d971dec4f538bb6d939458979b5de530755fc8e +size 27627520 diff --git a/params_shard_65.bin b/params_shard_65.bin new file mode 100644 index 0000000000000000000000000000000000000000..bbf9f58fefd7d5ebb760130fdac9dfba42930b8b --- /dev/null +++ b/params_shard_65.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c2aafb5e86ed481e139513d46eec48f0e388dea1801139cf44cac212920b035 +size 35389440 diff --git a/params_shard_66.bin b/params_shard_66.bin new file mode 100644 index 0000000000000000000000000000000000000000..1218e15a5bbf8e7b491ac87609bf05ac7829e3eb --- /dev/null +++ b/params_shard_66.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74fe21fd65e91b4d3a62860161f260d0e0ce9518ffc93883245a34699bd7146b +size 19660800 diff --git a/params_shard_67.bin b/params_shard_67.bin new file mode 100644 index 0000000000000000000000000000000000000000..4a52bf8b9ab389c1b8dced4aa02e8ddda736bac8 --- /dev/null +++ b/params_shard_67.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:974b48c11508df106e1a05b388e58434604dea219312722d66fd89bae3fa0c8d +size 32952320 diff --git a/params_shard_68.bin b/params_shard_68.bin new file mode 100644 index 0000000000000000000000000000000000000000..29dd667abd6a71fef563f58d2062a7934981d399 --- /dev/null +++ b/params_shard_68.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf3f79d9551ae7788cfb3ecad27d34dcfd64b4de55ee4d00c25bc8634491a359 +size 35389440 diff --git a/params_shard_69.bin b/params_shard_69.bin new file mode 100644 index 0000000000000000000000000000000000000000..c4b212a52850e8b4b35156d54843b7fffef270b2 --- /dev/null +++ b/params_shard_69.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e576119b3bb373e0116c66e8d3f9007a4396821bead18db7ada9c5556aa9d6cb +size 19660800 diff --git a/params_shard_7.bin b/params_shard_7.bin new file mode 100644 index 0000000000000000000000000000000000000000..b61bb211981b2d4d736dd9c6c9faecad8d4e0ed3 --- /dev/null +++ b/params_shard_7.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dba2e252759bd762491c6cdf3efac6e1a8bb5e47135c75db55d4bc252e678eea +size 33361920 diff --git a/params_shard_70.bin b/params_shard_70.bin new file mode 100644 index 0000000000000000000000000000000000000000..76fda9de79745613778886174ac3e21fefdc8055 --- /dev/null +++ b/params_shard_70.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc5f54fdcfc35d3dac2cea016b7f1986a77d0d96735ba961f25558ea37cd3d86 +size 32952320 diff --git a/params_shard_71.bin b/params_shard_71.bin new file mode 100644 index 0000000000000000000000000000000000000000..24f93fe7310f313c233e8a14dca5c5a0af3b005b --- /dev/null +++ b/params_shard_71.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa2ac7e28aab73ab2db8aa044f1e34710617ca43f29378fe69816ba4e0895b1d +size 35389440 diff --git a/params_shard_72.bin b/params_shard_72.bin new file mode 100644 index 0000000000000000000000000000000000000000..9cb70e1973219e74d042979a8504621d010d530a --- /dev/null +++ b/params_shard_72.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a07eabf64e4c3a009c537b586a1724ae94829c96ae17eecb6a720f6300ceeda +size 33054720 diff --git a/params_shard_73.bin b/params_shard_73.bin new file mode 100644 index 0000000000000000000000000000000000000000..9a67c1b616bccee25708e24fcccd60d7c274ca7d --- /dev/null +++ b/params_shard_73.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d909a698e8fa91993ca3e8329041e162b04f9f17a86eb8c02edac6bc4e54e9f +size 35389440 diff --git a/params_shard_74.bin b/params_shard_74.bin new file mode 100644 index 0000000000000000000000000000000000000000..117e5cacf16a55a6fd18ce9d016fe9def36678ce --- /dev/null +++ b/params_shard_74.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c98b5c8c8967b9dac972d3b77e6e725e0efa59657ccd0e9ee1d1a2592e24582f +size 32829440 diff --git a/params_shard_75.bin b/params_shard_75.bin new file mode 100644 index 0000000000000000000000000000000000000000..2d7a03f33a6fb54b6978aa88e3d3319c61a2c1e2 --- /dev/null +++ b/params_shard_75.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a52465ddbe176275653db2422a90f1c0522b8d5ff3a2a13938b9c99d95b5aa13 +size 19660800 diff --git a/params_shard_76.bin b/params_shard_76.bin new file mode 100644 index 0000000000000000000000000000000000000000..160d2e61ee8c338471291a93836775df4aa36b61 --- /dev/null +++ b/params_shard_76.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfda6267ccfbcfd736b477fa7d361c0f346910a4d5be8c8abffd41dd205f5e3f +size 35389440 diff --git a/params_shard_77.bin b/params_shard_77.bin new file mode 100644 index 0000000000000000000000000000000000000000..a0c9deed101445a0b984d66c464afd1a74356f8e --- /dev/null +++ b/params_shard_77.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e13fa5a20171946914e493d137f4df612b91a1d756e43c1c35f3bce1117e366 +size 31969280 diff --git a/params_shard_78.bin b/params_shard_78.bin new file mode 100644 index 0000000000000000000000000000000000000000..dc4401c49f0c6bb8aff05f73b8d7f32e5d881fe8 --- /dev/null +++ b/params_shard_78.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce0ea6fb030e2313ff9d72661226ded51e57c232d2c5d3dcb12654450f2c14ad +size 19660800 diff --git a/params_shard_79.bin b/params_shard_79.bin new file mode 100644 index 0000000000000000000000000000000000000000..cffd09d40d2344cbb90979891d5f2d849ff9e96d --- /dev/null +++ b/params_shard_79.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff703d3cb37213f10609c1535ea8883c07c4e9f76c8f2e326cd427aa5d6e1e5e +size 33361920 diff --git a/params_shard_8.bin b/params_shard_8.bin new file mode 100644 index 0000000000000000000000000000000000000000..a3ae10c221b7590795e86663e3ded116878aeb3e --- /dev/null +++ b/params_shard_8.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:426f23a7b9a8634a28a35d8e79605afc7709b9a386df2131bdf6480529937364 +size 35389440 diff --git a/params_shard_80.bin b/params_shard_80.bin new file mode 100644 index 0000000000000000000000000000000000000000..86e36f1f21a099833c6418929dc37f87df631205 --- /dev/null +++ b/params_shard_80.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43aebd6eaadd9470781cbdb66ee724dea69116a7b6977ba14174d1ce62ad0498 +size 35389440 diff --git a/params_shard_81.bin b/params_shard_81.bin new file mode 100644 index 0000000000000000000000000000000000000000..d14b9ee7f10e437004666ccb84b45d3b8500233b --- /dev/null +++ b/params_shard_81.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ad4c80bf97089ca616f1d15fa23bc32b8ae6e270bc7c3de7a9dc15e1e37f644 +size 19660800 diff --git a/params_shard_82.bin b/params_shard_82.bin new file mode 100644 index 0000000000000000000000000000000000000000..56698c5e7388306873cbf8eb202277b1635a30ea --- /dev/null +++ b/params_shard_82.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a68ef451f64a9c8809e8e4f3f65836f4537616e70d665764cf703db354304bd4 +size 27627520 diff --git a/params_shard_83.bin b/params_shard_83.bin new file mode 100644 index 0000000000000000000000000000000000000000..5022bfc8633845d02e45dd13308c27ec56d584aa --- /dev/null +++ b/params_shard_83.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdcff590ad7439b420b5cfb7ca1f1fff7e1eeae58312f721717e545a4f95b27e +size 35389440 diff --git a/params_shard_84.bin b/params_shard_84.bin new file mode 100644 index 0000000000000000000000000000000000000000..4271f8b64a4d46d26a0935171db925bd7cb238ae --- /dev/null +++ b/params_shard_84.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dc2f5ca9b9dcd249a424597b9fa405c304d52fb4aba5f211af2c163e91923ea +size 19660800 diff --git a/params_shard_85.bin b/params_shard_85.bin new file mode 100644 index 0000000000000000000000000000000000000000..e15cc14ff08447084709222bee9351420ed8e6af --- /dev/null +++ b/params_shard_85.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7b46f5650ca28c00ac04a11c184bacc9e2afd68bfcb305f789ecc5012f01619 +size 32952320 diff --git a/params_shard_86.bin b/params_shard_86.bin new file mode 100644 index 0000000000000000000000000000000000000000..a8cbc236764a633deb88734951d914148888e85b --- /dev/null +++ b/params_shard_86.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccc8796c25ed1ecbc30f33bda74b9e00d4c9463892c7c41aac6a25dd40d22353 +size 35389440 diff --git a/params_shard_87.bin b/params_shard_87.bin new file mode 100644 index 0000000000000000000000000000000000000000..1bb42ae71aa042afc86aa1a44c362f3e28313c84 --- /dev/null +++ b/params_shard_87.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9f732c729320caf13b23e579a660cfbc394e809a47223c71d689d5aba36806f +size 19660800 diff --git a/params_shard_88.bin b/params_shard_88.bin new file mode 100644 index 0000000000000000000000000000000000000000..1d40609004af8710209395746db3091d2d4e28e4 --- /dev/null +++ b/params_shard_88.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:007980a607a308ecc61a239cae3c0bae4aaa1709f33cf055e645ab1d6e5a0bea +size 32952320 diff --git a/params_shard_89.bin b/params_shard_89.bin new file mode 100644 index 0000000000000000000000000000000000000000..9bf66c07a5c3e48e414c6eb24d4130af7370fa11 --- /dev/null +++ b/params_shard_89.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c16ef9583c000837ffc6e833f326a891a29f5da87f8ad2b95b2539adf72d55fc +size 35389440 diff --git a/params_shard_9.bin b/params_shard_9.bin new file mode 100644 index 0000000000000000000000000000000000000000..de966dea7ecc6dfa1a741c55efdad63d914dfa89 --- /dev/null +++ b/params_shard_9.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d9f026499549a56b84ef644e9fa8ccdbc222a2ae5064f87f5a6c669cb2fefee +size 19660800 diff --git a/params_shard_90.bin b/params_shard_90.bin new file mode 100644 index 0000000000000000000000000000000000000000..60a3b115fef174a24364a974f072a746360e5ad4 --- /dev/null +++ b/params_shard_90.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e04bc26649491f3ba4dd73cfcaede5bc023136331710a94b52e44b6694738d79 +size 33054720 diff --git a/params_shard_91.bin b/params_shard_91.bin new file mode 100644 index 0000000000000000000000000000000000000000..0edea4c15df944bccccf7ec74f995dfbe9b6f351 --- /dev/null +++ b/params_shard_91.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5dd095a2e570fd635e856473494d799f0448d4a9489b05b52b5eb8317db8883 +size 35389440 diff --git a/params_shard_92.bin b/params_shard_92.bin new file mode 100644 index 0000000000000000000000000000000000000000..28d44b35db66fd6beda7523030432eccf8350d41 --- /dev/null +++ b/params_shard_92.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d72eef6b6e82e65782b5f3130c03c5aeae0432da0f563d495d6b209ebf9504d +size 32829440 diff --git a/params_shard_93.bin b/params_shard_93.bin new file mode 100644 index 0000000000000000000000000000000000000000..381314a3bf60805ec1bcdc8fbbf50d56a714466d --- /dev/null +++ b/params_shard_93.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d3358353304f936abe47d50e39b31de7353e32cd2e0f022dd0dd1f6c9df69db +size 19660800 diff --git a/params_shard_94.bin b/params_shard_94.bin new file mode 100644 index 0000000000000000000000000000000000000000..963703a748330e32a11efcb1e1eac2280cca4cf0 --- /dev/null +++ b/params_shard_94.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76c3055c9b7d6b9de4660792a1eb0c986f149af994fade54983cff3a632d2639 +size 35389440 diff --git a/params_shard_95.bin b/params_shard_95.bin new file mode 100644 index 0000000000000000000000000000000000000000..f4db0aa8211ef741351d04ffec9cf7255c370fd6 --- /dev/null +++ b/params_shard_95.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9730e8491c5a1a95bec0d5d6bf6e31b07df4d13afac1c1c72e82415a923193c4 +size 31969280 diff --git a/params_shard_96.bin b/params_shard_96.bin new file mode 100644 index 0000000000000000000000000000000000000000..a32da04247086b50760e67da3a0d88c45168c817 --- /dev/null +++ b/params_shard_96.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:493107e8c993395cce9d37b10c1f249d98898f402870def2a8c5787d706b769e +size 19660800 diff --git a/params_shard_97.bin b/params_shard_97.bin new file mode 100644 index 0000000000000000000000000000000000000000..690d5e7dac4ef166d95faf6479baa5dd1a1624e1 --- /dev/null +++ b/params_shard_97.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74ff467c82a17080f7af581aecb20231147a04a0561f4965960c403f4b8560c7 +size 33361920 diff --git a/params_shard_98.bin b/params_shard_98.bin new file mode 100644 index 0000000000000000000000000000000000000000..eb932f153909035c400029cf68f2b47b372c5d3f --- /dev/null +++ b/params_shard_98.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03297f838d712998281f28ad27187198d3125700f9efd126e48e035e07403538 +size 35389440 diff --git a/params_shard_99.bin b/params_shard_99.bin new file mode 100644 index 0000000000000000000000000000000000000000..5b7dc7fedbe70532ce5c6d9ff0e0f79131fb911b --- /dev/null +++ b/params_shard_99.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f212447643d7d152ab1fae97e682d20129eaa2cfc62bc518c468114a1559c51 +size 19660800 diff --git a/tokenizer.model b/tokenizer.model new file mode 100644 index 0000000000000000000000000000000000000000..6c00c742ce03c627d6cd5b795984876fa49fa899 --- /dev/null +++ b/tokenizer.model @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347 +size 499723 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..2ef41cbc275000b29afe157ba487f0530b8c26dc --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,35 @@ +{ + "add_bos_token": true, + "add_eos_token": false, + "bos_token": { + "__type": "AddedToken", + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "clean_up_tokenization_spaces": false, + "eos_token": { + "__type": "AddedToken", + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "legacy": false, + "model_max_length": 1000000000000000019884624838656, + "pad_token": null, + "padding_side": "right", + "sp_model_kwargs": {}, + "tokenizer_class": "LlamaTokenizer", + "unk_token": { + "__type": "AddedToken", + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + } +}