diff --git a/README.md b/README.md
new file mode 100644
index 0000000000000000000000000000000000000000..6ef7601b3e9e5b2412ea7bc0a3fd2544eb35762f
--- /dev/null
+++ b/README.md
@@ -0,0 +1,3 @@
+# README
+
+LLaMA2-Chinese-Chat iOS版
diff --git a/mlc-chat-config.json b/mlc-chat-config.json
new file mode 100644
index 0000000000000000000000000000000000000000..5b76fe1cf925b5e213c3f8eea144cca888868008
--- /dev/null
+++ b/mlc-chat-config.json
@@ -0,0 +1,16 @@
+{
+ "model_lib": "Llama2-Chinese-7b-Chat-q4f16_1",
+ "local_id": "Llama2-Chinese-7b-Chat-q4f16_1",
+ "conv_template": "llama_default",
+ "temperature": 0.7,
+ "repetition_penalty": 1.0,
+ "top_p": 0.95,
+ "mean_gen_len": 128,
+ "max_gen_len": 512,
+ "shift_fill_factor": 0.3,
+ "tokenizer_files": [
+ "tokenizer.model"
+ ],
+ "model_category": "llama",
+ "model_name": "Llama2-Chinese-7b-Chat"
+}
\ No newline at end of file
diff --git a/ndarray-cache.json b/ndarray-cache.json
new file mode 100644
index 0000000000000000000000000000000000000000..1936f609759c71016f7a6cf4b34730c4c5ed3192
--- /dev/null
+++ b/ndarray-cache.json
@@ -0,0 +1,4344 @@
+{
+ "metadata": {
+ "ParamSize": 327
+ },
+ "records": [
+ {
+ "dataPath": "params_shard_0.bin",
+ "format": "raw-shard",
+ "nbytes": 65536000,
+ "records": [
+ {
+ "name": "param_0",
+ "shape": [
+ 32000,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 65536000,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_1.bin",
+ "format": "raw-shard",
+ "nbytes": 33357824,
+ "records": [
+ {
+ "name": "param_1",
+ "shape": [
+ 32000,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192000,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_2",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 8192000
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_2.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_6",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_3.bin",
+ "format": "raw-shard",
+ "nbytes": 22544384,
+ "records": [
+ {
+ "name": "param_8",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_4.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_12",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_5.bin",
+ "format": "raw-shard",
+ "nbytes": 32587776,
+ "records": [
+ {
+ "name": "param_3",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_4",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_5",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 11534336
+ },
+ {
+ "name": "param_7",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 12582912
+ },
+ {
+ "name": "param_9",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 18219008
+ },
+ {
+ "name": "param_10",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21037056
+ },
+ {
+ "name": "param_11",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21045248
+ },
+ {
+ "name": "param_13",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 21053440
+ },
+ {
+ "name": "param_14",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 24199168
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_6.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_16",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_7.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_22",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_8.bin",
+ "format": "raw-shard",
+ "nbytes": 32063488,
+ "records": [
+ {
+ "name": "param_15",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_17",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 1048576
+ },
+ {
+ "name": "param_18",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 6684672
+ },
+ {
+ "name": "param_19",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 29229056
+ },
+ {
+ "name": "param_20",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32047104
+ },
+ {
+ "name": "param_21",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32055296
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_9.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_26",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_10.bin",
+ "format": "raw-shard",
+ "nbytes": 22544384,
+ "records": [
+ {
+ "name": "param_28",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_11.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_32",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_12.bin",
+ "format": "raw-shard",
+ "nbytes": 32587776,
+ "records": [
+ {
+ "name": "param_23",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_24",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_25",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 11534336
+ },
+ {
+ "name": "param_27",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 12582912
+ },
+ {
+ "name": "param_29",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 18219008
+ },
+ {
+ "name": "param_30",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21037056
+ },
+ {
+ "name": "param_31",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21045248
+ },
+ {
+ "name": "param_33",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 21053440
+ },
+ {
+ "name": "param_34",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 24199168
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_13.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_36",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_14.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_42",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_15.bin",
+ "format": "raw-shard",
+ "nbytes": 32063488,
+ "records": [
+ {
+ "name": "param_35",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_37",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 1048576
+ },
+ {
+ "name": "param_38",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 6684672
+ },
+ {
+ "name": "param_39",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 29229056
+ },
+ {
+ "name": "param_40",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32047104
+ },
+ {
+ "name": "param_41",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32055296
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_16.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_46",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_17.bin",
+ "format": "raw-shard",
+ "nbytes": 22544384,
+ "records": [
+ {
+ "name": "param_48",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_18.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_52",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_19.bin",
+ "format": "raw-shard",
+ "nbytes": 32587776,
+ "records": [
+ {
+ "name": "param_43",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_44",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_45",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 11534336
+ },
+ {
+ "name": "param_47",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 12582912
+ },
+ {
+ "name": "param_49",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 18219008
+ },
+ {
+ "name": "param_50",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21037056
+ },
+ {
+ "name": "param_51",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21045248
+ },
+ {
+ "name": "param_53",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 21053440
+ },
+ {
+ "name": "param_54",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 24199168
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_20.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_56",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_21.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_62",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_22.bin",
+ "format": "raw-shard",
+ "nbytes": 32063488,
+ "records": [
+ {
+ "name": "param_55",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_57",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 1048576
+ },
+ {
+ "name": "param_58",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 6684672
+ },
+ {
+ "name": "param_59",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 29229056
+ },
+ {
+ "name": "param_60",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32047104
+ },
+ {
+ "name": "param_61",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32055296
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_23.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_66",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_24.bin",
+ "format": "raw-shard",
+ "nbytes": 22544384,
+ "records": [
+ {
+ "name": "param_68",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_25.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_72",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_26.bin",
+ "format": "raw-shard",
+ "nbytes": 32587776,
+ "records": [
+ {
+ "name": "param_63",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_64",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_65",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 11534336
+ },
+ {
+ "name": "param_67",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 12582912
+ },
+ {
+ "name": "param_69",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 18219008
+ },
+ {
+ "name": "param_70",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21037056
+ },
+ {
+ "name": "param_71",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21045248
+ },
+ {
+ "name": "param_73",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 21053440
+ },
+ {
+ "name": "param_74",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 24199168
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_27.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_76",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_28.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_82",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_29.bin",
+ "format": "raw-shard",
+ "nbytes": 32063488,
+ "records": [
+ {
+ "name": "param_75",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_77",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 1048576
+ },
+ {
+ "name": "param_78",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 6684672
+ },
+ {
+ "name": "param_79",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 29229056
+ },
+ {
+ "name": "param_80",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32047104
+ },
+ {
+ "name": "param_81",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32055296
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_30.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_86",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_31.bin",
+ "format": "raw-shard",
+ "nbytes": 22544384,
+ "records": [
+ {
+ "name": "param_88",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_32.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_92",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_33.bin",
+ "format": "raw-shard",
+ "nbytes": 32587776,
+ "records": [
+ {
+ "name": "param_83",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_84",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_85",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 11534336
+ },
+ {
+ "name": "param_87",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 12582912
+ },
+ {
+ "name": "param_89",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 18219008
+ },
+ {
+ "name": "param_90",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21037056
+ },
+ {
+ "name": "param_91",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21045248
+ },
+ {
+ "name": "param_93",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 21053440
+ },
+ {
+ "name": "param_94",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 24199168
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_34.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_96",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_35.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_102",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_36.bin",
+ "format": "raw-shard",
+ "nbytes": 32063488,
+ "records": [
+ {
+ "name": "param_95",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_97",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 1048576
+ },
+ {
+ "name": "param_98",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 6684672
+ },
+ {
+ "name": "param_99",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 29229056
+ },
+ {
+ "name": "param_100",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32047104
+ },
+ {
+ "name": "param_101",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32055296
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_37.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_106",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_38.bin",
+ "format": "raw-shard",
+ "nbytes": 22544384,
+ "records": [
+ {
+ "name": "param_108",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_39.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_112",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_40.bin",
+ "format": "raw-shard",
+ "nbytes": 32587776,
+ "records": [
+ {
+ "name": "param_103",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_104",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_105",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 11534336
+ },
+ {
+ "name": "param_107",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 12582912
+ },
+ {
+ "name": "param_109",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 18219008
+ },
+ {
+ "name": "param_110",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21037056
+ },
+ {
+ "name": "param_111",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21045248
+ },
+ {
+ "name": "param_113",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 21053440
+ },
+ {
+ "name": "param_114",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 24199168
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_41.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_116",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_42.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_122",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_43.bin",
+ "format": "raw-shard",
+ "nbytes": 32063488,
+ "records": [
+ {
+ "name": "param_115",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_117",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 1048576
+ },
+ {
+ "name": "param_118",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 6684672
+ },
+ {
+ "name": "param_119",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 29229056
+ },
+ {
+ "name": "param_120",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32047104
+ },
+ {
+ "name": "param_121",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32055296
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_44.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_126",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_45.bin",
+ "format": "raw-shard",
+ "nbytes": 22544384,
+ "records": [
+ {
+ "name": "param_128",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_46.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_132",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_47.bin",
+ "format": "raw-shard",
+ "nbytes": 32587776,
+ "records": [
+ {
+ "name": "param_123",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_124",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_125",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 11534336
+ },
+ {
+ "name": "param_127",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 12582912
+ },
+ {
+ "name": "param_129",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 18219008
+ },
+ {
+ "name": "param_130",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21037056
+ },
+ {
+ "name": "param_131",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21045248
+ },
+ {
+ "name": "param_133",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 21053440
+ },
+ {
+ "name": "param_134",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 24199168
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_48.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_136",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_49.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_142",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_50.bin",
+ "format": "raw-shard",
+ "nbytes": 32063488,
+ "records": [
+ {
+ "name": "param_135",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_137",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 1048576
+ },
+ {
+ "name": "param_138",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 6684672
+ },
+ {
+ "name": "param_139",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 29229056
+ },
+ {
+ "name": "param_140",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32047104
+ },
+ {
+ "name": "param_141",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32055296
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_51.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_146",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_52.bin",
+ "format": "raw-shard",
+ "nbytes": 22544384,
+ "records": [
+ {
+ "name": "param_148",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_53.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_152",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_54.bin",
+ "format": "raw-shard",
+ "nbytes": 32587776,
+ "records": [
+ {
+ "name": "param_143",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_144",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_145",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 11534336
+ },
+ {
+ "name": "param_147",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 12582912
+ },
+ {
+ "name": "param_149",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 18219008
+ },
+ {
+ "name": "param_150",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21037056
+ },
+ {
+ "name": "param_151",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21045248
+ },
+ {
+ "name": "param_153",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 21053440
+ },
+ {
+ "name": "param_154",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 24199168
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_55.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_156",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_56.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_162",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_57.bin",
+ "format": "raw-shard",
+ "nbytes": 32063488,
+ "records": [
+ {
+ "name": "param_155",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_157",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 1048576
+ },
+ {
+ "name": "param_158",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 6684672
+ },
+ {
+ "name": "param_159",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 29229056
+ },
+ {
+ "name": "param_160",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32047104
+ },
+ {
+ "name": "param_161",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32055296
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_58.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_166",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_59.bin",
+ "format": "raw-shard",
+ "nbytes": 22544384,
+ "records": [
+ {
+ "name": "param_168",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_60.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_172",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_61.bin",
+ "format": "raw-shard",
+ "nbytes": 32587776,
+ "records": [
+ {
+ "name": "param_163",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_164",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_165",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 11534336
+ },
+ {
+ "name": "param_167",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 12582912
+ },
+ {
+ "name": "param_169",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 18219008
+ },
+ {
+ "name": "param_170",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21037056
+ },
+ {
+ "name": "param_171",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21045248
+ },
+ {
+ "name": "param_173",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 21053440
+ },
+ {
+ "name": "param_174",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 24199168
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_62.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_176",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_63.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_182",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_64.bin",
+ "format": "raw-shard",
+ "nbytes": 32063488,
+ "records": [
+ {
+ "name": "param_175",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_177",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 1048576
+ },
+ {
+ "name": "param_178",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 6684672
+ },
+ {
+ "name": "param_179",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 29229056
+ },
+ {
+ "name": "param_180",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32047104
+ },
+ {
+ "name": "param_181",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32055296
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_65.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_186",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_66.bin",
+ "format": "raw-shard",
+ "nbytes": 22544384,
+ "records": [
+ {
+ "name": "param_188",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_67.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_192",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_68.bin",
+ "format": "raw-shard",
+ "nbytes": 32587776,
+ "records": [
+ {
+ "name": "param_183",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_184",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_185",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 11534336
+ },
+ {
+ "name": "param_187",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 12582912
+ },
+ {
+ "name": "param_189",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 18219008
+ },
+ {
+ "name": "param_190",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21037056
+ },
+ {
+ "name": "param_191",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21045248
+ },
+ {
+ "name": "param_193",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 21053440
+ },
+ {
+ "name": "param_194",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 24199168
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_69.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_196",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_70.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_202",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_71.bin",
+ "format": "raw-shard",
+ "nbytes": 32063488,
+ "records": [
+ {
+ "name": "param_195",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_197",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 1048576
+ },
+ {
+ "name": "param_198",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 6684672
+ },
+ {
+ "name": "param_199",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 29229056
+ },
+ {
+ "name": "param_200",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32047104
+ },
+ {
+ "name": "param_201",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32055296
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_72.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_206",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_73.bin",
+ "format": "raw-shard",
+ "nbytes": 22544384,
+ "records": [
+ {
+ "name": "param_208",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_74.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_212",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_75.bin",
+ "format": "raw-shard",
+ "nbytes": 32587776,
+ "records": [
+ {
+ "name": "param_203",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_204",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_205",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 11534336
+ },
+ {
+ "name": "param_207",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 12582912
+ },
+ {
+ "name": "param_209",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 18219008
+ },
+ {
+ "name": "param_210",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21037056
+ },
+ {
+ "name": "param_211",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21045248
+ },
+ {
+ "name": "param_213",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 21053440
+ },
+ {
+ "name": "param_214",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 24199168
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_76.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_216",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_77.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_222",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_78.bin",
+ "format": "raw-shard",
+ "nbytes": 32063488,
+ "records": [
+ {
+ "name": "param_215",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_217",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 1048576
+ },
+ {
+ "name": "param_218",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 6684672
+ },
+ {
+ "name": "param_219",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 29229056
+ },
+ {
+ "name": "param_220",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32047104
+ },
+ {
+ "name": "param_221",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32055296
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_79.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_226",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_80.bin",
+ "format": "raw-shard",
+ "nbytes": 22544384,
+ "records": [
+ {
+ "name": "param_228",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_81.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_232",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_82.bin",
+ "format": "raw-shard",
+ "nbytes": 32587776,
+ "records": [
+ {
+ "name": "param_223",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_224",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_225",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 11534336
+ },
+ {
+ "name": "param_227",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 12582912
+ },
+ {
+ "name": "param_229",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 18219008
+ },
+ {
+ "name": "param_230",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21037056
+ },
+ {
+ "name": "param_231",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21045248
+ },
+ {
+ "name": "param_233",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 21053440
+ },
+ {
+ "name": "param_234",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 24199168
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_83.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_236",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_84.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_242",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_85.bin",
+ "format": "raw-shard",
+ "nbytes": 32063488,
+ "records": [
+ {
+ "name": "param_235",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_237",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 1048576
+ },
+ {
+ "name": "param_238",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 6684672
+ },
+ {
+ "name": "param_239",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 29229056
+ },
+ {
+ "name": "param_240",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32047104
+ },
+ {
+ "name": "param_241",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32055296
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_86.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_246",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_87.bin",
+ "format": "raw-shard",
+ "nbytes": 22544384,
+ "records": [
+ {
+ "name": "param_248",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_88.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_252",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_89.bin",
+ "format": "raw-shard",
+ "nbytes": 32587776,
+ "records": [
+ {
+ "name": "param_243",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_244",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_245",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 11534336
+ },
+ {
+ "name": "param_247",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 12582912
+ },
+ {
+ "name": "param_249",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 18219008
+ },
+ {
+ "name": "param_250",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21037056
+ },
+ {
+ "name": "param_251",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21045248
+ },
+ {
+ "name": "param_253",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 21053440
+ },
+ {
+ "name": "param_254",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 24199168
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_90.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_256",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_91.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_262",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_92.bin",
+ "format": "raw-shard",
+ "nbytes": 32063488,
+ "records": [
+ {
+ "name": "param_255",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_257",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 1048576
+ },
+ {
+ "name": "param_258",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 6684672
+ },
+ {
+ "name": "param_259",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 29229056
+ },
+ {
+ "name": "param_260",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32047104
+ },
+ {
+ "name": "param_261",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32055296
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_93.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_266",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_94.bin",
+ "format": "raw-shard",
+ "nbytes": 22544384,
+ "records": [
+ {
+ "name": "param_268",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_95.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_272",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_96.bin",
+ "format": "raw-shard",
+ "nbytes": 32587776,
+ "records": [
+ {
+ "name": "param_263",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_264",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_265",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 11534336
+ },
+ {
+ "name": "param_267",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 12582912
+ },
+ {
+ "name": "param_269",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 18219008
+ },
+ {
+ "name": "param_270",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21037056
+ },
+ {
+ "name": "param_271",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21045248
+ },
+ {
+ "name": "param_273",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 21053440
+ },
+ {
+ "name": "param_274",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 24199168
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_97.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_276",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_98.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_282",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_99.bin",
+ "format": "raw-shard",
+ "nbytes": 32063488,
+ "records": [
+ {
+ "name": "param_275",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_277",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 1048576
+ },
+ {
+ "name": "param_278",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 6684672
+ },
+ {
+ "name": "param_279",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 29229056
+ },
+ {
+ "name": "param_280",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32047104
+ },
+ {
+ "name": "param_281",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32055296
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_100.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_286",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_101.bin",
+ "format": "raw-shard",
+ "nbytes": 22544384,
+ "records": [
+ {
+ "name": "param_288",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_102.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_292",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_103.bin",
+ "format": "raw-shard",
+ "nbytes": 32587776,
+ "records": [
+ {
+ "name": "param_283",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_284",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_285",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 11534336
+ },
+ {
+ "name": "param_287",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 12582912
+ },
+ {
+ "name": "param_289",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 18219008
+ },
+ {
+ "name": "param_290",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21037056
+ },
+ {
+ "name": "param_291",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21045248
+ },
+ {
+ "name": "param_293",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 21053440
+ },
+ {
+ "name": "param_294",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 24199168
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_104.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_296",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_105.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_302",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_106.bin",
+ "format": "raw-shard",
+ "nbytes": 32063488,
+ "records": [
+ {
+ "name": "param_295",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_297",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 1048576
+ },
+ {
+ "name": "param_298",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 6684672
+ },
+ {
+ "name": "param_299",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 29229056
+ },
+ {
+ "name": "param_300",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32047104
+ },
+ {
+ "name": "param_301",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32055296
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_107.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_306",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_108.bin",
+ "format": "raw-shard",
+ "nbytes": 22544384,
+ "records": [
+ {
+ "name": "param_308",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_109.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_312",
+ "shape": [
+ 12288,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_110.bin",
+ "format": "raw-shard",
+ "nbytes": 32587776,
+ "records": [
+ {
+ "name": "param_303",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_304",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_305",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 11534336
+ },
+ {
+ "name": "param_307",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 12582912
+ },
+ {
+ "name": "param_309",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 18219008
+ },
+ {
+ "name": "param_310",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21037056
+ },
+ {
+ "name": "param_311",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 21045248
+ },
+ {
+ "name": "param_313",
+ "shape": [
+ 12288,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 21053440
+ },
+ {
+ "name": "param_314",
+ "shape": [
+ 4096,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 8388608,
+ "byteOffset": 24199168
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_111.bin",
+ "format": "raw-shard",
+ "nbytes": 45088768,
+ "records": [
+ {
+ "name": "param_316",
+ "shape": [
+ 22016,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 45088768,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_112.bin",
+ "format": "raw-shard",
+ "nbytes": 65536000,
+ "records": [
+ {
+ "name": "param_323",
+ "shape": [
+ 32000,
+ 512
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 65536000,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_113.bin",
+ "format": "raw-shard",
+ "nbytes": 32071680,
+ "records": [
+ {
+ "name": "param_315",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_317",
+ "shape": [
+ 22016,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 5636096,
+ "byteOffset": 1048576
+ },
+ {
+ "name": "param_318",
+ "shape": [
+ 4096,
+ 1376
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 22544384,
+ "byteOffset": 6684672
+ },
+ {
+ "name": "param_319",
+ "shape": [
+ 4096,
+ 344
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2818048,
+ "byteOffset": 29229056
+ },
+ {
+ "name": "param_320",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32047104
+ },
+ {
+ "name": "param_321",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32055296
+ },
+ {
+ "name": "param_322",
+ "shape": [
+ 4096
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192,
+ "byteOffset": 32063488
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_114.bin",
+ "format": "raw-shard",
+ "nbytes": 10289152,
+ "records": [
+ {
+ "name": "param_324",
+ "shape": [
+ 32000,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 8192000,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_325",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 8192000
+ },
+ {
+ "name": "param_326",
+ "shape": [
+ 4096,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1048576,
+ "byteOffset": 9240576
+ }
+ ]
+ }
+ ]
+}
\ No newline at end of file
diff --git a/params_shard_0.bin b/params_shard_0.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9dcdecbb1cbb2e728f94bc6feb181b09bdff5e22
--- /dev/null
+++ b/params_shard_0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:05a5a8beb444f22ad5f961f506b9c775d1fca044c1785f331767ab044da97b70
+size 65536000
diff --git a/params_shard_1.bin b/params_shard_1.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8df410084d8205341577bf702659a160c0aca74b
--- /dev/null
+++ b/params_shard_1.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5f5c53b3b4351d73d1bdb99e6c3b0dc96916d0dc284732f396aca962f90ddf08
+size 33357824
diff --git a/params_shard_10.bin b/params_shard_10.bin
new file mode 100644
index 0000000000000000000000000000000000000000..80d5718e578b65b4964782865678eb9efcc82e90
--- /dev/null
+++ b/params_shard_10.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e08b5e7fcee16bd14b027b01f5f23a5f16b86346771cd9621a064ad10f49d9f4
+size 22544384
diff --git a/params_shard_100.bin b/params_shard_100.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2dce5f2849eb4d8420826192efe907120f80a183
--- /dev/null
+++ b/params_shard_100.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:375496867c60eb96d3c42a3bbaf8b10bc31850aac3f5a1df0e9122892eb583d9
+size 45088768
diff --git a/params_shard_101.bin b/params_shard_101.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e1948d100ecce540be3172cd05789f09b4d8c593
--- /dev/null
+++ b/params_shard_101.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f43614f6d2ea279520d1550497be8da8b32ec6e8e832a38a5df3bcd5d43d4357
+size 22544384
diff --git a/params_shard_102.bin b/params_shard_102.bin
new file mode 100644
index 0000000000000000000000000000000000000000..05a4c4d3855a84c1ccb74aae86e32f2bf67d41fc
--- /dev/null
+++ b/params_shard_102.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9f2a7a15692047df8f17fabc2530574f57a94e1ba425e875c377f6a1b1fdf26e
+size 25165824
diff --git a/params_shard_103.bin b/params_shard_103.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c4d1e15f2eeeb0061c3b3d3215e613d94d5f6a8a
--- /dev/null
+++ b/params_shard_103.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2a17a0b1cfcf9484741ba05f7f02eb0d49bd6c288bfe347ec40fdf937d30d5a6
+size 32587776
diff --git a/params_shard_104.bin b/params_shard_104.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7bc70ecd7d37bdac042548a1ad9927f176d68a82
--- /dev/null
+++ b/params_shard_104.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c724ad4449daba7fcb17ffa18d9d94f774813f20919f45b4cae0411e90c7b480
+size 45088768
diff --git a/params_shard_105.bin b/params_shard_105.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5f643f996695c0230bc7723c3b393c7baaeb9c71
--- /dev/null
+++ b/params_shard_105.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8d1b8f7d4b5b52fe98e48a0665c9d1a64e567e7bb85e06123ec46fc3233567d9
+size 25165824
diff --git a/params_shard_106.bin b/params_shard_106.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f908e12ff611dcfef83e58a7d7d58bd3b68a71de
--- /dev/null
+++ b/params_shard_106.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:703a94b9e91bf8459c8bbed0e8824a69a798b8501b30dc17fdd552317bf1d2bb
+size 32063488
diff --git a/params_shard_107.bin b/params_shard_107.bin
new file mode 100644
index 0000000000000000000000000000000000000000..aebc363ebd0b5d7210b7ba8a840e201a28b7f900
--- /dev/null
+++ b/params_shard_107.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:26493b0fc849aafdab877f9a40ba90d20079c89183f910b96aa2973d82b5eee7
+size 45088768
diff --git a/params_shard_108.bin b/params_shard_108.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6db1d37b319d1bda65bee2e00dcfe5c34fbcac6a
--- /dev/null
+++ b/params_shard_108.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8b975cf54a42d0f6fbbbc0742bb3872c487bc2178947f5ae7849c509ea7e755b
+size 22544384
diff --git a/params_shard_109.bin b/params_shard_109.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8d42a06cb76f8acfb30551b78225ac4010c08922
--- /dev/null
+++ b/params_shard_109.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2013ec52ac921c251864ebf75df30e6590cffbbdc35a9641d4fcc25d1adb8ed3
+size 25165824
diff --git a/params_shard_11.bin b/params_shard_11.bin
new file mode 100644
index 0000000000000000000000000000000000000000..99e6ea082286bdde1d17d01976b4878c58ed1a66
--- /dev/null
+++ b/params_shard_11.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1705cfb3e13514686557ccb2f42df4f4236e56847e4e34fba132fda17f189a2f
+size 25165824
diff --git a/params_shard_110.bin b/params_shard_110.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3d2d025ba05fa3d9ef5e94f2d9796a7b8be9c504
--- /dev/null
+++ b/params_shard_110.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d4b9077d7ef9e282b01529f3735f42a287806bb8bc3326158b42961e13dec7dd
+size 32587776
diff --git a/params_shard_111.bin b/params_shard_111.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7b6319d3c2ccb38eb64289fba46549ab6ec04431
--- /dev/null
+++ b/params_shard_111.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:155af9ad555a4cf4caee5d21324175447ed556adcc317991d73a8b19ce5c0e4e
+size 45088768
diff --git a/params_shard_112.bin b/params_shard_112.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a0cb4bd8ff39082658f04144b7033c7402580602
--- /dev/null
+++ b/params_shard_112.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a2c1c50328c9ae9f575ee36274d1c97725d1d70725d940a70caf9abeea4b5f2c
+size 65536000
diff --git a/params_shard_113.bin b/params_shard_113.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4ae0e61a98fe1db4da4b5e8578c2dbbf0c98ebac
--- /dev/null
+++ b/params_shard_113.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4f0031b6d0d28f9e239ef4e0b4c9974ede8b414cce1a999b60ff5c7ab151c6b0
+size 32071680
diff --git a/params_shard_114.bin b/params_shard_114.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8bbda63a2dc97ca8b6bb9c5bf62794fbc87a6e76
--- /dev/null
+++ b/params_shard_114.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b4a206fe4e1b446c1a9db6bcd0afe5a77e49d0856416dcb58195e9b35dc12b55
+size 10289152
diff --git a/params_shard_12.bin b/params_shard_12.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5e49b63db858b012c777d252ca6b9455ebf4c5b5
--- /dev/null
+++ b/params_shard_12.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0811bfc87949736dcb71f4fef4f7f805242eafdad0923faedeebae8da2384c34
+size 32587776
diff --git a/params_shard_13.bin b/params_shard_13.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5446516748a33a8620aa973eb81daf9e60e6b1b9
--- /dev/null
+++ b/params_shard_13.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:58270e993e416f94a4a1d4e027cea8d3963e489ae05cc9c74ab4f39234a71ecf
+size 45088768
diff --git a/params_shard_14.bin b/params_shard_14.bin
new file mode 100644
index 0000000000000000000000000000000000000000..51eb93a9535824f2bda2cbf2b9d5f9e30c735508
--- /dev/null
+++ b/params_shard_14.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9d1fffd15a967422bdc74e231281880443793e3287429f49c9b056d7a1f669a7
+size 25165824
diff --git a/params_shard_15.bin b/params_shard_15.bin
new file mode 100644
index 0000000000000000000000000000000000000000..36ade24746511cc1abd3e8bf7b0361ef2eda4077
--- /dev/null
+++ b/params_shard_15.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a43a9efe24c34dcd6052bb9cb4811dc8070e34ce648082b33e4db7e521c58f81
+size 32063488
diff --git a/params_shard_16.bin b/params_shard_16.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ec492788c091d08897765324af8040194c49391e
--- /dev/null
+++ b/params_shard_16.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c73930615bc3783d8380a128e97535f394dbf6997ecde9eac4f0686fe8826123
+size 45088768
diff --git a/params_shard_17.bin b/params_shard_17.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7e6a10821698527c2a9edff84d0f095d8e411b0e
--- /dev/null
+++ b/params_shard_17.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2e2c28dd2feba612a07fcb03cb9b240b8f8e706e6d794d4144f59710478fed82
+size 22544384
diff --git a/params_shard_18.bin b/params_shard_18.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d023a169c6dd1c2d20c726b719b7de44d2653ecb
--- /dev/null
+++ b/params_shard_18.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c62cce9898158992aaa565dffbbe27ec8c6e9c6bff1fcda2784dcb88732597a5
+size 25165824
diff --git a/params_shard_19.bin b/params_shard_19.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cd1fe584311b91dd2142e3b1619cb9e18ab0cfe9
--- /dev/null
+++ b/params_shard_19.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:019486a86c826e31226c102fab4af38f065f41240fa9a6e600bfe0d487190776
+size 32587776
diff --git a/params_shard_2.bin b/params_shard_2.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4775f1f2cc8dfd9fa635112a2f220dedf98d7494
--- /dev/null
+++ b/params_shard_2.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:05df16efdc5e69185f732c19d49f19591e1b987bd626f3b590ac887160089d4c
+size 45088768
diff --git a/params_shard_20.bin b/params_shard_20.bin
new file mode 100644
index 0000000000000000000000000000000000000000..353ef74c2b7998f91bf9035ab60d0a6c0487de66
--- /dev/null
+++ b/params_shard_20.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:397af1e897c9cf608fd5789bafced11fbd9982407258d50efb1dbfdfce1cb7fb
+size 45088768
diff --git a/params_shard_21.bin b/params_shard_21.bin
new file mode 100644
index 0000000000000000000000000000000000000000..15b587a9130a642914b5d3cb0b304a0f439ddfc1
--- /dev/null
+++ b/params_shard_21.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2b70f377bb1f283e6c962773230ea3491920f6bfeee47fb680f7da736ab9172c
+size 25165824
diff --git a/params_shard_22.bin b/params_shard_22.bin
new file mode 100644
index 0000000000000000000000000000000000000000..49d8f06e20e1d3ae8a3c36dd2b1dedf6aa04a8d0
--- /dev/null
+++ b/params_shard_22.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:74edfacc80e30a7a649cfae0377819f5342ac4d5bde43c976c7bce28babaf229
+size 32063488
diff --git a/params_shard_23.bin b/params_shard_23.bin
new file mode 100644
index 0000000000000000000000000000000000000000..10f7a1d19756da0cbe82527dd0eb8f546fcdc3e0
--- /dev/null
+++ b/params_shard_23.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:67ea9aae9e5647984a3645cb3d72da308b8aef3aa7c621cded595a0b6f087a50
+size 45088768
diff --git a/params_shard_24.bin b/params_shard_24.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5653d3f58269faaf72842fec8c1e796e8f20a91b
--- /dev/null
+++ b/params_shard_24.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f80f85477739856f776304bd626d8938a4c005a4a452fa0a9f421b3c6b89ccd2
+size 22544384
diff --git a/params_shard_25.bin b/params_shard_25.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b9989bc14103afca42c11c2643c618c9f747f830
--- /dev/null
+++ b/params_shard_25.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3df20a7762f22b114b9d5cbf8a08a069126f949c42678199d5a392303e5c6d07
+size 25165824
diff --git a/params_shard_26.bin b/params_shard_26.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4656eb635afef272f1bb890b74013c639780ab35
--- /dev/null
+++ b/params_shard_26.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3e5238f553f03a16efe83f300d60d0f6137a8c3f2724782d6d5af79c460bc660
+size 32587776
diff --git a/params_shard_27.bin b/params_shard_27.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ab73d8525c443c769695597f3b52751e88578022
--- /dev/null
+++ b/params_shard_27.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:38efaf942d7a56f1acb3281a58fc4708ad5d17cddf3469f295b190b4357a8c38
+size 45088768
diff --git a/params_shard_28.bin b/params_shard_28.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fa3191849b2f79d5115f0e7ad2ee8e905967194b
--- /dev/null
+++ b/params_shard_28.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fb2ac0e1bd60a791e5548ae6ddcaff6258d33060766629fe0e126e786548d09e
+size 25165824
diff --git a/params_shard_29.bin b/params_shard_29.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bc5082d261711a1da19a0425477d0bc4fc9ced50
--- /dev/null
+++ b/params_shard_29.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e3df028bd3e2bd1c5f38487968897967616dab000fbdba25ff0c984a3ad492e6
+size 32063488
diff --git a/params_shard_3.bin b/params_shard_3.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d452bd3b778501ab49201554b649ff572ba0ea99
--- /dev/null
+++ b/params_shard_3.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:49a6ecaa1fe499daf48adc7940198cf1de34c924f4743d650da50d4852d7487b
+size 22544384
diff --git a/params_shard_30.bin b/params_shard_30.bin
new file mode 100644
index 0000000000000000000000000000000000000000..de2a4e42bf1ae488ad526345ee0fc19c58524d7b
--- /dev/null
+++ b/params_shard_30.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8f9e6a66b63fc533354b379ec28bc35ca0a34470473bbf2fe0a8562c6403bc1c
+size 45088768
diff --git a/params_shard_31.bin b/params_shard_31.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5cfcc7067a75c9797e6e02b3420be046af4141fd
--- /dev/null
+++ b/params_shard_31.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:125badd3055ff20a863986a04709e5eaa7d748e5902ba6ce1abbf099594b6e8d
+size 22544384
diff --git a/params_shard_32.bin b/params_shard_32.bin
new file mode 100644
index 0000000000000000000000000000000000000000..94f45e5c712c9b3fc1e68855d3eef7236333c4ef
--- /dev/null
+++ b/params_shard_32.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e2c49e5606d63ee4ced183674c5def9bf4d96446c9d9b202a7278d1111a73200
+size 25165824
diff --git a/params_shard_33.bin b/params_shard_33.bin
new file mode 100644
index 0000000000000000000000000000000000000000..34530b484d7f53931c73192fa7b7412f5a0fe78a
--- /dev/null
+++ b/params_shard_33.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:61325541206623692516411912c3b3acbbc879990fd31df48be3fdb91dc13767
+size 32587776
diff --git a/params_shard_34.bin b/params_shard_34.bin
new file mode 100644
index 0000000000000000000000000000000000000000..40b3987b8e7599903404697b5cc5737a742955dc
--- /dev/null
+++ b/params_shard_34.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b8f4592b8b59007c256380efda0e57f74758e10a6905db0c27c7506c6d539c04
+size 45088768
diff --git a/params_shard_35.bin b/params_shard_35.bin
new file mode 100644
index 0000000000000000000000000000000000000000..35334eb6a50355d3c0ba46b61a388eefc0b5c8bf
--- /dev/null
+++ b/params_shard_35.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:261d66ced270fd0b9bfdd3d5562fb267d093ad29a86e04aa8d357c94036b0329
+size 25165824
diff --git a/params_shard_36.bin b/params_shard_36.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7d6a2812d8be665225cae9e6c326b675f63f23cb
--- /dev/null
+++ b/params_shard_36.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0d57ffeabec108ee982748b34707a859a725c62cddeb0834f0bd519349723e77
+size 32063488
diff --git a/params_shard_37.bin b/params_shard_37.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3bba41069c9aefc6c92037b1d05c21f18cef4b24
--- /dev/null
+++ b/params_shard_37.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f3cd14ef84b258c21e4195193265202e6930af3621b7430aa138eda0686355d8
+size 45088768
diff --git a/params_shard_38.bin b/params_shard_38.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5a0b0d94d8c60d554d1eade685d658906174ad38
--- /dev/null
+++ b/params_shard_38.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:11090561bdabd9fb4f5e5788bf14463694a5fadb50f7eaddf9e5a8766d420ac7
+size 22544384
diff --git a/params_shard_39.bin b/params_shard_39.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e45b7f28ec53b981d96b659d23db0faab36dc304
--- /dev/null
+++ b/params_shard_39.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e28af7733e37b88e22fa8eed9542bd2cedc2fb6e5264cf5f4f63b6481425acec
+size 25165824
diff --git a/params_shard_4.bin b/params_shard_4.bin
new file mode 100644
index 0000000000000000000000000000000000000000..810b14074a9e01ff83210dff7e078b442964850c
--- /dev/null
+++ b/params_shard_4.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9383d2c20f909d30090da3ca82717861571d5237624cb17363b64039132f9d0f
+size 25165824
diff --git a/params_shard_40.bin b/params_shard_40.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2947601fbbe7810c9d6dc24da289c9577b8d2dd9
--- /dev/null
+++ b/params_shard_40.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a33d11152af57ae1cea623a2cb88a997310f4df455065bd1d9baf0b3a6b0605c
+size 32587776
diff --git a/params_shard_41.bin b/params_shard_41.bin
new file mode 100644
index 0000000000000000000000000000000000000000..27b1ee15fe2e725775be63cb599537e50b15b3f8
--- /dev/null
+++ b/params_shard_41.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:be67b77600d516ee5cf98dd93355b413270f4f4fb989b57aa698b1588589d172
+size 45088768
diff --git a/params_shard_42.bin b/params_shard_42.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5b81c49d7a169b4b043158d84043d8994811dac1
--- /dev/null
+++ b/params_shard_42.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6886594b5ce8c89607373a7675769778f57bf6521bf0984cb25dc6116630e4a7
+size 25165824
diff --git a/params_shard_43.bin b/params_shard_43.bin
new file mode 100644
index 0000000000000000000000000000000000000000..34225b65cb109c2aefb667b50ecd28e929d0aa9d
--- /dev/null
+++ b/params_shard_43.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d61473da7ca02a3c50422bd372c0ae389298d30bcb35687a66748bed73418876
+size 32063488
diff --git a/params_shard_44.bin b/params_shard_44.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a202b444125c882f3da74b46bf24a5d90d8eb9b4
--- /dev/null
+++ b/params_shard_44.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1b751f1f782ab43d992281d62f85b328bfd5af1f144595c645b01ec6bc30cfa6
+size 45088768
diff --git a/params_shard_45.bin b/params_shard_45.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6dceb1748178fc607ab67c6b34e68f67a4136241
--- /dev/null
+++ b/params_shard_45.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:aeed9eac2665fe251bb6abef9f3af30375f2765057eff74ccafbb94c65ea8566
+size 22544384
diff --git a/params_shard_46.bin b/params_shard_46.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4876328b7dab47a9f420f99ec8b376aac6031a6e
--- /dev/null
+++ b/params_shard_46.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:99822e08599aa5c916e833bff6b04519660a049b5bf142bd53a3dd96a8e9bb07
+size 25165824
diff --git a/params_shard_47.bin b/params_shard_47.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a05026b6db0e42080e5ea2b46ecfd2df322753a9
--- /dev/null
+++ b/params_shard_47.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:99993f9ac74c14010435d03bec17c039c84e4ab35a86287b5ce8bb388a6b1764
+size 32587776
diff --git a/params_shard_48.bin b/params_shard_48.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a34d2156fb0a722b67d2537c9fedeeb17b05a8c8
--- /dev/null
+++ b/params_shard_48.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:da8636bf5d391539f9ac09dfc4e313e1fbc023f7d0a6f1ad338167e1160d71ce
+size 45088768
diff --git a/params_shard_49.bin b/params_shard_49.bin
new file mode 100644
index 0000000000000000000000000000000000000000..38e5e059eb1ed7be2052b16073f839c4b88c8426
--- /dev/null
+++ b/params_shard_49.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:08f8846140e8939c4e18bc4259c220b2772e536aa01c7910aa6624675e19bf03
+size 25165824
diff --git a/params_shard_5.bin b/params_shard_5.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f40defdf07f9d1db0452bc2f26c9fbdd54334fdf
--- /dev/null
+++ b/params_shard_5.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:053ce8a663a32bb9818b7d4a0f30dac1415a88568df2d2f9473318bd2fce262f
+size 32587776
diff --git a/params_shard_50.bin b/params_shard_50.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d3db5f871d384fb896f93273f8d1744661134686
--- /dev/null
+++ b/params_shard_50.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5c1e27922215f2f43bb9391dead2468ed8ab2e468dd25ecff469179af2a0d2c3
+size 32063488
diff --git a/params_shard_51.bin b/params_shard_51.bin
new file mode 100644
index 0000000000000000000000000000000000000000..31e93ce1518ecd2e3c12e590acff0951bf2ea8c0
--- /dev/null
+++ b/params_shard_51.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3e983abb12ecdb17519d76b8d0c24e245008051abe0e49d5437b00c9b63622a8
+size 45088768
diff --git a/params_shard_52.bin b/params_shard_52.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1209e5ad67b33caa8a45cd0724a35409ea7707a0
--- /dev/null
+++ b/params_shard_52.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9452d3c7ef584e8cd362b6b1cbd8b1d8e025e85051db5b3a2115bd58fe196ada
+size 22544384
diff --git a/params_shard_53.bin b/params_shard_53.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a35b164b58368f9dea90956d6ae914f1efe61ad8
--- /dev/null
+++ b/params_shard_53.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:262931b30d6a7d276622fc3ae854b6c031af04c00d3c25fb5f07f7095ae3f39b
+size 25165824
diff --git a/params_shard_54.bin b/params_shard_54.bin
new file mode 100644
index 0000000000000000000000000000000000000000..175aed1294446e6195baea8c033647d41f9957bd
--- /dev/null
+++ b/params_shard_54.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ffd85ebfe3865d914c0bfc00757c44bfe8b529b33051a32475883f1513ec22d1
+size 32587776
diff --git a/params_shard_55.bin b/params_shard_55.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1e8059706bbc072dd19284c9f1a1af6995a4274f
--- /dev/null
+++ b/params_shard_55.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:48eb26cb02c6fae9f024a3aba2427c1959a4fab5ce01ca74ee216937364f3b8e
+size 45088768
diff --git a/params_shard_56.bin b/params_shard_56.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c3abe125ca314c9b02bd72ed4dcf527ec6ef1fac
--- /dev/null
+++ b/params_shard_56.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:39e6f03302bd22e5c6d5cea88b3893ac73202caaa2655ab3cbd4e4bcb6db8e6f
+size 25165824
diff --git a/params_shard_57.bin b/params_shard_57.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2cbd5defa368153229db27af1fc6b224d3e74675
--- /dev/null
+++ b/params_shard_57.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:702174ae2a09ec5b7c9e12b57023934742049541770b39e712ff37a103b64134
+size 32063488
diff --git a/params_shard_58.bin b/params_shard_58.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3f382d13812cc818a8b5c2923126a4a78321adab
--- /dev/null
+++ b/params_shard_58.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4414422ac8f093cb2357f9e30ef8767ab3563562b83ec3152b212ae4f539c190
+size 45088768
diff --git a/params_shard_59.bin b/params_shard_59.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ebe0ea1792f7e9f76fd8398bed69b0a0dc6c06bc
--- /dev/null
+++ b/params_shard_59.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:200b65343166eacdfeacf6e035183aeeff3467786d46fb1ac56c1474eb357613
+size 22544384
diff --git a/params_shard_6.bin b/params_shard_6.bin
new file mode 100644
index 0000000000000000000000000000000000000000..76276a3d6d9f256276075ae786022c7e2a4f9fc6
--- /dev/null
+++ b/params_shard_6.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:39de6a39273b155f64273dc1a059429f90f8178427f8ad34f5f3e9353051772f
+size 45088768
diff --git a/params_shard_60.bin b/params_shard_60.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a8c27df791a0773bd50e9a159a19cace5029ad04
--- /dev/null
+++ b/params_shard_60.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7c46ea6c5c09f07ff59a1c6e03fd5af69e038d340b3a825dcdcff159951a371e
+size 25165824
diff --git a/params_shard_61.bin b/params_shard_61.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5dc1c516126bce7be2268be9de6896cce43b881c
--- /dev/null
+++ b/params_shard_61.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:634258411d499870f96cf5bc0a3d7a701e1a0cca8229293f87f2a5fbc08b0c04
+size 32587776
diff --git a/params_shard_62.bin b/params_shard_62.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0a2bc17dfed916a5d3dbd0eb6e7873d6afe15bf4
--- /dev/null
+++ b/params_shard_62.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:508aa5a0ba1ef397bd66238733b0bb29cfe6dd11257f31c3b4456335545b9d46
+size 45088768
diff --git a/params_shard_63.bin b/params_shard_63.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9b0dd6de88ba5174837595c2c1fc6e55e69dd67a
--- /dev/null
+++ b/params_shard_63.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a719483f9868ef754c6f02cb4f6d614287f90d936cd7b8065f0f6159847fd91e
+size 25165824
diff --git a/params_shard_64.bin b/params_shard_64.bin
new file mode 100644
index 0000000000000000000000000000000000000000..da7a9e299a34e41541bd958a8e928808a2614786
--- /dev/null
+++ b/params_shard_64.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e6c2be681b71474d45c48870767e6d9209b1cbe745f6a7710d5ff53bbf01961b
+size 32063488
diff --git a/params_shard_65.bin b/params_shard_65.bin
new file mode 100644
index 0000000000000000000000000000000000000000..29c0c8286f637677d8ba5eeb5b80fa64fb8362ce
--- /dev/null
+++ b/params_shard_65.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3817e162ca0f4e5045e1cd7361710caadd0c0b5f283fe5b0ec25ba6681090d75
+size 45088768
diff --git a/params_shard_66.bin b/params_shard_66.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cfd9cb17e9a3c6c665e1eccae42e9c0b5c96dfeb
--- /dev/null
+++ b/params_shard_66.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:059e301b02fef5cb5f4355b9267450b8be810ac1da78821c56553b571e42675e
+size 22544384
diff --git a/params_shard_67.bin b/params_shard_67.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9f1f94c5c0321f0bc07813508ea56ad7a8c4f08f
--- /dev/null
+++ b/params_shard_67.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:942737d5c1c6a88aa33658ec84edf2fb93ff9bb845710703823c52130c8353f8
+size 25165824
diff --git a/params_shard_68.bin b/params_shard_68.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2e2dcb37e3ac2d0a138ab3f41a728224d5fa2c05
--- /dev/null
+++ b/params_shard_68.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c66f8bcfb124550182c4c69e7788e8c5938c55f109aba8b8463f421dc1e97d4c
+size 32587776
diff --git a/params_shard_69.bin b/params_shard_69.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8dd497647345b65f96a4a24f05ae1e30fc9fc71e
--- /dev/null
+++ b/params_shard_69.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8ccd826dd669d38690ac850e88136ba49ed3aec3526af8c7fc5e341aba238df1
+size 45088768
diff --git a/params_shard_7.bin b/params_shard_7.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1be5f714b522429b1399523928d8864f780e895d
--- /dev/null
+++ b/params_shard_7.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cafe44338bbbf52f9f7b5288a0e4949e97fce9dea89b82de7d9c1fb32ce83de1
+size 25165824
diff --git a/params_shard_70.bin b/params_shard_70.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7c5c71dc9a7fa17956e80654b29c00f5557435fd
--- /dev/null
+++ b/params_shard_70.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5329fdf460403748680f8936b967bffcae24a8e5754ae1c1eb6f5d8461b4f998
+size 25165824
diff --git a/params_shard_71.bin b/params_shard_71.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7912aca5d6aa6f361aa8ad6c37e6f3239afe699f
--- /dev/null
+++ b/params_shard_71.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:28c7eae3a56b57fde9877bf2d9826737272b879245a7783a101d91512785466e
+size 32063488
diff --git a/params_shard_72.bin b/params_shard_72.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e2c0be6284ce68d0923485c86a2b43695f2e0a50
--- /dev/null
+++ b/params_shard_72.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:86e5d75a1b3f00dc76ea475e91eff37bd3d8ee8ce9841500b5d064939c441e70
+size 45088768
diff --git a/params_shard_73.bin b/params_shard_73.bin
new file mode 100644
index 0000000000000000000000000000000000000000..30ed425bd8df123ac6bc34d6fdf703c97c748c97
--- /dev/null
+++ b/params_shard_73.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6e29fe130bc103b451f8f6cca47983c6af98e5681e0ca26761442114c4d7bede
+size 22544384
diff --git a/params_shard_74.bin b/params_shard_74.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a4413bc402edb030dd918e9193280d85482730e2
--- /dev/null
+++ b/params_shard_74.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a91ed2c68b9082b9ffce4b0ea269ec5b5cd5bb3eb5106037e5f978be2e2da0b7
+size 25165824
diff --git a/params_shard_75.bin b/params_shard_75.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8f062b56d1f662d09a46b571640a421585af94cd
--- /dev/null
+++ b/params_shard_75.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:85957101fa5d9be7021c9dfc54901586f1c4b57002cacd21b30fb5c6c7f01561
+size 32587776
diff --git a/params_shard_76.bin b/params_shard_76.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f6d60871024cbcdd3d7120453872d64f61b93262
--- /dev/null
+++ b/params_shard_76.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:64027bee4f1e0cc76c591a624a0a8bc9652ea2f3cbd0a10ec7229e471b0e1536
+size 45088768
diff --git a/params_shard_77.bin b/params_shard_77.bin
new file mode 100644
index 0000000000000000000000000000000000000000..25de55b94d5959b7cc57200bd6856b11f5eb6ad7
--- /dev/null
+++ b/params_shard_77.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:52fa01bc5767c9299217e2f8856f7367b36527a181b2f86e39e0be9bd5b76209
+size 25165824
diff --git a/params_shard_78.bin b/params_shard_78.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fd1175834f73eccaeac8459817325632f2c52317
--- /dev/null
+++ b/params_shard_78.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f9ba28b13c40b7c2fc09fdc4313709fc679965392db94e7e4cc187ed37a84317
+size 32063488
diff --git a/params_shard_79.bin b/params_shard_79.bin
new file mode 100644
index 0000000000000000000000000000000000000000..26db2ab3151f8c0b1b01b2988e16e2440dd600e2
--- /dev/null
+++ b/params_shard_79.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:190a065d70cb7b2c097c5c08c937b96fc3cf4eaf32c491e6f563f89c01568e82
+size 45088768
diff --git a/params_shard_8.bin b/params_shard_8.bin
new file mode 100644
index 0000000000000000000000000000000000000000..539dc46eb2310082eee9b9e2793f3974c76df869
--- /dev/null
+++ b/params_shard_8.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d0bee885deab230251f23a104c629ae91fbc7893a6955db1de9fd06105a29a14
+size 32063488
diff --git a/params_shard_80.bin b/params_shard_80.bin
new file mode 100644
index 0000000000000000000000000000000000000000..54657ff492a7c936e2aa7a5147e6e0ecdf94fc6d
--- /dev/null
+++ b/params_shard_80.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:05a314a101943d5e878d59b30244fe3d702489fee0efe1ad5b57e46b792e2f0b
+size 22544384
diff --git a/params_shard_81.bin b/params_shard_81.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fa35b139831d6f1b820b07653b82d5d4032db4fd
--- /dev/null
+++ b/params_shard_81.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8ce6f679bf83a7e6acb49eb8a5d52e976f8aa0f6756e7482c4b0880ba6dc23fc
+size 25165824
diff --git a/params_shard_82.bin b/params_shard_82.bin
new file mode 100644
index 0000000000000000000000000000000000000000..58cc219ece5c66058197da6d50a65ecbc722e23c
--- /dev/null
+++ b/params_shard_82.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d3b8a1882551989fd15365eee10758adebff03563c85fbab69c8be32a6b3f9d5
+size 32587776
diff --git a/params_shard_83.bin b/params_shard_83.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e2b6ae8859cfa7754c5feac9cdc473e1002d57fd
--- /dev/null
+++ b/params_shard_83.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b9018668d0605419b122e635cab72f5ea0a15290709facd24ef32a55f1dc326c
+size 45088768
diff --git a/params_shard_84.bin b/params_shard_84.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f09c1679b2333607eb7d967cf5e2d58555b73831
--- /dev/null
+++ b/params_shard_84.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fb47cb8a00e137d1da1c8dbcda4e669b90226d2e50e1cbf4bc2f1d90832aa2b6
+size 25165824
diff --git a/params_shard_85.bin b/params_shard_85.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8a5b71599d890a5c9d708d3133109aed3d4fb154
--- /dev/null
+++ b/params_shard_85.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d26ebdc34237e20683c3c48dc4ee677726cddc7ffe74828c1537e4f9884da335
+size 32063488
diff --git a/params_shard_86.bin b/params_shard_86.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8cc72101fd9805ea12faf047d2056d0559893e27
--- /dev/null
+++ b/params_shard_86.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:713113409ee1bc55a5454356db8b78d8e3eca3be5929b8f02b071e619444477b
+size 45088768
diff --git a/params_shard_87.bin b/params_shard_87.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bd44b7bdca1b02c97da61f26b69ee8c1d9e7897c
--- /dev/null
+++ b/params_shard_87.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:41f0dd1965bc1419b5b8af9f900091641c05a9becc05ecb83848dcd8e6f43ad1
+size 22544384
diff --git a/params_shard_88.bin b/params_shard_88.bin
new file mode 100644
index 0000000000000000000000000000000000000000..deed24d08c36ea5e8411c359993fbc0f7d600465
--- /dev/null
+++ b/params_shard_88.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:759eb89873f30054cac4ddb6593af38074f9aefa6945a1df56ddfb0073cf84b8
+size 25165824
diff --git a/params_shard_89.bin b/params_shard_89.bin
new file mode 100644
index 0000000000000000000000000000000000000000..aeb9e94f2e3f96c272f3dd77af93adb0ad03cb30
--- /dev/null
+++ b/params_shard_89.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3f122d1aed7dcc38641649f0d8d42a9bb0ef9ae28eceb1151cb0c571833ce3ab
+size 32587776
diff --git a/params_shard_9.bin b/params_shard_9.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9defe93099a21e6bac363f910b3d45da04c328ad
--- /dev/null
+++ b/params_shard_9.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bfcf80e76cedee76efc42110273c4be5357bf6c0701793c5a3e282ad5eefe9f6
+size 45088768
diff --git a/params_shard_90.bin b/params_shard_90.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b13a30e87c77df74fa9bb0db1e0c78bf8e6c7a68
--- /dev/null
+++ b/params_shard_90.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:934c5492dad5444aad0e560640b0a0289ce9e428b67905b9b271fc0f5b24a00e
+size 45088768
diff --git a/params_shard_91.bin b/params_shard_91.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5c7f913b5bb3dc907eb7b77bb4aeb71f3a7c5c3d
--- /dev/null
+++ b/params_shard_91.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:efdf2c8227a50932550002a400acc9c0497921bbb13666e0fe65d3e317c2b247
+size 25165824
diff --git a/params_shard_92.bin b/params_shard_92.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9c9da6abaedc87497b24cc7e01b38ee54c030c68
--- /dev/null
+++ b/params_shard_92.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5a2fbacb8eaddb9888eddd3b1b8ebe6dab4aa763079fbb572f8b5ded0a1b417e
+size 32063488
diff --git a/params_shard_93.bin b/params_shard_93.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bddd158b7d8c4d4ff79c03d8bfad5174467a525c
--- /dev/null
+++ b/params_shard_93.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5294eb14ce078a8a2f0752336d6035808520d4114232c5cb87465c210373f9a1
+size 45088768
diff --git a/params_shard_94.bin b/params_shard_94.bin
new file mode 100644
index 0000000000000000000000000000000000000000..01fde5b376f51cd224f0e18d3bb463581f4c3b19
--- /dev/null
+++ b/params_shard_94.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c0fa3d4c63c6156ea3f7aba0c2e5fe706d2d5239692d0df37ebc51c04b6e9702
+size 22544384
diff --git a/params_shard_95.bin b/params_shard_95.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9154cb362eb4ce3cb73d6ecc4724fed40dadf850
--- /dev/null
+++ b/params_shard_95.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8dbe3272e6e97db2e1c69577dbca74247ff0a975dec4d1066995cd515f497f65
+size 25165824
diff --git a/params_shard_96.bin b/params_shard_96.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4b6bf9798f7db4ba1671fbddb3776e4bfe021078
--- /dev/null
+++ b/params_shard_96.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:082490c2ea398a249b1729d235f50125d950fdb4c16bda09cde68acfb76b1732
+size 32587776
diff --git a/params_shard_97.bin b/params_shard_97.bin
new file mode 100644
index 0000000000000000000000000000000000000000..36301148f7b230b6c43856a830922893177d8e87
--- /dev/null
+++ b/params_shard_97.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1a2f45adfca7da9e592b0ff29eb22858a40cfa060bab59b23888b7f67eac3a4b
+size 45088768
diff --git a/params_shard_98.bin b/params_shard_98.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d23537367e29646ed964b85d6e68f34a37e381a6
--- /dev/null
+++ b/params_shard_98.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6d0d95f4e358bfa3e28e34f043792fabf720127e5bb9f42aa37a4bd65b454aba
+size 25165824
diff --git a/params_shard_99.bin b/params_shard_99.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3967e2fbe9f5721205bfc91c0c0b6e04776a5518
--- /dev/null
+++ b/params_shard_99.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:aafd2e420c7a8065ffb3f1d5c7f98f8cd96297f97138c64182a9dfffd945e113
+size 32063488
diff --git a/tokenizer.model b/tokenizer.model
new file mode 100644
index 0000000000000000000000000000000000000000..6c00c742ce03c627d6cd5b795984876fa49fa899
--- /dev/null
+++ b/tokenizer.model
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347
+size 499723
diff --git a/tokenizer_config.json b/tokenizer_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..5557c019f635783532b53857546f2c72db496f76
--- /dev/null
+++ b/tokenizer_config.json
@@ -0,0 +1,35 @@
+{
+ "add_bos_token": true,
+ "add_eos_token": false,
+ "bos_token": {
+ "__type": "AddedToken",
+ "content": "<s>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "clean_up_tokenization_spaces": false,
+ "eos_token": {
+ "__type": "AddedToken",
+ "content": "</s>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "legacy": false,
+ "model_max_length": 1000000000000000019884624838656,
+ "pad_token": null,
+ "sp_model_kwargs": {},
+ "tokenizer_class": "LlamaTokenizer",
+ "unk_token": {
+ "__type": "AddedToken",
+ "content": "<unk>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "use_fast": false
+}