diff --git a/.gitattributes b/.gitattributes index a6344aac8c09253b3b630fb776ae94478aa0275b..81306b699a68101c179dcdf148ca46e914c46477 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +chatglm3-6b-32k-q4f16_1-vulkan.so filter=lfs diff=lfs merge=lfs -text diff --git a/chatglm3-6b-32k-q4f16_1-vulkan.so b/chatglm3-6b-32k-q4f16_1-vulkan.so new file mode 100644 index 0000000000000000000000000000000000000000..746542a4d7af58100743f65a2dab63737de131bf --- /dev/null +++ b/chatglm3-6b-32k-q4f16_1-vulkan.so @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55f9457b6ee4fcb95ac32533584b69eab21842db59ee3c87ff2d6d76011ab160 +size 3438128 diff --git a/mod_cache_before_build.pkl b/mod_cache_before_build.pkl new file mode 100644 index 0000000000000000000000000000000000000000..415c6be752b77619a1e18cac27b04805c541e591 --- /dev/null +++ b/mod_cache_before_build.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6440a828b855f62f17aa495b7dcd9178aba8721c0fc58a673527f8cfc79fd3d1 +size 12677455 diff --git a/params/mlc-chat-config.json b/params/mlc-chat-config.json new file mode 100644 index 0000000000000000000000000000000000000000..49df6a74286873c909ff45e5ac64eb92bfc55e84 --- /dev/null +++ b/params/mlc-chat-config.json @@ -0,0 +1,21 @@ +{ + "model_lib": "chatglm3-6b-32k-q4f16_1", + "local_id": "chatglm3-6b-32k-q4f16_1", + "conv_template": "glm", + "temperature": 0.7, + "repetition_penalty": 1.0, + "top_p": 0.95, + "mean_gen_len": 128, + "max_gen_len": 2048, + "num_shards": 1, + "use_presharded_weights": false, + "shift_fill_factor": 0.3, + "tokenizer_files": [ + "tokenizer.model" + ], + "model_category": "chatglm", + "model_name": "chatglm3-6b-32k", + "vocab_size": 65024, + "prefill_chunk_size": -1, + "max_window_size": 2048 +} \ No newline at end of file diff --git a/params/ndarray-cache.json b/params/ndarray-cache.json new file mode 100644 index 0000000000000000000000000000000000000000..a994f525a93b8109a4007aa3db6c5c75a7d3bb8e --- /dev/null +++ b/params/ndarray-cache.json @@ -0,0 +1,4069 @@ +{ + "metadata": { + "ParamSize": 313 + }, + "records": [ + { + "dataPath": "params_shard_0.bin", + "format": "raw-shard", + "nbytes": 133169152, + "records": [ + { + "name": "param_0", + "shape": [ + 65024, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 133169152, + "byteOffset": 0 + } + ], + "md5sum": "42fc524c24a453fd04b2987a2c369f65" + }, + { + "dataPath": "params_shard_1.bin", + "format": "raw-shard", + "nbytes": 27288576, + "records": [ + { + "name": "param_1", + "shape": [ + 65024, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 16646144, + "byteOffset": 0 + }, + { + "name": "param_2", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 16646144 + }, + { + "name": "param_3", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 16654336 + }, + { + "name": "param_4", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 16662528 + }, + { + "name": "param_5", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 26099712 + }, + { + "name": "param_6", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 27279360 + } + ], + "md5sum": "aabbe9ded0b2d6f98bfd21a2584313b7" + }, + { + "dataPath": "params_shard_2.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_9", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "c89781afcb78a8f54b4753e28f84e6bd" + }, + { + "dataPath": "params_shard_3.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_11", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "54b327a2b135dc3bea5fb15d38c7c34d" + }, + { + "dataPath": "params_shard_4.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_7", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_8", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_10", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_12", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_13", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_14", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_15", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_16", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_17", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "0ceaf97e95270836ee88fa0417c320cf" + }, + { + "dataPath": "params_shard_5.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_20", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "d26947ee4d57cc68b6a6f4019210f605" + }, + { + "dataPath": "params_shard_6.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_22", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "262985faaadfcf5505639b0740c406b1" + }, + { + "dataPath": "params_shard_7.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_18", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_19", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_21", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_23", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_24", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_25", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_26", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_27", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_28", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "307480478ae463d5cb61272041a3bdfc" + }, + { + "dataPath": "params_shard_8.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_31", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "4f94c682807dcea90a471fc72225b9bf" + }, + { + "dataPath": "params_shard_9.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_33", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "dae9011148a39b3851fb8d54f231b75b" + }, + { + "dataPath": "params_shard_10.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_29", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_30", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_32", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_34", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_35", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_36", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_37", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_38", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_39", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "454341798cb64d7abacab02da606d1ec" + }, + { + "dataPath": "params_shard_11.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_42", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "9686c52643d07deb79cc6927df4b74e9" + }, + { + "dataPath": "params_shard_12.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_44", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "5446c5490b99f3434b6ca7fce9bcdf5f" + }, + { + "dataPath": "params_shard_13.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_40", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_41", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_43", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_45", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_46", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_47", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_48", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_49", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_50", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "151e7dc1fa66b670eec06f08076bd85a" + }, + { + "dataPath": "params_shard_14.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_53", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "a8c1c25ecc4d00838bd66e94e213b127" + }, + { + "dataPath": "params_shard_15.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_55", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "1fa79bddb918a32cb638a353b54d5003" + }, + { + "dataPath": "params_shard_16.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_51", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_52", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_54", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_56", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_57", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_58", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_59", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_60", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_61", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "b7b7cdb68c4903387e9a414b7b8ef6d8" + }, + { + "dataPath": "params_shard_17.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_64", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "4960df9f8de79192a4ab4c27d561e78f" + }, + { + "dataPath": "params_shard_18.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_66", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "55d89e37cb70d8e574f8238d61d93451" + }, + { + "dataPath": "params_shard_19.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_62", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_63", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_65", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_67", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_68", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_69", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_70", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_71", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_72", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "c902e088088b8fcc159034887dc6fdad" + }, + { + "dataPath": "params_shard_20.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_75", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "1310288ae2f6f279f8b17b4c4cb5a1fd" + }, + { + "dataPath": "params_shard_21.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_77", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "89bf6d551cd085292699e4f3181d012c" + }, + { + "dataPath": "params_shard_22.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_73", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_74", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_76", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_78", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_79", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_80", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_81", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_82", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_83", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "c7f2d197659b64d3d1a5166d7f7b1ea0" + }, + { + "dataPath": "params_shard_23.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_86", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "312cb2f5705c863409b169d9549bb257" + }, + { + "dataPath": "params_shard_24.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_88", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "4c6afd68424aa83e825f4437020ff308" + }, + { + "dataPath": "params_shard_25.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_84", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_85", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_87", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_89", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_90", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_91", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_92", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_93", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_94", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "00a8a765f80b213a665eeaa94c7c92f6" + }, + { + "dataPath": "params_shard_26.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_97", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "f2223d25bb387c4192a23176b466dca0" + }, + { + "dataPath": "params_shard_27.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_99", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "456aa67ae4ef769ebfbef14bc2a9f4b5" + }, + { + "dataPath": "params_shard_28.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_95", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_96", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_98", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_100", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_101", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_102", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_103", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_104", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_105", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "cc789c238d0c84e491993908c91b43b6" + }, + { + "dataPath": "params_shard_29.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_108", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "1150cbf79a26154896576e4d6a0586ff" + }, + { + "dataPath": "params_shard_30.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_110", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "82f849bf4441f21b88fdd9225a801b8e" + }, + { + "dataPath": "params_shard_31.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_106", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_107", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_109", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_111", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_112", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_113", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_114", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_115", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_116", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "885399dcaed11516f7d8eb0b73c5837b" + }, + { + "dataPath": "params_shard_32.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_119", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "42231ed36d80431a91cd21669b09be17" + }, + { + "dataPath": "params_shard_33.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_121", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "caab09038b7460f04462dcb4dca7712d" + }, + { + "dataPath": "params_shard_34.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_117", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_118", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_120", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_122", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_123", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_124", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_125", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_126", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_127", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "6167188a47399143712d90517860ae93" + }, + { + "dataPath": "params_shard_35.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_130", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "838a5afe52393575678a1cdf2d5ce76b" + }, + { + "dataPath": "params_shard_36.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_132", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "fb84677ba4af07bd8e80f064b717d743" + }, + { + "dataPath": "params_shard_37.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_128", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_129", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_131", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_133", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_134", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_135", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_136", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_137", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_138", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "afe211e902345c4fa09a7535715df1c9" + }, + { + "dataPath": "params_shard_38.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_141", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "511bb5a0cb4579e7a41c432e9d042158" + }, + { + "dataPath": "params_shard_39.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_143", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "857427edcd66211a6c3587437762700c" + }, + { + "dataPath": "params_shard_40.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_139", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_140", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_142", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_144", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_145", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_146", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_147", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_148", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_149", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "4fe126ca697186b12d7eee992655bc81" + }, + { + "dataPath": "params_shard_41.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_152", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "daaf962fe1e87c7cbbb082c84c815c48" + }, + { + "dataPath": "params_shard_42.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_154", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "6ac7f27fa76285fe75f3928d0626224f" + }, + { + "dataPath": "params_shard_43.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_150", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_151", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_153", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_155", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_156", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_157", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_158", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_159", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_160", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "ef4a64022eef83689fed2f7935d72b80" + }, + { + "dataPath": "params_shard_44.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_163", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "2d00eba684bdcebbb751e02db525de29" + }, + { + "dataPath": "params_shard_45.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_165", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "a3aeaf04fa944a1b2a97ac61953f7b2f" + }, + { + "dataPath": "params_shard_46.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_161", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_162", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_164", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_166", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_167", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_168", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_169", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_170", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_171", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "edaf19512d929c7c8d5f8d305b55d54d" + }, + { + "dataPath": "params_shard_47.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_174", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "d8ec270c76e1d0208a499051e534b966" + }, + { + "dataPath": "params_shard_48.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_176", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "2a556e674447a785903a14ad45ef3a92" + }, + { + "dataPath": "params_shard_49.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_172", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_173", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_175", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_177", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_178", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_179", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_180", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_181", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_182", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "e624e1c47fbabed975a9fb16965f00a7" + }, + { + "dataPath": "params_shard_50.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_185", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "7138cb07c69d0b177ce8cae55388b3fd" + }, + { + "dataPath": "params_shard_51.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_187", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "608d05d0923596aca8cbd6c10d40960b" + }, + { + "dataPath": "params_shard_52.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_183", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_184", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_186", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_188", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_189", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_190", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_191", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_192", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_193", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "089fd18fbdfb1841fd8cdd2f953fb875" + }, + { + "dataPath": "params_shard_53.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_196", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "2809c30cb7094df60d74b09433d1b521" + }, + { + "dataPath": "params_shard_54.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_198", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "23ad619a3b861e696a73f9df2277c749" + }, + { + "dataPath": "params_shard_55.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_194", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_195", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_197", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_199", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_200", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_201", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_202", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_203", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_204", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "9731f9e2d3786c638588a7d8c4e319c9" + }, + { + "dataPath": "params_shard_56.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_207", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "705919d96834329bed0f29d27bcd6e84" + }, + { + "dataPath": "params_shard_57.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_209", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "9432b521a7879fd4056332489e992848" + }, + { + "dataPath": "params_shard_58.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_205", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_206", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_208", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_210", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_211", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_212", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_213", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_214", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_215", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "be27db945f70364e149c7a45e9eb3c39" + }, + { + "dataPath": "params_shard_59.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_218", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "2c74488ca87d7ccc82f7ce73eaad1c56" + }, + { + "dataPath": "params_shard_60.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_220", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "5263e41ade304dc261e4cde09ef509f8" + }, + { + "dataPath": "params_shard_61.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_216", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_217", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_219", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_221", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_222", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_223", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_224", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_225", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_226", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "ae42d3d8c258d418e79b3944d968b88f" + }, + { + "dataPath": "params_shard_62.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_229", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "6cc194bef771d9f1b69be533ec63f73c" + }, + { + "dataPath": "params_shard_63.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_231", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "4393706f924a741bf5c15168099ff0e2" + }, + { + "dataPath": "params_shard_64.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_227", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_228", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_230", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_232", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_233", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_234", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_235", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_236", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_237", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "60f8df43e294b10f655ada24244154ce" + }, + { + "dataPath": "params_shard_65.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_240", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "b313e0f39e2dcc99c1b2a4c15dcd596f" + }, + { + "dataPath": "params_shard_66.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_242", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "c9e6ef74af7fc8d5a1c2e9d9ff9f8f39" + }, + { + "dataPath": "params_shard_67.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_238", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_239", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_241", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_243", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_244", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_245", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_246", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_247", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_248", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "e26d9d85c7247e38afb86c026b1fe8bc" + }, + { + "dataPath": "params_shard_68.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_251", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "f6e4785317a4741444ad43c49c1bc7c7" + }, + { + "dataPath": "params_shard_69.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_253", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "69a387818a53eeb636c332c739d8374f" + }, + { + "dataPath": "params_shard_70.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_249", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_250", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_252", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_254", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_255", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_256", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_257", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_258", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_259", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "a83744344f667dc9bb6afc07568a615e" + }, + { + "dataPath": "params_shard_71.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_262", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "1f8611df19a27665c9064368a199a329" + }, + { + "dataPath": "params_shard_72.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_264", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "88c7a3c97eba4f3f3e77c4cfc567f833" + }, + { + "dataPath": "params_shard_73.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_260", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_261", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_263", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_265", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_266", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_267", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_268", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_269", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_270", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "6ac73f00246805deba992a5d58800503" + }, + { + "dataPath": "params_shard_74.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_273", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "5b00d06d859e9f5309f2e99e5f1813bf" + }, + { + "dataPath": "params_shard_75.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_275", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "0b41e037d6b9fd716666f4fc26cd2724" + }, + { + "dataPath": "params_shard_76.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_271", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_272", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_274", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_276", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_277", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_278", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_279", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_280", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_281", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "12ea8d869579c8d143f4ae2db03ceb18" + }, + { + "dataPath": "params_shard_77.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_284", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "b9ced0d8c388f47cdd75e7037e72baed" + }, + { + "dataPath": "params_shard_78.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_286", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "d8f7446480c02648b5a616a4f9153cea" + }, + { + "dataPath": "params_shard_79.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_282", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_283", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_285", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_287", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_288", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_289", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_290", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_291", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_292", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "e819b2d60b3849f98bc1af047ce615c2" + }, + { + "dataPath": "params_shard_80.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_295", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "2ae7bf62dac77c085df5756ac1e71fcc" + }, + { + "dataPath": "params_shard_81.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_297", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "035e99b84a6cc22aec58d22586678e10" + }, + { + "dataPath": "params_shard_82.bin", + "format": "raw-shard", + "nbytes": 30598144, + "records": [ + { + "name": "param_293", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_294", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_296", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_298", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_299", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + }, + { + "name": "param_300", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19963904 + }, + { + "name": "param_301", + "shape": [ + 4608, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 9437184, + "byteOffset": 19972096 + }, + { + "name": "param_302", + "shape": [ + 4608, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1179648, + "byteOffset": 29409280 + }, + { + "name": "param_303", + "shape": [ + 4608 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9216, + "byteOffset": 30588928 + } + ], + "md5sum": "7acc1017e1728c9ed9c5a77de2081abc" + }, + { + "dataPath": "params_shard_83.bin", + "format": "raw-shard", + "nbytes": 56098816, + "records": [ + { + "name": "param_306", + "shape": [ + 27392, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 56098816, + "byteOffset": 0 + } + ], + "md5sum": "623327b7ff58aed793bb144f5a038951" + }, + { + "dataPath": "params_shard_84.bin", + "format": "raw-shard", + "nbytes": 28049408, + "records": [ + { + "name": "param_308", + "shape": [ + 4096, + 1712 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 28049408, + "byteOffset": 0 + } + ], + "md5sum": "877e4159205c7fd233f0180f377df14a" + }, + { + "dataPath": "params_shard_85.bin", + "format": "raw-shard", + "nbytes": 133169152, + "records": [ + { + "name": "param_311", + "shape": [ + 65024, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 133169152, + "byteOffset": 0 + } + ], + "md5sum": "cd0bff18427bb2b037825369d8c637ed" + }, + { + "dataPath": "params_shard_86.bin", + "format": "raw-shard", + "nbytes": 19963904, + "records": [ + { + "name": "param_304", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_305", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_307", + "shape": [ + 27392, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7012352, + "byteOffset": 9437184 + }, + { + "name": "param_309", + "shape": [ + 4096, + 428 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3506176, + "byteOffset": 16449536 + }, + { + "name": "param_310", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 19955712 + } + ], + "md5sum": "d4a42ea0489cf705c396b2f1befb3849" + }, + { + "dataPath": "params_shard_87.bin", + "format": "raw-shard", + "nbytes": 16646144, + "records": [ + { + "name": "param_312", + "shape": [ + 65024, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 16646144, + "byteOffset": 0 + } + ], + "md5sum": "2565842220b4812ca2e480865c30f09c" + } + ] +} \ No newline at end of file diff --git a/params/params_shard_0.bin b/params/params_shard_0.bin new file mode 100644 index 0000000000000000000000000000000000000000..3a09ea1ea0c0ac950c36ab639824170b08ad5381 --- /dev/null +++ b/params/params_shard_0.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed4f43ba35a8b17206ae7dcec9ad5431484c048de6a5d8be898c2f1f823688cb +size 133169152 diff --git a/params/params_shard_1.bin b/params/params_shard_1.bin new file mode 100644 index 0000000000000000000000000000000000000000..c0cf11a32c53c73d6fab1b814c76b946151ec521 --- /dev/null +++ b/params/params_shard_1.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:611b86fcd50b757f75fe1b1018afaaa046fbd8b84ffde1b4fd1f55cff38fc928 +size 27288576 diff --git a/params/params_shard_10.bin b/params/params_shard_10.bin new file mode 100644 index 0000000000000000000000000000000000000000..647776fc976b190d885378fa15c6e286a67e97dd --- /dev/null +++ b/params/params_shard_10.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7709260bf229819628d2bb048596d769c97bba5b149afde2ab5c18b8cd1f0a8 +size 30598144 diff --git a/params/params_shard_11.bin b/params/params_shard_11.bin new file mode 100644 index 0000000000000000000000000000000000000000..fe97ad71a844f0ba11f35f0ecdf26ed81597e908 --- /dev/null +++ b/params/params_shard_11.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39eb81bffd393e26b24c663f641fce38086ac4e96b2b2871ade057ef2809adee +size 56098816 diff --git a/params/params_shard_12.bin b/params/params_shard_12.bin new file mode 100644 index 0000000000000000000000000000000000000000..5b183d9e07951c8b4d0d2cd20a4939ddc6d14e3b --- /dev/null +++ b/params/params_shard_12.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e69b7e0b676c4c95f82939d0f807b70d076778af6e893ca3b0cc84bd1adcd98 +size 28049408 diff --git a/params/params_shard_13.bin b/params/params_shard_13.bin new file mode 100644 index 0000000000000000000000000000000000000000..cc8acfcebb25ba37f35507cbb96a8d3e2f0dc7f6 --- /dev/null +++ b/params/params_shard_13.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8dc507e758c8d982623b297f2d11029f90fcead7bffe610c41094d9e61290b6 +size 30598144 diff --git a/params/params_shard_14.bin b/params/params_shard_14.bin new file mode 100644 index 0000000000000000000000000000000000000000..3133dbdf2fc501d83fef994aa914347a97b7541a --- /dev/null +++ b/params/params_shard_14.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10fa5d998f82be654cb84fde61c60923f636744fec3d046b037da365070ad914 +size 56098816 diff --git a/params/params_shard_15.bin b/params/params_shard_15.bin new file mode 100644 index 0000000000000000000000000000000000000000..93aca46ffdcc54073168d0730a161be512cc2220 --- /dev/null +++ b/params/params_shard_15.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0629d5b4551ef44b2fbc0a9384c1801ef5e92d1b47f2553fbb9bcad3079ac12f +size 28049408 diff --git a/params/params_shard_16.bin b/params/params_shard_16.bin new file mode 100644 index 0000000000000000000000000000000000000000..4208d2f1c95bf8416147f61b13c65c1094370f51 --- /dev/null +++ b/params/params_shard_16.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:726cb887470b34cd30199db7d44b03654750d9f87fff69b412c6469b9e6b9351 +size 30598144 diff --git a/params/params_shard_17.bin b/params/params_shard_17.bin new file mode 100644 index 0000000000000000000000000000000000000000..29f88487052d0cfc2b20c660a83958567ba434a7 --- /dev/null +++ b/params/params_shard_17.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58de044b2f46e5aa3a4beaa185e2f43f80c6999487404d83a3d9ad04d14075d8 +size 56098816 diff --git a/params/params_shard_18.bin b/params/params_shard_18.bin new file mode 100644 index 0000000000000000000000000000000000000000..15d0078e05a01e71ecb9569eae8fb78b7975cc2d --- /dev/null +++ b/params/params_shard_18.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:531b842ab75be93477d7640e6d9d01851d268d3eb8c28d62bed0e2cd98600ea7 +size 28049408 diff --git a/params/params_shard_19.bin b/params/params_shard_19.bin new file mode 100644 index 0000000000000000000000000000000000000000..1d555f2771879dc570d2c40b650a2059f567622a --- /dev/null +++ b/params/params_shard_19.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a8c92f25e601d26b6e1f21d9c53527ce6a37a976832b324b87bd9455747f3e6 +size 30598144 diff --git a/params/params_shard_2.bin b/params/params_shard_2.bin new file mode 100644 index 0000000000000000000000000000000000000000..bcbdede6f2b85a037b7f85802ec23a111dc57b3a --- /dev/null +++ b/params/params_shard_2.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8080cebba6d3b6d7171153c804c739cdfc06c87cd8e689a723b83db8973b9875 +size 56098816 diff --git a/params/params_shard_20.bin b/params/params_shard_20.bin new file mode 100644 index 0000000000000000000000000000000000000000..8c24c2f5f676a9dd6da8ae4cc4bf10a12b658e49 --- /dev/null +++ b/params/params_shard_20.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6e9ea27ab681bcc9c3d702ffa450137bfbe52f341acd2a6bb0c8a2a856a5353 +size 56098816 diff --git a/params/params_shard_21.bin b/params/params_shard_21.bin new file mode 100644 index 0000000000000000000000000000000000000000..5f040ce730707a0e832b73b44cd8b2a591ac787a --- /dev/null +++ b/params/params_shard_21.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcfb9cb3b101d1a98fe4643a4ac0319cb7eb4bce684ed44b8512c777c593609c +size 28049408 diff --git a/params/params_shard_22.bin b/params/params_shard_22.bin new file mode 100644 index 0000000000000000000000000000000000000000..f9c0120ae5ffa48453cd391cf25112cbfc6fbd54 --- /dev/null +++ b/params/params_shard_22.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d0bacd8ffd641395897081d9613cb3a7a8f1d589050c0c9a33ac22eb7c18778 +size 30598144 diff --git a/params/params_shard_23.bin b/params/params_shard_23.bin new file mode 100644 index 0000000000000000000000000000000000000000..045f4f0f9f6425193cfaa71b9d9dabc8325f5f81 --- /dev/null +++ b/params/params_shard_23.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef6e8bf2d82e46845f62af39db3eaa0392339c52dab847c755839039d49849fe +size 56098816 diff --git a/params/params_shard_24.bin b/params/params_shard_24.bin new file mode 100644 index 0000000000000000000000000000000000000000..a04367292ff2301243b0fd3863b24f4f612a742c --- /dev/null +++ b/params/params_shard_24.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccf9b5f51abb144667606ded352687cd8f590988769395ef29a8dfadf91bb818 +size 28049408 diff --git a/params/params_shard_25.bin b/params/params_shard_25.bin new file mode 100644 index 0000000000000000000000000000000000000000..1b97f27c16e8e50ffc8b07711e7fbfb69fb5bb10 --- /dev/null +++ b/params/params_shard_25.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a7719fb6d56c35ecf2979cb281668d742b7c9a399cd9ed0d337994033672417 +size 30598144 diff --git a/params/params_shard_26.bin b/params/params_shard_26.bin new file mode 100644 index 0000000000000000000000000000000000000000..d171b1fb56b2204e60aa8c8809e36be727e1104d --- /dev/null +++ b/params/params_shard_26.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b9a4a0f398cae6707407431253f8c41a9cc7001e7439680a3e6fc5247eae29c +size 56098816 diff --git a/params/params_shard_27.bin b/params/params_shard_27.bin new file mode 100644 index 0000000000000000000000000000000000000000..8d2f1f1cf7f0e71a8c3389ff01c750e211ca7e7f --- /dev/null +++ b/params/params_shard_27.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6aed5e5fa61b23924bbbc94f920adfe1f0f656339faf7b6d4169366192be5ee +size 28049408 diff --git a/params/params_shard_28.bin b/params/params_shard_28.bin new file mode 100644 index 0000000000000000000000000000000000000000..ea2588e362e2db4a284697cee012ffefb6669a4e --- /dev/null +++ b/params/params_shard_28.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3c81be0da6a44ffdc1450c156b11f04a732ce997e94c624d55296ee01a1f499 +size 30598144 diff --git a/params/params_shard_29.bin b/params/params_shard_29.bin new file mode 100644 index 0000000000000000000000000000000000000000..22a535067a609276dfe23f5c728702997da231f6 --- /dev/null +++ b/params/params_shard_29.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d539746402ec7c293956334d8454f0036170ac18d16e1d126bad3857f2f6204c +size 56098816 diff --git a/params/params_shard_3.bin b/params/params_shard_3.bin new file mode 100644 index 0000000000000000000000000000000000000000..5410549bcc880fb555d1b92d311a44b207e7fb9e --- /dev/null +++ b/params/params_shard_3.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e614da732df246cfed96ee116d1844afc0452632b8fc408a238b03892710c17 +size 28049408 diff --git a/params/params_shard_30.bin b/params/params_shard_30.bin new file mode 100644 index 0000000000000000000000000000000000000000..4dadefd45ef4dd1b3e05f18ae8b5a68e153f0966 --- /dev/null +++ b/params/params_shard_30.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48320202aa696acd748d46e64069a982b1a7a28d40924bc61ac9c29050525696 +size 28049408 diff --git a/params/params_shard_31.bin b/params/params_shard_31.bin new file mode 100644 index 0000000000000000000000000000000000000000..2ab85436c12bc671666762ff40695adf326b0ec2 --- /dev/null +++ b/params/params_shard_31.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20ec7ee1032dbb66272bf5b33205d294cf8312448560b368e65c5e17682e4422 +size 30598144 diff --git a/params/params_shard_32.bin b/params/params_shard_32.bin new file mode 100644 index 0000000000000000000000000000000000000000..4ecf5277216584f18549c23b99f479474fedf5b3 --- /dev/null +++ b/params/params_shard_32.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62545e96b1bec86e1a60b4fadd39befb0780aecc1898d30516bb557f228fc4ef +size 56098816 diff --git a/params/params_shard_33.bin b/params/params_shard_33.bin new file mode 100644 index 0000000000000000000000000000000000000000..2bf92f428907dd59908c59df7ce678f93f173e64 --- /dev/null +++ b/params/params_shard_33.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd74bab722eecab6ba1324c17d9836e58ae191a811729cd026e57f199145a553 +size 28049408 diff --git a/params/params_shard_34.bin b/params/params_shard_34.bin new file mode 100644 index 0000000000000000000000000000000000000000..029ed0eb180606b9d325584f11bce66d615f02b2 --- /dev/null +++ b/params/params_shard_34.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d72bbc0fc80dabab9b1ce0b53d7e2956f8b0e2f93405a7411df313f17228a019 +size 30598144 diff --git a/params/params_shard_35.bin b/params/params_shard_35.bin new file mode 100644 index 0000000000000000000000000000000000000000..f11edfde8ee6b542fee98cc0795ff7a0e9f100b8 --- /dev/null +++ b/params/params_shard_35.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7c674855a37b40934b350b526ca2866cf6053b33ef752206812090b74b7bbc7 +size 56098816 diff --git a/params/params_shard_36.bin b/params/params_shard_36.bin new file mode 100644 index 0000000000000000000000000000000000000000..552ee55de17592dee7b0e92b7e64d82e6dd8d4ec --- /dev/null +++ b/params/params_shard_36.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b470de27131de6805dc75e42991fa466766e76332b0dad07d607167eebd967d2 +size 28049408 diff --git a/params/params_shard_37.bin b/params/params_shard_37.bin new file mode 100644 index 0000000000000000000000000000000000000000..6e31a9f63112247c2e29cbd15fc0a44e990a361c --- /dev/null +++ b/params/params_shard_37.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:071fac6ea8c79b2977f09770259c6ac5819e8e2cec09d416cc6ed4f18b90b36c +size 30598144 diff --git a/params/params_shard_38.bin b/params/params_shard_38.bin new file mode 100644 index 0000000000000000000000000000000000000000..ed066af9cedfae49dcd4737d70ad4a8a9ae4dd60 --- /dev/null +++ b/params/params_shard_38.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a7867a175b7652c94ea5ff2f557c9065c623b3e61f1a8ea641ae2fb17671b29 +size 56098816 diff --git a/params/params_shard_39.bin b/params/params_shard_39.bin new file mode 100644 index 0000000000000000000000000000000000000000..a6a593533685dcdd392a1cf4d7093e58273868dd --- /dev/null +++ b/params/params_shard_39.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c450364969b2f4ede904166160d099f2a0dc2edc9ae2d95a5c77a3118b72564d +size 28049408 diff --git a/params/params_shard_4.bin b/params/params_shard_4.bin new file mode 100644 index 0000000000000000000000000000000000000000..f42ced1d750ac8fd886fae1555f66b573f399ba6 --- /dev/null +++ b/params/params_shard_4.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93b0e80dfed33ec27a5ecd61c87a082394bc68572fca7032fc10a4dc957aecf3 +size 30598144 diff --git a/params/params_shard_40.bin b/params/params_shard_40.bin new file mode 100644 index 0000000000000000000000000000000000000000..e0a4449cb8a34e1b51b0e08dfbaf9145f99851c2 --- /dev/null +++ b/params/params_shard_40.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36462f4c2eff8dfddb076a930e6440c959395454bdbac2185b416fc0f3040a91 +size 30598144 diff --git a/params/params_shard_41.bin b/params/params_shard_41.bin new file mode 100644 index 0000000000000000000000000000000000000000..0ab75eb13fa2fc258371d3cb8a7cb33e2f37e568 --- /dev/null +++ b/params/params_shard_41.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61ec1476e1de02f4ab63aee6b7ce0d362dcc68a4719952c735cc1a9fc1795b5d +size 56098816 diff --git a/params/params_shard_42.bin b/params/params_shard_42.bin new file mode 100644 index 0000000000000000000000000000000000000000..9edaede410264e0bb10db8e2c6270bcdd7be433c --- /dev/null +++ b/params/params_shard_42.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d389a4300ff77b99b6a636471654a97662766b1fc6826883db6ae75f27596192 +size 28049408 diff --git a/params/params_shard_43.bin b/params/params_shard_43.bin new file mode 100644 index 0000000000000000000000000000000000000000..865841c09459476a84634a8a0c4a1073e641ab16 --- /dev/null +++ b/params/params_shard_43.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e0a4741a8c1b7be28e5262c3042833b77301827152eb711898aaf2902557ecf +size 30598144 diff --git a/params/params_shard_44.bin b/params/params_shard_44.bin new file mode 100644 index 0000000000000000000000000000000000000000..d60909f2271a3dc5b52dccc7815f062a072e796b --- /dev/null +++ b/params/params_shard_44.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d44a879399216f46a531ac173602d2670da8fb0db5294d7178a12f9dc87ac1b2 +size 56098816 diff --git a/params/params_shard_45.bin b/params/params_shard_45.bin new file mode 100644 index 0000000000000000000000000000000000000000..a00ee6d51c3a392f3205e5bfd8732c6398cf523f --- /dev/null +++ b/params/params_shard_45.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b8b68c1a38b2aa92528679e4d6c67166443f05e33d563102392ab833afeaefc +size 28049408 diff --git a/params/params_shard_46.bin b/params/params_shard_46.bin new file mode 100644 index 0000000000000000000000000000000000000000..ee28af450321c6814b318d70ea595f3dca7829ab --- /dev/null +++ b/params/params_shard_46.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c86adba88968d4dc7a78f9e95aca23019e027d8b7b8f0260066e1d1722b258af +size 30598144 diff --git a/params/params_shard_47.bin b/params/params_shard_47.bin new file mode 100644 index 0000000000000000000000000000000000000000..c157a209e2f139fc40ff445965b30ab3c51badcd --- /dev/null +++ b/params/params_shard_47.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b94ea32e0e01dacc83d7bc44aade7eb4ecd98d9de4eff7b7ea92b31619d6a17 +size 56098816 diff --git a/params/params_shard_48.bin b/params/params_shard_48.bin new file mode 100644 index 0000000000000000000000000000000000000000..2dfa10bcabbc739242ffa5bb3a7eca37106a6598 --- /dev/null +++ b/params/params_shard_48.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c4d81a596a3df12cd6bf308b0b5cda808330a9df04a32e9d322fcb021f87eca +size 28049408 diff --git a/params/params_shard_49.bin b/params/params_shard_49.bin new file mode 100644 index 0000000000000000000000000000000000000000..4ccc6f41aa207fd7781292f1c24fa8a2c9defa15 --- /dev/null +++ b/params/params_shard_49.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e62ca4f67de34e1ed63facb8986ec51ddb0b402580d751401d1e4ead8d000fe9 +size 30598144 diff --git a/params/params_shard_5.bin b/params/params_shard_5.bin new file mode 100644 index 0000000000000000000000000000000000000000..d1c41399edbe6ffd77afab58ad02241cc9d46ff9 --- /dev/null +++ b/params/params_shard_5.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32e64b584edf0a1bd68abae0a04f31905cd79aedba9894e55a53642cadaf2a93 +size 56098816 diff --git a/params/params_shard_50.bin b/params/params_shard_50.bin new file mode 100644 index 0000000000000000000000000000000000000000..23cd8d3ee72b80589ec699d640a100ad6a3e13fc --- /dev/null +++ b/params/params_shard_50.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d2bb64a0a2cf33c78b8941e5cb6b8895415a9ea7fe3a28fb7cc3a86f704e90a +size 56098816 diff --git a/params/params_shard_51.bin b/params/params_shard_51.bin new file mode 100644 index 0000000000000000000000000000000000000000..b34fb91f508ed894d70fd03b7320dfc30f8ecf7c --- /dev/null +++ b/params/params_shard_51.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c12c8363a891498608756c1ddb9b0165d8fc54eada88e3f49af921d18820bd7 +size 28049408 diff --git a/params/params_shard_52.bin b/params/params_shard_52.bin new file mode 100644 index 0000000000000000000000000000000000000000..58a915214227b8a612db5ae66d52d186ce9ccf78 --- /dev/null +++ b/params/params_shard_52.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e4dd6e7f3585c1d29398f0a7c5d13c01230d375e999407556f64a11d98ea33c +size 30598144 diff --git a/params/params_shard_53.bin b/params/params_shard_53.bin new file mode 100644 index 0000000000000000000000000000000000000000..5b5963cc29c682f6d278245b3a030765007fc0b2 --- /dev/null +++ b/params/params_shard_53.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6fb58c83bcb8966ed983472b18a01e8d6fb646db52d330f6ea7358409215b36 +size 56098816 diff --git a/params/params_shard_54.bin b/params/params_shard_54.bin new file mode 100644 index 0000000000000000000000000000000000000000..404eb55fe5f4e6982dcbd740cc4fa41d7a68da20 --- /dev/null +++ b/params/params_shard_54.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb85d56f1dd760e21fb6955f20ca4de98ea76a2b9d079fdae84e9d55921c6971 +size 28049408 diff --git a/params/params_shard_55.bin b/params/params_shard_55.bin new file mode 100644 index 0000000000000000000000000000000000000000..25d12ce5501c3364d1e0a8f596fb157b4d3d8a66 --- /dev/null +++ b/params/params_shard_55.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63eb931a69cda39b65fa04fa56dea279d263a19875d67933a73f39909bdd700d +size 30598144 diff --git a/params/params_shard_56.bin b/params/params_shard_56.bin new file mode 100644 index 0000000000000000000000000000000000000000..609980657649782ad8bff077b20a8fd0844dfebd --- /dev/null +++ b/params/params_shard_56.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4fd51661241c3d3b9c361f62f6807dc4d5bf5b254e05ac032bde25cb22222e5 +size 56098816 diff --git a/params/params_shard_57.bin b/params/params_shard_57.bin new file mode 100644 index 0000000000000000000000000000000000000000..8483d82af6509600fd84ee4e7e747e78f59413b1 --- /dev/null +++ b/params/params_shard_57.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e9c09957de67bdc9ac7d0c7d75b00f007ff7db4b24f8ccc2adda9a066d7ac3f +size 28049408 diff --git a/params/params_shard_58.bin b/params/params_shard_58.bin new file mode 100644 index 0000000000000000000000000000000000000000..fc61fdbebb5b00496ed64667fd5b7d2781e0ae01 --- /dev/null +++ b/params/params_shard_58.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f1fb735c1804eefff48f5e08d45c7c2adff1f0f0b3808657da636939c0f2c7f +size 30598144 diff --git a/params/params_shard_59.bin b/params/params_shard_59.bin new file mode 100644 index 0000000000000000000000000000000000000000..1f2f13b53be6ad937422df0464924f39eb9be9e9 --- /dev/null +++ b/params/params_shard_59.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06c76f966300e05d3d6a22e49eaa64365c286d6250c5386aa703a2b6b3c3a7eb +size 56098816 diff --git a/params/params_shard_6.bin b/params/params_shard_6.bin new file mode 100644 index 0000000000000000000000000000000000000000..f11bbc99e740d651544c62f9bb130c83c4b8de50 --- /dev/null +++ b/params/params_shard_6.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:495bee1e6b0ee736258a6c23d298fd32acfa18564c4be86182bc34618204e5aa +size 28049408 diff --git a/params/params_shard_60.bin b/params/params_shard_60.bin new file mode 100644 index 0000000000000000000000000000000000000000..47e40fc26c0517c998790cc5228cbaa48f0d829a --- /dev/null +++ b/params/params_shard_60.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60a3e1382a18decb5d27cd27433c9094be3180b4528fa6fde940f9f8b6443b22 +size 28049408 diff --git a/params/params_shard_61.bin b/params/params_shard_61.bin new file mode 100644 index 0000000000000000000000000000000000000000..9d319d33efe60f61242986e0149201d14c962218 --- /dev/null +++ b/params/params_shard_61.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28de5db63fc26beb38342a441c643dfecaa03a9a7d207aca40c14375717dd194 +size 30598144 diff --git a/params/params_shard_62.bin b/params/params_shard_62.bin new file mode 100644 index 0000000000000000000000000000000000000000..8df77dacc58bdb0437f940114c27335e95dcadd3 --- /dev/null +++ b/params/params_shard_62.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1018ea0b3b52d9b48af41e1a53c5e647ea21e9594578ff5d7c65f294630d1441 +size 56098816 diff --git a/params/params_shard_63.bin b/params/params_shard_63.bin new file mode 100644 index 0000000000000000000000000000000000000000..131c8f1980f4bd1729d8f946e3c8ad1b731149bd --- /dev/null +++ b/params/params_shard_63.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1145f7b7264054bce2b14b3100173059ebf9c4f03785b0c15f8a2efd4de3c215 +size 28049408 diff --git a/params/params_shard_64.bin b/params/params_shard_64.bin new file mode 100644 index 0000000000000000000000000000000000000000..057fcbd8a0dce7ed63b4232fa3d8baa8540cc2a4 --- /dev/null +++ b/params/params_shard_64.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f2dabdea3a4fd65c75def8a5b9dee52ea5dc5311e6d1ca0288ed3c2b3d673be +size 30598144 diff --git a/params/params_shard_65.bin b/params/params_shard_65.bin new file mode 100644 index 0000000000000000000000000000000000000000..04534f216c853e6189afa9d330a628081e67ed9f --- /dev/null +++ b/params/params_shard_65.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adf0cf35987d2959a4481333206a7b1623d97c14f6227030d69a56a86bcc81b1 +size 56098816 diff --git a/params/params_shard_66.bin b/params/params_shard_66.bin new file mode 100644 index 0000000000000000000000000000000000000000..8e3b8e6702276c57598938c7e4e7c5011504c257 --- /dev/null +++ b/params/params_shard_66.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb8ba6fa85be532960e2f995a133884e2ca70b4770e6eee87c055ac79452751a +size 28049408 diff --git a/params/params_shard_67.bin b/params/params_shard_67.bin new file mode 100644 index 0000000000000000000000000000000000000000..7eee2e7df82f52dafa2331df8c64ab65d4fc8766 --- /dev/null +++ b/params/params_shard_67.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c78e20e7c8d429aca5d0a0a4326de3487f1eebeaa6d5acfebfb313ea943379c4 +size 30598144 diff --git a/params/params_shard_68.bin b/params/params_shard_68.bin new file mode 100644 index 0000000000000000000000000000000000000000..ca1f52e9ab6fdcf353693abd7b0bfcc5b8c4574c --- /dev/null +++ b/params/params_shard_68.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:555f10597d1935fb119c4f162dfb8173564685cadcf2ec88b95761e2dd8e1c97 +size 56098816 diff --git a/params/params_shard_69.bin b/params/params_shard_69.bin new file mode 100644 index 0000000000000000000000000000000000000000..08b05d7072a1f2fe726f504b1d36e01aee412193 --- /dev/null +++ b/params/params_shard_69.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1120b2575836d358c6b6be61111d78424e7dd25d5b37068220705098062dd813 +size 28049408 diff --git a/params/params_shard_7.bin b/params/params_shard_7.bin new file mode 100644 index 0000000000000000000000000000000000000000..17092eb5a84fd955e98d4f92a1b04be5af7dcdef --- /dev/null +++ b/params/params_shard_7.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d00bb038421aca04e1e7ec75b7d13a6a0cc115ccc1d11ae6f1d62527e9983011 +size 30598144 diff --git a/params/params_shard_70.bin b/params/params_shard_70.bin new file mode 100644 index 0000000000000000000000000000000000000000..0513ff7c9e5e8289e23d26350950fa84caa90173 --- /dev/null +++ b/params/params_shard_70.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae81d7a0791adfbe048c93e297f681b597ee480a043cbedbaaa94eb73a2b023c +size 30598144 diff --git a/params/params_shard_71.bin b/params/params_shard_71.bin new file mode 100644 index 0000000000000000000000000000000000000000..21bc477fc068841712ed1414836efec2ff2ae560 --- /dev/null +++ b/params/params_shard_71.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a446209e5ed039000e2f27b9004d3495f85fe46a22f3460cee694b7c852d29e5 +size 56098816 diff --git a/params/params_shard_72.bin b/params/params_shard_72.bin new file mode 100644 index 0000000000000000000000000000000000000000..4206ac6ecea6cc67ae3e9e3495cf05958fa2d57b --- /dev/null +++ b/params/params_shard_72.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a3113d78f20b5734066f5ce0cc92e31f4504c0d6e8a009928154f7150cabd86 +size 28049408 diff --git a/params/params_shard_73.bin b/params/params_shard_73.bin new file mode 100644 index 0000000000000000000000000000000000000000..e0bffe63d2bd3ed4b355278c1114451288686d9c --- /dev/null +++ b/params/params_shard_73.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22f7eb8d6457b3df47db450ff2af8afb4e6b6d4f3c8ee0f07cc4e10fda97d214 +size 30598144 diff --git a/params/params_shard_74.bin b/params/params_shard_74.bin new file mode 100644 index 0000000000000000000000000000000000000000..027a57d5bca62470ae01a2ebcb0a7ca2370c298f --- /dev/null +++ b/params/params_shard_74.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a50a00540d3eb9d670802ea5ca89a486e6171768ac391958f0d601ebd61ee4d +size 56098816 diff --git a/params/params_shard_75.bin b/params/params_shard_75.bin new file mode 100644 index 0000000000000000000000000000000000000000..709ad2a947e38982a435446f034c66717509c36e --- /dev/null +++ b/params/params_shard_75.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64555888f8e132e64f80ae52f707b58aab95272ae115afed253990ac683d2557 +size 28049408 diff --git a/params/params_shard_76.bin b/params/params_shard_76.bin new file mode 100644 index 0000000000000000000000000000000000000000..cd057bd4ff3c95da5112af6f72f39c9d6dc44898 --- /dev/null +++ b/params/params_shard_76.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea6c3a551cae0c3275e5f00365f312bfbacbb741607d0a90e03100e09f325f92 +size 30598144 diff --git a/params/params_shard_77.bin b/params/params_shard_77.bin new file mode 100644 index 0000000000000000000000000000000000000000..3d9cb231674af26f8f7fef32626b75bea8355c51 --- /dev/null +++ b/params/params_shard_77.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd814bf9869499b4afffb49541095510ef4559cf36c470e4b57db0727879bc76 +size 56098816 diff --git a/params/params_shard_78.bin b/params/params_shard_78.bin new file mode 100644 index 0000000000000000000000000000000000000000..ea0f1d8f42d03ecf8ce0c53a2189a755f795f252 --- /dev/null +++ b/params/params_shard_78.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fba03d50f2b2acb9e16c6a4be424f253869468c4ce9ee2fdda161deda7ee0763 +size 28049408 diff --git a/params/params_shard_79.bin b/params/params_shard_79.bin new file mode 100644 index 0000000000000000000000000000000000000000..6264cf2dd6c3ad73cbf1a0cfb105754bce465e88 --- /dev/null +++ b/params/params_shard_79.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:726e700bf8880515c162445cbea0d43617f5db2e35301cb82dd1d274270ffd0d +size 30598144 diff --git a/params/params_shard_8.bin b/params/params_shard_8.bin new file mode 100644 index 0000000000000000000000000000000000000000..6b327c88b7b09f6a103fe4ed1b9d1f7496102de2 --- /dev/null +++ b/params/params_shard_8.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e19859659b05e8fdc30b5c7f868c0bc26b08924c36487b05515f2f74a386a61c +size 56098816 diff --git a/params/params_shard_80.bin b/params/params_shard_80.bin new file mode 100644 index 0000000000000000000000000000000000000000..b95199af2a0f95a063971cb20f01ccb082c72e0c --- /dev/null +++ b/params/params_shard_80.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80df60cf09f93a4e77d0dd3fef8ffa9c6b54cbc256b130b723ccc7e0dc3515d4 +size 56098816 diff --git a/params/params_shard_81.bin b/params/params_shard_81.bin new file mode 100644 index 0000000000000000000000000000000000000000..fdf1fc232f6d89af8572821b2582b12aafafa22f --- /dev/null +++ b/params/params_shard_81.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29635671cb10d688c5d3adae541420fcd01c9efb3f0c385d771220aa1c09a785 +size 28049408 diff --git a/params/params_shard_82.bin b/params/params_shard_82.bin new file mode 100644 index 0000000000000000000000000000000000000000..b157036af593892fc2ddf5715ba5510d80f8dc6e --- /dev/null +++ b/params/params_shard_82.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e536d08d575cc6b82c96f3492a802c906b7e34341678b0151e7d39c9d9140832 +size 30598144 diff --git a/params/params_shard_83.bin b/params/params_shard_83.bin new file mode 100644 index 0000000000000000000000000000000000000000..47b1e60e41c136e1652e9bb579d4129bb991f723 --- /dev/null +++ b/params/params_shard_83.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9aec2d06b4818c7d091ab1b1245d544b474d0cc60992997b5967705601713df +size 56098816 diff --git a/params/params_shard_84.bin b/params/params_shard_84.bin new file mode 100644 index 0000000000000000000000000000000000000000..a0f20d0f247df11dd272dd52b2798fe5a3c987e5 --- /dev/null +++ b/params/params_shard_84.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35155d16ae9ad0fa39183b6a919edddf4803e586c20445760519e1f1a9c6cfb0 +size 28049408 diff --git a/params/params_shard_85.bin b/params/params_shard_85.bin new file mode 100644 index 0000000000000000000000000000000000000000..a87a29f5fcaa20d68340a1f20a4e80187bee8ba3 --- /dev/null +++ b/params/params_shard_85.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9567eeeed3472f6d15ed26ca42ab54428f9df63c508edb56bc4f89430e201591 +size 133169152 diff --git a/params/params_shard_86.bin b/params/params_shard_86.bin new file mode 100644 index 0000000000000000000000000000000000000000..2e5f16d5c98373085fc757ce9ad3f6cd57c713ef --- /dev/null +++ b/params/params_shard_86.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e18035c143e90b4db6591cb6a5de16d1e9a202cdd1689916ef8eb0b3d5cd996 +size 19963904 diff --git a/params/params_shard_87.bin b/params/params_shard_87.bin new file mode 100644 index 0000000000000000000000000000000000000000..5de76f3a528b1a5f6b5f0f270212cf74a9d1aead --- /dev/null +++ b/params/params_shard_87.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:690195ef5c0e695fd3105bceed8770c0f422055f745d7e91d38ec7c2ed337c3f +size 16646144 diff --git a/params/params_shard_9.bin b/params/params_shard_9.bin new file mode 100644 index 0000000000000000000000000000000000000000..6ab9cbddde574239d7a8e548888daf92d50e85c5 --- /dev/null +++ b/params/params_shard_9.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:194f963c42dfe46ae628c43148b1d488a1a1abae0bf362dc1293c8ceb5e910a9 +size 28049408 diff --git a/params/tokenizer.model b/params/tokenizer.model new file mode 100644 index 0000000000000000000000000000000000000000..8a8007697b7cc3d3868dcffbbebf8c1f2bd690ba --- /dev/null +++ b/params/tokenizer.model @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7dc4c393423b76e4373e5157ddc34803a0189ba96b21ddbb40269d31468a6f2 +size 1018370 diff --git a/params/tokenizer_config.json b/params/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..79b212c00ecdde03c51bb791f7fdfc25f4176ff3 --- /dev/null +++ b/params/tokenizer_config.json @@ -0,0 +1,12 @@ +{ + "name_or_path": "THUDM/chatglm2-6b", + "remove_space": false, + "do_lower_case": false, + "tokenizer_class": "ChatGLMTokenizer", + "auto_map": { + "AutoTokenizer": [ + "tokenization_chatglm.ChatGLMTokenizer", + null + ] + } +}