diff --git a/README.md b/README.md index 0da1f9dbdd674dc9362c9c5559bb8227248950f6..d37c929983c31f0dd0c7bc385979356b3158b401 100644 --- a/README.md +++ b/README.md @@ -7,18 +7,13 @@ tags: - encoder-decoder --- -https://github.com/peytontolbert/agent_kernel - - -http://peytontolbert.com/agent_kernel/ - # AgentKernel Lite Encoder-Decoder Browser BitNet Self-contained browser BitNet export for the AgentKernel Lite chat model. -- Source bundle: `/data/agentkernel/artifacts/agentkernel_lite_encdec/decoder_repair_respond_clean_from_freezeemb_retrieval2000_train_01500` +- Source bundle: `/data/agentkernel/artifacts/agentkernel_lite_encdec/recommendation_answer_v11_exact_twopass_from_v9_train_00200_lr2e6` - Parameters before BitNet packing: `113507328` -- Final eval loss: `0.9985759307940801` +- Final eval loss: `0.0016785785555839539` - Browser entrypoint: `manifest.json` - Runtime: Model Stack browser BitNet WebGPU encoder-decoder with packed BitNet WASM fallback - Tokenizer: AgentKernel byte-level BPE attached under `tokenizer/` @@ -26,7 +21,7 @@ Self-contained browser BitNet export for the AgentKernel Lite chat model. Web app route after uploading this directory to Hugging Face: ```text -?modelStackManifest=https://huggingface.co/PeytonT/agentkernel-lite-100m-bitnet/resolve/main/manifest.json +?modelStackManifest=https://huggingface.co///resolve/main/manifest.json ``` Serving notes: WebGPU is used when available; Safari or other no-WebGPU browsers use the packed BitNet WASM fallback. Large model files are fetched by the browser and cached by the app. diff --git a/agentkernel_lite_browser_bitnet_export.json b/agentkernel_lite_browser_bitnet_export.json index 20ab930dfc1ceaaebd3f28cbb8b12a7b456576a3..0713b7d55ea90e1fdd566b68818d74db9d7d6490 100644 --- a/agentkernel_lite_browser_bitnet_export.json +++ b/agentkernel_lite_browser_bitnet_export.json @@ -1,15 +1,18 @@ { "artifact_kind": "agentkernel_lite_browser_bitnet_export", + "dense_dtype": "float32", + "dense_float32_include": [], "dense_tensor_count": 43, - "device": "cuda:1", + "device": "cpu", "format": "model-stack-browser-bitnet", "layer_count": 109, - "manifest_path": "/data/agentkernel/artifacts/agentkernel_lite_encdec/decoder_repair_respond_clean_from_freezeemb_retrieval2000_train_01500/browser_bitnet/manifest.json", + "manifest_path": "/data/agentkernel/artifacts/agentkernel_lite_encdec/recommendation_answer_v11_exact_twopass_from_v9_train_00200_lr2e6/browser_bitnet_hf/manifest.json", "max_seq_len": 1024, "model": { "activation": "silu", + "agent_policy_heads": false, "attention_bias": false, - "attn_dropout": 0.0, + "attn_dropout": 0.05, "attn_impl": "eager", "d_ff": 2048, "d_model": 640, @@ -19,13 +22,16 @@ "kv_cache_paged": true, "masking": "build_causal_mask", "max_position_embeddings": 4096, + "mlp_dropout": 0.03, "n_heads": 10, "n_kv_heads": null, "n_layers": 6, "norm": "layer", "pad_token_id": 0, "positional": "apply_rotary", + "resid_dropout": 0.03, "residual": "prenorm", + "retrieval_head_dim": null, "rms_norm_eps": 1e-06, "rope_attention_scaling": null, "rope_scaling_factor": null, @@ -39,7 +45,9 @@ "version": 1, "vocab_size": 8207 }, - "output_dir": "/data/agentkernel/artifacts/agentkernel_lite_encdec/decoder_repair_respond_clean_from_freezeemb_retrieval2000_train_01500/browser_bitnet", + "output_dir": "/data/agentkernel/artifacts/agentkernel_lite_encdec/recommendation_answer_v11_exact_twopass_from_v9_train_00200_lr2e6/browser_bitnet_hf", + "quant_exclude": [], + "quant_include": [], "quantization": { "activation_quant": "none", "modules": [ @@ -158,10 +166,11 @@ "spin": false, "weight_opt": "none" }, - "size_bytes": 80235516, - "source_bundle_manifest_path": "/data/agentkernel/artifacts/agentkernel_lite_encdec/decoder_repair_respond_clean_from_freezeemb_retrieval2000_train_01500/agentkernel_lite_encdec_manifest.json", - "source_model_dir": "/data/agentkernel/artifacts/agentkernel_lite_encdec/decoder_repair_respond_clean_from_freezeemb_retrieval2000_train_01500/model", - "source_tokenizer_dir": "/data/agentkernel/artifacts/agentkernel_lite_encdec/decoder_repair_respond_clean_from_freezeemb_retrieval2000_train_01500/tokenizer", + "quantize_bitnet": true, + "size_bytes": 80257831, + "source_bundle_manifest_path": "/data/agentkernel/artifacts/agentkernel_lite_encdec/recommendation_answer_v11_exact_twopass_from_v9_train_00200_lr2e6/agentkernel_lite_encdec_manifest.json", + "source_model_dir": "/data/agentkernel/artifacts/agentkernel_lite_encdec/recommendation_answer_v11_exact_twopass_from_v9_train_00200_lr2e6/model", + "source_tokenizer_dir": "/data/agentkernel/artifacts/agentkernel_lite_encdec/recommendation_answer_v11_exact_twopass_from_v9_train_00200_lr2e6/tokenizer", "tokenizer": { "bos_token_id": 1, "config_path": "tokenizer/tokenizer_config.json", @@ -173,6 +182,6 @@ "unk_token_id": 3, "vocab_size": 8207 }, - "webapp_manifest_path": "/data/repository_library/exports/agent_kernel/models/agentkernel_lite_100m_bitnet_15000/manifest.json", - "webapp_model_dir": "/data/repository_library/exports/agent_kernel/models/agentkernel_lite_100m_bitnet_15000" + "webapp_manifest_path": "/data/repository_library/exports/agent_kernel/models/agentkernel_lite_100m_bitnet_v11/manifest.json", + "webapp_model_dir": "/data/repository_library/exports/agent_kernel/models/agentkernel_lite_100m_bitnet_v11" } \ No newline at end of file diff --git a/dense/dec_embed_weight.f32.bin b/dense/dec_embed_weight.f32.bin index 45ae6abd11409ec953b3484953b0afd1c32e636a..989775d5f09ae65c31ccc4acfb36659942d63541 100644 --- a/dense/dec_embed_weight.f32.bin +++ b/dense/dec_embed_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d0b2d9d06dc96048cff8f30867bc4c520bcb7586df46a0325c95b6a93a84aeeb -size 21066240 +oid sha256:78c2a80005b8926af3752edc2ab4c56399688951a282a6b85bf9edbf917fe6df +size 21009920 diff --git a/dense/dec_norm_bias.f32.bin b/dense/dec_norm_bias.f32.bin index 0a19f774863139ecdc007010d12dcd102749db11..3622e96e24f8e325877e840563774d38968eeb70 100644 --- a/dense/dec_norm_bias.f32.bin +++ b/dense/dec_norm_bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bc56aaf3ca92b1288564ce350a4714e94a6021ab1a54402de1644d717312a755 +oid sha256:5b5e96cac42589a663a9f5682082013889507d15b2134376aa286c1c002b7fcf size 2560 diff --git a/dense/dec_norm_weight.f32.bin b/dense/dec_norm_weight.f32.bin index 8f4505aa6b649ec05b6abe5b318c93f47736cdaf..090e714b93eff0f23d3cee7287f75cf2387dc2e6 100644 --- a/dense/dec_norm_weight.f32.bin +++ b/dense/dec_norm_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9db5943f63cd2d6154e730c9fed0f644a1bbf7c7ed77add76e90b84c1aa4ef3b +oid sha256:f3007750a249fff13b6d5325bdec87cf3e823d773e9b4ddd8661358e1c88bc4a size 2560 diff --git a/dense/decoder_0_cross_block_n1_weight.f32.bin b/dense/decoder_0_cross_block_n1_weight.f32.bin index 457148a1aff804511df2e19a2c56d9efc89433d3..26b5daafbbebb31750cc0a30637ce6279ab7e507 100644 --- a/dense/decoder_0_cross_block_n1_weight.f32.bin +++ b/dense/decoder_0_cross_block_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:891fb6b04974c8b901b28c09ae7ea6e5e0cdc726a71f6d17b07f1a375d4426da +oid sha256:9e321bd4b5815ad26ae4a2c222d73c2bd84b44c67aa3ba4a3e7425389c6eb783 size 2560 diff --git a/dense/decoder_0_cross_block_n2_weight.f32.bin b/dense/decoder_0_cross_block_n2_weight.f32.bin index 62d547b0de05fb6062d7525b5dff991be54ce1ee..ac7ccf85388afd26af2d255870c3a203c515e34a 100644 --- a/dense/decoder_0_cross_block_n2_weight.f32.bin +++ b/dense/decoder_0_cross_block_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1a719c7ed5cf7db904f9077ad94985d06a65e2d38a64340465579147ffbac8c5 +oid sha256:e44330e6d5b15cb95b080f739e6fe708f9915ebfc33cab76c01c6c4c2bb4e51e size 2560 diff --git a/dense/decoder_0_self_attn_block_attn__rope_cos.f32.bin b/dense/decoder_0_self_attn_block_attn__rope_cos.f32.bin deleted file mode 100644 index f1b59ec62beda40196f73de80338b8e0d7c87097..0000000000000000000000000000000000000000 --- a/dense/decoder_0_self_attn_block_attn__rope_cos.f32.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6ad88ae23144aafc9b0fb5dbe306afcfdccb11fcf4909a512eb46125ce9f0d5b -size 131072 diff --git a/dense/decoder_0_self_attn_block_attn__rope_sin.f32.bin b/dense/decoder_0_self_attn_block_attn__rope_sin.f32.bin deleted file mode 100644 index 03f25aa4301fafb62f299dcc47169442a478c068..0000000000000000000000000000000000000000 --- a/dense/decoder_0_self_attn_block_attn__rope_sin.f32.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b7e60ef23d3ccabcb925a970b51fbeaed34dbd48374a45476f3212d61fc7407f -size 131072 diff --git a/dense/decoder_0_self_attn_block_n1_weight.f32.bin b/dense/decoder_0_self_attn_block_n1_weight.f32.bin index 4a5f5ca9879fe684a59270d6263fd060ee8b1982..886d6711c557d6a65c22fc8bfa3b8797118d823f 100644 --- a/dense/decoder_0_self_attn_block_n1_weight.f32.bin +++ b/dense/decoder_0_self_attn_block_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3ecfb7e994fc3be415d9ca72f228f0a6fe1bac9ed350e75ae883ac75d4c5a431 +oid sha256:aa1687c4e058f3c05d691ed6f33ca18be4ec4ca67ddfe2806b29bc4926a06d87 size 2560 diff --git a/dense/decoder_0_self_attn_block_n2_weight.f32.bin b/dense/decoder_0_self_attn_block_n2_weight.f32.bin index e50a97383ee5c6b4dee22e22b95a13f37f886785..74b316e08c83f42bb1f8c9758bd7cb91c4ab1e19 100644 --- a/dense/decoder_0_self_attn_block_n2_weight.f32.bin +++ b/dense/decoder_0_self_attn_block_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:33d786b3efc9c3443b12cd66a09c63bd595e18ec0c9eb07fae38297f7005bf84 +oid sha256:aaf84ca53571564ef264cd69f05f68a5feae20d67c51111440aa38971a927f0a size 2560 diff --git a/dense/decoder_1_cross_block_n1_weight.f32.bin b/dense/decoder_1_cross_block_n1_weight.f32.bin index b8f7eb544e66b9012e3b9f0e17b89637e16de3d8..10505ae0eed5d0cc2177b9bb12c8a4b6cd6f3b55 100644 --- a/dense/decoder_1_cross_block_n1_weight.f32.bin +++ b/dense/decoder_1_cross_block_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cbd55183838a8ab6e77bb181eeb8cf43c54e6fdec064a948915193df754f7cf9 +oid sha256:3ea07312d131aecfcf9aeca759f7da272db7f8669faaea13adaa03af9e74cdf7 size 2560 diff --git a/dense/decoder_1_cross_block_n2_weight.f32.bin b/dense/decoder_1_cross_block_n2_weight.f32.bin index 33c30617c9c024155490f9cc905147ce06f259b3..05652d9691d9097b0e6fd6286fba7c67db5fcfed 100644 --- a/dense/decoder_1_cross_block_n2_weight.f32.bin +++ b/dense/decoder_1_cross_block_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5e01f19710f000878795ab523b271d8b34893f6c377f610bdd0eba9f18574a70 +oid sha256:a2d7b097f261522851525b00d4df45ee76aba6fd6d1c467bc592e7c75f7d0e21 size 2560 diff --git a/dense/decoder_1_self_attn_block_attn__rope_cos.f32.bin b/dense/decoder_1_self_attn_block_attn__rope_cos.f32.bin deleted file mode 100644 index f1b59ec62beda40196f73de80338b8e0d7c87097..0000000000000000000000000000000000000000 --- a/dense/decoder_1_self_attn_block_attn__rope_cos.f32.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6ad88ae23144aafc9b0fb5dbe306afcfdccb11fcf4909a512eb46125ce9f0d5b -size 131072 diff --git a/dense/decoder_1_self_attn_block_attn__rope_sin.f32.bin b/dense/decoder_1_self_attn_block_attn__rope_sin.f32.bin deleted file mode 100644 index 03f25aa4301fafb62f299dcc47169442a478c068..0000000000000000000000000000000000000000 --- a/dense/decoder_1_self_attn_block_attn__rope_sin.f32.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b7e60ef23d3ccabcb925a970b51fbeaed34dbd48374a45476f3212d61fc7407f -size 131072 diff --git a/dense/decoder_1_self_attn_block_n1_weight.f32.bin b/dense/decoder_1_self_attn_block_n1_weight.f32.bin index 546fb364a79944b593d74ae089050dda5a56dcc4..7317edc286597aece75db7df67fac8a687f797bf 100644 --- a/dense/decoder_1_self_attn_block_n1_weight.f32.bin +++ b/dense/decoder_1_self_attn_block_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3ce6ed00aee268de7d08e6e9acdecb2ce494e53740f49b397653063f65708af9 +oid sha256:6e04d7ae884588db5de7ef2072346f6e8b2066b26ed9f5847645221ed9539942 size 2560 diff --git a/dense/decoder_1_self_attn_block_n2_weight.f32.bin b/dense/decoder_1_self_attn_block_n2_weight.f32.bin index ec90ceebf9fff168ab1f15d330a8d67cc7d213ce..4de4e536a23a8fbfd2dd2699ea90ba355ba96786 100644 --- a/dense/decoder_1_self_attn_block_n2_weight.f32.bin +++ b/dense/decoder_1_self_attn_block_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3aff504c8c158ad32e0d53fcde49f9c3d9d2c6d8c6ffac4793913ab8e9fc351f +oid sha256:c0b1278f7154bf8b2234bdd368fbce9e7bd74601a1c793f56fa4f3586a7f7b73 size 2560 diff --git a/dense/decoder_2_cross_block_n1_weight.f32.bin b/dense/decoder_2_cross_block_n1_weight.f32.bin index 66219981be6137921e1686956c737b2dd0d7892f..e7c7d6bf4d7e83092b4b50639827532a51e8a38d 100644 --- a/dense/decoder_2_cross_block_n1_weight.f32.bin +++ b/dense/decoder_2_cross_block_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:074691158ffb33267b6d1515d51dfccffd776d308d77ca10cd42f5c9e11d16b3 +oid sha256:28376ace409fa2952ac2990043be9b9c983aea3195e64ca73a2c6ba4a7679303 size 2560 diff --git a/dense/decoder_2_cross_block_n2_weight.f32.bin b/dense/decoder_2_cross_block_n2_weight.f32.bin index a513cc54005de59d1644b1c8ea6221411a10ab14..2db1410596c033c7d829c6e1f9d2ee31574b2b61 100644 --- a/dense/decoder_2_cross_block_n2_weight.f32.bin +++ b/dense/decoder_2_cross_block_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:252019fc3c4e0a4b6e8d3b4a6612fa119688c8dda754f204055cd8276a1136ac +oid sha256:1feefaae8826e4c2ad02d385f9b805519b96a7db7fe49052f1f8a8c693309339 size 2560 diff --git a/dense/decoder_2_self_attn_block_attn__rope_cos.f32.bin b/dense/decoder_2_self_attn_block_attn__rope_cos.f32.bin deleted file mode 100644 index f1b59ec62beda40196f73de80338b8e0d7c87097..0000000000000000000000000000000000000000 --- a/dense/decoder_2_self_attn_block_attn__rope_cos.f32.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6ad88ae23144aafc9b0fb5dbe306afcfdccb11fcf4909a512eb46125ce9f0d5b -size 131072 diff --git a/dense/decoder_2_self_attn_block_attn__rope_sin.f32.bin b/dense/decoder_2_self_attn_block_attn__rope_sin.f32.bin deleted file mode 100644 index 03f25aa4301fafb62f299dcc47169442a478c068..0000000000000000000000000000000000000000 --- a/dense/decoder_2_self_attn_block_attn__rope_sin.f32.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b7e60ef23d3ccabcb925a970b51fbeaed34dbd48374a45476f3212d61fc7407f -size 131072 diff --git a/dense/decoder_2_self_attn_block_n1_weight.f32.bin b/dense/decoder_2_self_attn_block_n1_weight.f32.bin index 71e05fbf9bed9d1658d0fdf0a402405298868372..faa93371e998f8e6d7b7e222e78ffb0d48f98b89 100644 --- a/dense/decoder_2_self_attn_block_n1_weight.f32.bin +++ b/dense/decoder_2_self_attn_block_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:142d7795a7359da525adde3aa5342706ad7fddf0f79e984b0d6f95a3fb7074ec +oid sha256:3731b30effc4197d021d7ed55349454c585246d030d74d9299b07aafa7b367d6 size 2560 diff --git a/dense/decoder_2_self_attn_block_n2_weight.f32.bin b/dense/decoder_2_self_attn_block_n2_weight.f32.bin index f4f5d38fbd0464ae80ed5a194559543c7a9b3e12..3201c70a4e87c4878423b1d8df408270fb26eac4 100644 --- a/dense/decoder_2_self_attn_block_n2_weight.f32.bin +++ b/dense/decoder_2_self_attn_block_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b5c5cb7840e3107062925817a43bd242b3fe2fd4a7786cc1a9460d9312c1b6eb +oid sha256:632df68307a27cfc2054c13a9b511180dce6e735c8c79dc6a420e984ffcc385c size 2560 diff --git a/dense/decoder_3_cross_block_n1_weight.f32.bin b/dense/decoder_3_cross_block_n1_weight.f32.bin index c07649466c8094a95dabe08acdb301435456ddda..41bbd30eae01f1c1bf2f1f46ee7f80ce52566d24 100644 --- a/dense/decoder_3_cross_block_n1_weight.f32.bin +++ b/dense/decoder_3_cross_block_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:15ae5917f2aa04cc28786948c54d7375493275ebabe9e5ffc2d6b53825b7776f +oid sha256:9e8c667419c8df40c09c7e194573444198f3e0f8d057e61e301b293928695560 size 2560 diff --git a/dense/decoder_3_cross_block_n2_weight.f32.bin b/dense/decoder_3_cross_block_n2_weight.f32.bin index db3e63562af832dc53e58393803ce4b9aa9467b2..1f06ed42face3b870bd41a2a7f8e4dea6511d51c 100644 --- a/dense/decoder_3_cross_block_n2_weight.f32.bin +++ b/dense/decoder_3_cross_block_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:caccd589d5a01abd27c8661e131ee691f8b6559a4330aeee886cb0492a73aeb3 +oid sha256:770f911b6ec49b1da40240580ffac220c6308585bb36d1151a6623a5d46ef740 size 2560 diff --git a/dense/decoder_3_self_attn_block_attn__rope_cos.f32.bin b/dense/decoder_3_self_attn_block_attn__rope_cos.f32.bin deleted file mode 100644 index f1b59ec62beda40196f73de80338b8e0d7c87097..0000000000000000000000000000000000000000 --- a/dense/decoder_3_self_attn_block_attn__rope_cos.f32.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6ad88ae23144aafc9b0fb5dbe306afcfdccb11fcf4909a512eb46125ce9f0d5b -size 131072 diff --git a/dense/decoder_3_self_attn_block_attn__rope_sin.f32.bin b/dense/decoder_3_self_attn_block_attn__rope_sin.f32.bin deleted file mode 100644 index 03f25aa4301fafb62f299dcc47169442a478c068..0000000000000000000000000000000000000000 --- a/dense/decoder_3_self_attn_block_attn__rope_sin.f32.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b7e60ef23d3ccabcb925a970b51fbeaed34dbd48374a45476f3212d61fc7407f -size 131072 diff --git a/dense/decoder_3_self_attn_block_n1_weight.f32.bin b/dense/decoder_3_self_attn_block_n1_weight.f32.bin index bf98c1c0a090301ab25f8c9857ab68f4c1555b04..54dd34f73265625f348f1c7548a53e5b6fcc9dc3 100644 --- a/dense/decoder_3_self_attn_block_n1_weight.f32.bin +++ b/dense/decoder_3_self_attn_block_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0ee7056ae2fdd0937969db21841862681e470303fa423918e28d426c6ea032dc +oid sha256:083fed8849ddd08ad81f0dd422aadfb0570d1f11079073bf2f85121fcdd57274 size 2560 diff --git a/dense/decoder_3_self_attn_block_n2_weight.f32.bin b/dense/decoder_3_self_attn_block_n2_weight.f32.bin index 8c85d2c4b6f97fb97044d3f466ee8b6dbbad7a25..bd7108fd87bc50abfe0c6fe0106bc09861d28b73 100644 --- a/dense/decoder_3_self_attn_block_n2_weight.f32.bin +++ b/dense/decoder_3_self_attn_block_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a560a1dede092c8a7dde8fa9b96baa535ef09c717dfbd8943a0d15b326d9f9d5 +oid sha256:115676e9f45a24b93168c64e085aedcadfa8fe199d1a2b06b9ca67ba3615385c size 2560 diff --git a/dense/decoder_4_cross_block_n1_weight.f32.bin b/dense/decoder_4_cross_block_n1_weight.f32.bin index 49ea8c254f622ba8c53fdd0a55c907c5a39056c1..cee5ac597b25f5d51a987a2142c074f5dc2e8a4a 100644 --- a/dense/decoder_4_cross_block_n1_weight.f32.bin +++ b/dense/decoder_4_cross_block_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c043209537341e6dc5f41dcf6a351fb4265565500d454fe64c667ac7b06c7e33 +oid sha256:b15ddc920e96f925d4bb97e943a92a38605ffd1e1f5a74373654daef985e377d size 2560 diff --git a/dense/decoder_4_cross_block_n2_weight.f32.bin b/dense/decoder_4_cross_block_n2_weight.f32.bin index 4cc6e94e234ba8991872dc4179c84263f0f76dd3..016906a2e277e5f166ed58243ba645a715f2583b 100644 --- a/dense/decoder_4_cross_block_n2_weight.f32.bin +++ b/dense/decoder_4_cross_block_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:598e5457b0d29193b07509b15b611a39769cdd37c70e35c9ef33339988c1541c +oid sha256:23021c9331a4ec203014d4d33f2a846ad81702b6da07a3fdcaab2ef30a4d73f6 size 2560 diff --git a/dense/decoder_4_self_attn_block_attn__rope_cos.f32.bin b/dense/decoder_4_self_attn_block_attn__rope_cos.f32.bin deleted file mode 100644 index f1b59ec62beda40196f73de80338b8e0d7c87097..0000000000000000000000000000000000000000 --- a/dense/decoder_4_self_attn_block_attn__rope_cos.f32.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6ad88ae23144aafc9b0fb5dbe306afcfdccb11fcf4909a512eb46125ce9f0d5b -size 131072 diff --git a/dense/decoder_4_self_attn_block_attn__rope_sin.f32.bin b/dense/decoder_4_self_attn_block_attn__rope_sin.f32.bin deleted file mode 100644 index 03f25aa4301fafb62f299dcc47169442a478c068..0000000000000000000000000000000000000000 --- a/dense/decoder_4_self_attn_block_attn__rope_sin.f32.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b7e60ef23d3ccabcb925a970b51fbeaed34dbd48374a45476f3212d61fc7407f -size 131072 diff --git a/dense/decoder_4_self_attn_block_n1_weight.f32.bin b/dense/decoder_4_self_attn_block_n1_weight.f32.bin index 679cfc453b6757b44f47fb6fad46b276a2fa6ee2..20d0bae05ad4149dabc069ea10201d828da816d0 100644 --- a/dense/decoder_4_self_attn_block_n1_weight.f32.bin +++ b/dense/decoder_4_self_attn_block_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:77f69a1f0ab7f6664172e335f1bacbede678a34d59234098b531a41f08eda87a +oid sha256:f3ae1bf89ed7cdb798ec9b786ff358f126b58fb7fb6fa2b93d217a243318aeee size 2560 diff --git a/dense/decoder_4_self_attn_block_n2_weight.f32.bin b/dense/decoder_4_self_attn_block_n2_weight.f32.bin index 2fda57a186eecb5dc47f58646c4391d38360cbad..f1c4b77cacbc9542b23491e957ab9c90ba737a7a 100644 --- a/dense/decoder_4_self_attn_block_n2_weight.f32.bin +++ b/dense/decoder_4_self_attn_block_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2c4fcbc99f4fcf2182c7ed689ef906b7135326b75644ba9155239e6ca65c1591 +oid sha256:7161e760f5e51f0e019f3ddf6285c1d31819100682234328ad54c9f3fb26768c size 2560 diff --git a/dense/decoder_5_cross_block_n1_weight.f32.bin b/dense/decoder_5_cross_block_n1_weight.f32.bin index 8c7f24cc90288250912a64a3481523253c3a104e..ceaea2850948b11c6532213fb64fa1f8f5a16356 100644 --- a/dense/decoder_5_cross_block_n1_weight.f32.bin +++ b/dense/decoder_5_cross_block_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:744b9f0653545a86ed4b7f963023c78c74637332d473b374e61fa19d72795ca7 +oid sha256:b49407ae4ad043d9c524839c8e197cfaed22ac0f9755458fc8dfb5f9501f62e5 size 2560 diff --git a/dense/decoder_5_cross_block_n2_weight.f32.bin b/dense/decoder_5_cross_block_n2_weight.f32.bin index c1ff865fb2734d2de2a2b828d62086c71ca87ec2..53224c5436f7d9fab730cce4a66e107a43bc4e4c 100644 --- a/dense/decoder_5_cross_block_n2_weight.f32.bin +++ b/dense/decoder_5_cross_block_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:41b98dd7de3c29b4b66996542d2b1f835d8729bcd09ae96689de78daa16c2041 +oid sha256:d7c9bf8b3e50171e0aa8882bc82629636d6afaa7ce2b36f3612a9a79e40a5840 size 2560 diff --git a/dense/decoder_5_self_attn_block_attn__rope_cos.f32.bin b/dense/decoder_5_self_attn_block_attn__rope_cos.f32.bin deleted file mode 100644 index f1b59ec62beda40196f73de80338b8e0d7c87097..0000000000000000000000000000000000000000 --- a/dense/decoder_5_self_attn_block_attn__rope_cos.f32.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6ad88ae23144aafc9b0fb5dbe306afcfdccb11fcf4909a512eb46125ce9f0d5b -size 131072 diff --git a/dense/decoder_5_self_attn_block_attn__rope_sin.f32.bin b/dense/decoder_5_self_attn_block_attn__rope_sin.f32.bin deleted file mode 100644 index 03f25aa4301fafb62f299dcc47169442a478c068..0000000000000000000000000000000000000000 --- a/dense/decoder_5_self_attn_block_attn__rope_sin.f32.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b7e60ef23d3ccabcb925a970b51fbeaed34dbd48374a45476f3212d61fc7407f -size 131072 diff --git a/dense/decoder_5_self_attn_block_n1_weight.f32.bin b/dense/decoder_5_self_attn_block_n1_weight.f32.bin index e5be877c8a434b25a462c203715ee4c60ef97725..fd9059fd2d3675c35dbde96ea1b0d3b35e54f7fb 100644 --- a/dense/decoder_5_self_attn_block_n1_weight.f32.bin +++ b/dense/decoder_5_self_attn_block_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1fa85cc37348e322bb9b80bd0c8775dabc0e8ca898919c86bc3092effd31b7d1 +oid sha256:5ab4801dfa1f732a06dd0d14acfa620dbcec11568fdf8c5e333b0deb154f1a51 size 2560 diff --git a/dense/decoder_5_self_attn_block_n2_weight.f32.bin b/dense/decoder_5_self_attn_block_n2_weight.f32.bin index f4048ca46a3ca876a006c899496f05db62a9da34..b87092d3b3f239d5616c08e1694713ffdc7b439f 100644 --- a/dense/decoder_5_self_attn_block_n2_weight.f32.bin +++ b/dense/decoder_5_self_attn_block_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2277d03a4376433872684796edfa38c6636a096944d5d8c9031b2f13bdcec68f +oid sha256:c5666fab5237df5532e10c7c08ecd276dce4be357b11819655deea19d3d6b0e9 size 2560 diff --git a/dense/enc_embed_weight.f32.bin b/dense/enc_embed_weight.f32.bin index 45ae6abd11409ec953b3484953b0afd1c32e636a..989775d5f09ae65c31ccc4acfb36659942d63541 100644 --- a/dense/enc_embed_weight.f32.bin +++ b/dense/enc_embed_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d0b2d9d06dc96048cff8f30867bc4c520bcb7586df46a0325c95b6a93a84aeeb -size 21066240 +oid sha256:78c2a80005b8926af3752edc2ab4c56399688951a282a6b85bf9edbf917fe6df +size 21009920 diff --git a/dense/enc_norm_bias.f32.bin b/dense/enc_norm_bias.f32.bin index 527d4418ba82835e914930297664f7517f71015a..1174610675f6f6153ef9433e7be3c3cd8a71ae45 100644 --- a/dense/enc_norm_bias.f32.bin +++ b/dense/enc_norm_bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0f7a17d8d5a7e35c03338862b11b135d1a0816358f766706d2f83179d4bafc40 +oid sha256:73c7b6e76072acad2244afc73657d29377fd189a8af9bc41daa14aabb346606a size 2560 diff --git a/dense/enc_norm_weight.f32.bin b/dense/enc_norm_weight.f32.bin index e802b50c656eb60f88fd6b18091fba4147da6c92..cc9c7179c558281858559d09d4a2d2ac85bf1aa1 100644 --- a/dense/enc_norm_weight.f32.bin +++ b/dense/enc_norm_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:323e132c6135d519e191f4e98eaef83861db8531b4971f7dbc32686258e791c0 +oid sha256:fbce78fa3910cca15c0bec29f929009612f7f5b94d1d083771ed0b114bb2a337 size 2560 diff --git a/dense/enc_pos_embed_weight.f32.bin b/dense/enc_pos_embed_weight.f32.bin new file mode 100644 index 0000000000000000000000000000000000000000..570e24ddcd3c1749e30d118291338c6af4e5efc2 --- /dev/null +++ b/dense/enc_pos_embed_weight.f32.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41e06124cce8055432e8e6a7a9a9a2a6e39ac672071f23dea5872bd19c51e4d9 +size 10485760 diff --git a/dense/encoder_0_n1_weight.f32.bin b/dense/encoder_0_n1_weight.f32.bin index bcbe3323b9661541bd7c5b3bd2bcc0f226cac127..bfe3df8fa1f30c6b817595e1e2c167b5477c082e 100644 --- a/dense/encoder_0_n1_weight.f32.bin +++ b/dense/encoder_0_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a2fca0cec706dcc674c02b5ecb68458f347cc18cbe0b5783ba08764863ca1211 +oid sha256:146bdd3c5419ea957cba0919904c3fa3a18345399e1190e38b1697c5bc56a18e size 2560 diff --git a/dense/encoder_0_n2_weight.f32.bin b/dense/encoder_0_n2_weight.f32.bin index c383d998c9e9d953b2a3a864d822755b90f577bf..d9827eda87b4e8974da478bc04cbc15bf8bf86a8 100644 --- a/dense/encoder_0_n2_weight.f32.bin +++ b/dense/encoder_0_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e5592bab55e8eae12dbc21470a64a4f145450f19bd28292ec789863278e122e8 +oid sha256:2817160dc2b42d5f8de29fb566ed4165dff109f084f8a5af1766e544a7fea509 size 2560 diff --git a/dense/encoder_1_n1_weight.f32.bin b/dense/encoder_1_n1_weight.f32.bin index e697d38db6d489f028c3949618b5025f48b21d72..56cf81d4203ff908433209e35729a3f93771d91d 100644 --- a/dense/encoder_1_n1_weight.f32.bin +++ b/dense/encoder_1_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9efa97efc788129bea077cbe83a7d35ce84e7d90a5cdbfd87f490fbf9bd26b3d +oid sha256:4b3b5cbb90b337e7c217bfe73872429a99ef7aaeda0743a01e7c78b496abce08 size 2560 diff --git a/dense/encoder_1_n2_weight.f32.bin b/dense/encoder_1_n2_weight.f32.bin index 395458ff8c3f4b71f6963951ad5f9358e70664d5..c0eb4495f190f58ba91204c285fad3c458076032 100644 --- a/dense/encoder_1_n2_weight.f32.bin +++ b/dense/encoder_1_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:80da1c04bd2f7b3f1784986cfdd88a86f4a820b2e0c6ebd1b6b1ac4b7bb59645 +oid sha256:2030393e0c8cc4554a10187e03f03e541a380227d3b64c3f6455aa23d8295be6 size 2560 diff --git a/dense/encoder_2_n1_weight.f32.bin b/dense/encoder_2_n1_weight.f32.bin index 52d91fb936100e5762f0082b60ddc445b170ee24..0eda91b2903b1d9f1fc84ed7915f043d16dc51c1 100644 --- a/dense/encoder_2_n1_weight.f32.bin +++ b/dense/encoder_2_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:73b9240c3a6ceb6a628d5b63cb7cee6f5f4f0e1506d3e59ce8422692f9afe87b +oid sha256:203d16e2f34a9fb6059e24d8bde0b3d2e85e8edbeaecb2eac7c647b9c81f1dde size 2560 diff --git a/dense/encoder_2_n2_weight.f32.bin b/dense/encoder_2_n2_weight.f32.bin index 0929a5dbdcc11bb38b59c56076ba8e9ae2e1c24f..908ff35f29dd10ebdc88b85e2726195662c765ea 100644 --- a/dense/encoder_2_n2_weight.f32.bin +++ b/dense/encoder_2_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d4af0825ded821252546f8d1c587f59d9108b6ad5b3fec91f49de34dbf827133 +oid sha256:a223438f7de8e65465b9c95605748e0152bc1b92d77b72d3af2a41d9ff108927 size 2560 diff --git a/dense/encoder_3_n1_weight.f32.bin b/dense/encoder_3_n1_weight.f32.bin index dc75326c7456754f734fa6770105a5f5dd37b033..b85d1397db1b0f983c31c817a3266aa85991e722 100644 --- a/dense/encoder_3_n1_weight.f32.bin +++ b/dense/encoder_3_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f7c7eafb79d56604c3b69489b6b4a0147df80e7a2b615f86be7b16b985c6a5de +oid sha256:6f97f7dc429e26a0e2950787e5ec7c9fa3c3ab9b8ddd0fc1279c19908fdb9868 size 2560 diff --git a/dense/encoder_3_n2_weight.f32.bin b/dense/encoder_3_n2_weight.f32.bin index c848b2eaf352df1106aa51288388c3fdcb43da4e..93b047e41e67d50a7a06051f71b2229c46fadad0 100644 --- a/dense/encoder_3_n2_weight.f32.bin +++ b/dense/encoder_3_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5f69753e55446c6c2229018625ad180851a84470fbdb5c89e34f3c4424b17906 +oid sha256:9754f40fc928fdca4359684c41888d1b3d6af817936af59b161f3824b32534ff size 2560 diff --git a/dense/encoder_4_n1_weight.f32.bin b/dense/encoder_4_n1_weight.f32.bin index ad0c270dec560a99ad36656229bea6c4af4bda3b..6767761c92eb82f978cd16220ae11176113c7b1c 100644 --- a/dense/encoder_4_n1_weight.f32.bin +++ b/dense/encoder_4_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fee47b193f6ed6749017d6c8c2a74cc469e9011e30ca33e2b0e73359eda018dc +oid sha256:2195f562646510d2e377c5d219dc1341d32001ed30b4d54cf754462cbcd175a1 size 2560 diff --git a/dense/encoder_4_n2_weight.f32.bin b/dense/encoder_4_n2_weight.f32.bin index 8d6e07ff47bd285fba1378381531aa3ec4a402ae..f8b83df2d8c8b5c37ad0a31a3bbdcd8f05a8cc2b 100644 --- a/dense/encoder_4_n2_weight.f32.bin +++ b/dense/encoder_4_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:14fd5b086cde7b81dc01556e455e1ea895d13ab062471b558dbea32b2d842b13 +oid sha256:75fda5bbfe2285970162c18ebf565ebe3e4032b2751b4bac289409a0ed8cb12b size 2560 diff --git a/dense/encoder_5_n1_weight.f32.bin b/dense/encoder_5_n1_weight.f32.bin index 4fa5c1e409ca803c5b846e0ff53a994b628a36ad..725fa9930f76b9d503537e56a8d5320233437a07 100644 --- a/dense/encoder_5_n1_weight.f32.bin +++ b/dense/encoder_5_n1_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8ccefbf5d0804e7ed9f0a693b26826dc330a5d0985d521b32c8b0ad8df02c149 +oid sha256:eb288cd1ccb8e5b7d5da5e6fa88afd881471b0bbbd355e14adbc3b885385e71f size 2560 diff --git a/dense/encoder_5_n2_weight.f32.bin b/dense/encoder_5_n2_weight.f32.bin index 922fbf7bf5ee9a8ce4f5aaefb3576277d58ae848..e8e3b1bff53e8e970c4b3e22b3ba5dff8fa9c777 100644 --- a/dense/encoder_5_n2_weight.f32.bin +++ b/dense/encoder_5_n2_weight.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3445fe77c401b32595a7fd403f3cf3445041b9333e71307d1efc5f902736a040 +oid sha256:75218ab909794e1396d0a651023851988cfea12c5085c9230b883188d3a66ae1 size 2560 diff --git a/layers/decoder_0_cross_block_cross_w_k.layout_header.i32.bin b/layers/decoder_0_cross_block_cross_w_k.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_0_cross_block_cross_w_k.layout_header.i32.bin +++ b/layers/decoder_0_cross_block_cross_w_k.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_0_cross_block_cross_w_k.packed_weight.u8.bin b/layers/decoder_0_cross_block_cross_w_k.packed_weight.u8.bin index 841e5d1ae9089f0cf1c55622cca775cc7160128f..4d3f7253dad96d659da89776b499aeab2bd801c4 100644 --- a/layers/decoder_0_cross_block_cross_w_k.packed_weight.u8.bin +++ b/layers/decoder_0_cross_block_cross_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:dab1fe7b8a9c0d16962d04385eb4bd8278ebc6b710048e308f4e952815704a89 +oid sha256:08479bdf9b9e401f6cb67193a75376c4d033262548fdb311cb43304639416056 size 102400 diff --git a/layers/decoder_0_cross_block_cross_w_k.scale_values.f32.bin b/layers/decoder_0_cross_block_cross_w_k.scale_values.f32.bin index f54cfd7c83b0cbb310a28ca75b4e0fc2385bd0a7..b4f1271c29f9a8183723e46a3dc7d50e72821d0f 100644 --- a/layers/decoder_0_cross_block_cross_w_k.scale_values.f32.bin +++ b/layers/decoder_0_cross_block_cross_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ccda5b9b61ca846d301dbf9745c708b2167137998117d3ab418e8afb2444d49c -size 2560 +oid sha256:5f1804fd15e3d2f211b606b28e53cf7f6c9dba0b41aca6331c21267374a2d2af +size 4 diff --git a/layers/decoder_0_cross_block_cross_w_o.layout_header.i32.bin b/layers/decoder_0_cross_block_cross_w_o.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_0_cross_block_cross_w_o.layout_header.i32.bin +++ b/layers/decoder_0_cross_block_cross_w_o.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_0_cross_block_cross_w_o.packed_weight.u8.bin b/layers/decoder_0_cross_block_cross_w_o.packed_weight.u8.bin index 90e8a0777dfed0625b4011abea6cbc4be9abb9fa..18056eeb8a6cc2ea57f63ea0971b2bfb64015166 100644 --- a/layers/decoder_0_cross_block_cross_w_o.packed_weight.u8.bin +++ b/layers/decoder_0_cross_block_cross_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a27b0efed3dc1b8317570f0b1c8c69dae70290817b2e5a6e6f2ce3be3793e0fe +oid sha256:626e1354171e0957b38f6a2477c00951a23c6817ed63da0407e5eaed32d7a8c0 size 102400 diff --git a/layers/decoder_0_cross_block_cross_w_o.scale_values.f32.bin b/layers/decoder_0_cross_block_cross_w_o.scale_values.f32.bin index df24e4a65c8e29ba230b55fd78c64ea29d3d64be..56010644de0f4a616c4594282f3a2135211c025c 100644 --- a/layers/decoder_0_cross_block_cross_w_o.scale_values.f32.bin +++ b/layers/decoder_0_cross_block_cross_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0b675f7d7585183acc3ae150ff7795d89028ad8f54dbd834b84f42d02b3d6a4f -size 2560 +oid sha256:5a9d7dba971eab55495a66c347f16b6f87381a569377479629f0afb1e024b64c +size 4 diff --git a/layers/decoder_0_cross_block_cross_w_q.layout_header.i32.bin b/layers/decoder_0_cross_block_cross_w_q.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_0_cross_block_cross_w_q.layout_header.i32.bin +++ b/layers/decoder_0_cross_block_cross_w_q.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_0_cross_block_cross_w_q.packed_weight.u8.bin b/layers/decoder_0_cross_block_cross_w_q.packed_weight.u8.bin index 70653036712ef3536bec7f709e64856adf754d7a..8028d6d956fd77338d38f08d3471f7cf36020262 100644 --- a/layers/decoder_0_cross_block_cross_w_q.packed_weight.u8.bin +++ b/layers/decoder_0_cross_block_cross_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cdb4e6bfba40293068056ce54f3e4c97b0c3b1a0aed88969106d1e9d3a0aff7e +oid sha256:af7d96d094f15aec2e3085ed7886bc977551a73ec02f8303de8aae92c1a9dc5b size 102400 diff --git a/layers/decoder_0_cross_block_cross_w_q.scale_values.f32.bin b/layers/decoder_0_cross_block_cross_w_q.scale_values.f32.bin index 12cbf852b3dc012fff90ea60d07c27369cdd9533..695f011779160f830c818c879f9cfee562f47b35 100644 --- a/layers/decoder_0_cross_block_cross_w_q.scale_values.f32.bin +++ b/layers/decoder_0_cross_block_cross_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7b2f4085a97118a209bf0cd98997c037aaed5437047cac9405c2cddabf5565d3 -size 2560 +oid sha256:8dd70c2cf3f9bd573a92e6e26febf05f647c9aa2a96be406653c820ad0236fd7 +size 4 diff --git a/layers/decoder_0_cross_block_cross_w_v.layout_header.i32.bin b/layers/decoder_0_cross_block_cross_w_v.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_0_cross_block_cross_w_v.layout_header.i32.bin +++ b/layers/decoder_0_cross_block_cross_w_v.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_0_cross_block_cross_w_v.packed_weight.u8.bin b/layers/decoder_0_cross_block_cross_w_v.packed_weight.u8.bin index 745ea9f4a9c8e7bc3fb34f5fc949c486174672f7..487fc1472adecd7765cfa50a9a6f390ac2ed9d64 100644 --- a/layers/decoder_0_cross_block_cross_w_v.packed_weight.u8.bin +++ b/layers/decoder_0_cross_block_cross_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bce666c81785261a37d521f07d4d33311234b80a61f376301b81c66fc45c37fa +oid sha256:e22c38d92ffc3b80e9e671365641515aea6d6752bc5daad7093fadf0cc824d6b size 102400 diff --git a/layers/decoder_0_cross_block_cross_w_v.scale_values.f32.bin b/layers/decoder_0_cross_block_cross_w_v.scale_values.f32.bin index dcdec27b0387a4ddd3007a063f83f27c388bdf04..fd9b029614e0a3e7acb56c3f0c53a87218dfbc05 100644 --- a/layers/decoder_0_cross_block_cross_w_v.scale_values.f32.bin +++ b/layers/decoder_0_cross_block_cross_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a5caee871504a64e3511d4abbfad95d73af3cc09261c05b6c0f536bac8b54161 -size 2560 +oid sha256:66caf7ed5c1928df1a13e925b9dc0668f373d962df677fe30849d7d651490180 +size 4 diff --git a/layers/decoder_0_cross_block_mlp_w_in.bias.f32.bin b/layers/decoder_0_cross_block_mlp_w_in.bias.f32.bin index 218768f55a05e31d42dda6861c908713fa02177c..85b64a0a2039933abbcb61b578d9a0d6317c6256 100644 --- a/layers/decoder_0_cross_block_mlp_w_in.bias.f32.bin +++ b/layers/decoder_0_cross_block_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0d1c7b21f7a5b3247e98ad66ad7e06b4405cd982256e530764ca6e81b14fd441 +oid sha256:05ca09aa97d5c292ea175fdba1462466841965246c1f484fe65a8796fb730d6a size 16384 diff --git a/layers/decoder_0_cross_block_mlp_w_in.layout_header.i32.bin b/layers/decoder_0_cross_block_mlp_w_in.layout_header.i32.bin index dfb09b60c1a463239bdde81ecc9589c186db51be..4f36c34f219a96fe3e8ec8c03b70d02426e7e7cb 100644 --- a/layers/decoder_0_cross_block_mlp_w_in.layout_header.i32.bin +++ b/layers/decoder_0_cross_block_mlp_w_in.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f +oid sha256:257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee size 52 diff --git a/layers/decoder_0_cross_block_mlp_w_in.packed_weight.u8.bin b/layers/decoder_0_cross_block_mlp_w_in.packed_weight.u8.bin index b033bbb10f37562e0b9f1dbde240e04d14e1b827..7d29104c1f330242ff560848a21e627c24c99b67 100644 --- a/layers/decoder_0_cross_block_mlp_w_in.packed_weight.u8.bin +++ b/layers/decoder_0_cross_block_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1b0ff6a2225621176cd52511c077eaa16aca405450460acf1ea1e0733fb676b3 +oid sha256:01a9eafef410331309602cfd32771cf501cd4c49ee2288717fdc8f8cf3103056 size 655360 diff --git a/layers/decoder_0_cross_block_mlp_w_in.scale_values.f32.bin b/layers/decoder_0_cross_block_mlp_w_in.scale_values.f32.bin index a8ecc638b4472150dbdd22eb2fd175f02b10301d..fbf74f62208aeacad2665f459abb80ce91cf198b 100644 --- a/layers/decoder_0_cross_block_mlp_w_in.scale_values.f32.bin +++ b/layers/decoder_0_cross_block_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:11410d9dd859c6356330fd0ff8c0f5d0ad6cd29d2498e14a3e5b2f11e5d78acd -size 16384 +oid sha256:334cbe3fc324d58e30e72661d54c03ed1085c27b3d642851df99d165861e2e23 +size 4 diff --git a/layers/decoder_0_cross_block_mlp_w_out.bias.f32.bin b/layers/decoder_0_cross_block_mlp_w_out.bias.f32.bin index c00cbe555e4aeaab298bdf0e8bec871535ecda25..88835e4d05972df437a37beebf2c6f5d90ca85c8 100644 --- a/layers/decoder_0_cross_block_mlp_w_out.bias.f32.bin +++ b/layers/decoder_0_cross_block_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ad99b45a62019c799b3fb1bb85547e9c2f260f88ce0a791e7cbe6a66b22f4cb7 +oid sha256:cd523a559d16f295950e4eefba07a2f728433c7ead25c64bfd23ab91107239d3 size 2560 diff --git a/layers/decoder_0_cross_block_mlp_w_out.layout_header.i32.bin b/layers/decoder_0_cross_block_mlp_w_out.layout_header.i32.bin index 0e75d07047a66b2c5fdc1a4889b0f4b64984a9e0..bb2fc38f00bb69d3211700402632c7467e412926 100644 --- a/layers/decoder_0_cross_block_mlp_w_out.layout_header.i32.bin +++ b/layers/decoder_0_cross_block_mlp_w_out.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311 +oid sha256:d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64 size 52 diff --git a/layers/decoder_0_cross_block_mlp_w_out.packed_weight.u8.bin b/layers/decoder_0_cross_block_mlp_w_out.packed_weight.u8.bin index 251b442ea38257bf434b9ba7a3e84bee0345a7e7..49cd93462a841ffa015f416d4dc39dc83c505af5 100644 --- a/layers/decoder_0_cross_block_mlp_w_out.packed_weight.u8.bin +++ b/layers/decoder_0_cross_block_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f8b98787aff27d2c5c2ef02ee5a8e2d51ae48477440c14aeb3f80f518bea0086 +oid sha256:b9506f4167f7524afe5d3b1acc61e8ceab2d3137ec6f4b545d24f9ba31c8c7bf size 327680 diff --git a/layers/decoder_0_cross_block_mlp_w_out.scale_values.f32.bin b/layers/decoder_0_cross_block_mlp_w_out.scale_values.f32.bin index 51341bebe00b8c904e5cf49595945fac259a5655..d3424b1d93d27b08e228312a2ffc07bff5271f68 100644 --- a/layers/decoder_0_cross_block_mlp_w_out.scale_values.f32.bin +++ b/layers/decoder_0_cross_block_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d1cf7d1512bb52ed1cd21db60765567bed2cb48f248fb81b68b82a0bf01991a7 -size 2560 +oid sha256:711af3f0d6d03e14c13f3536cd4c46f20a8b727fbd25b2b2e7f1b97f60194c1d +size 4 diff --git a/layers/decoder_0_self_attn_block_attn_w_k.layout_header.i32.bin b/layers/decoder_0_self_attn_block_attn_w_k.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_0_self_attn_block_attn_w_k.layout_header.i32.bin +++ b/layers/decoder_0_self_attn_block_attn_w_k.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_0_self_attn_block_attn_w_k.packed_weight.u8.bin b/layers/decoder_0_self_attn_block_attn_w_k.packed_weight.u8.bin index 1a8806e4c4843f3e0289a13d0fc156603b81aaa3..ac485348f5e6687cd4896e5b5876973c5c69d630 100644 --- a/layers/decoder_0_self_attn_block_attn_w_k.packed_weight.u8.bin +++ b/layers/decoder_0_self_attn_block_attn_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a315b12d0b86f25cc04527a71f8743d9bd1d3cf0bd4908142dd960c0b086b956 +oid sha256:a08b0d5a4abc10a63261efd14e67113fc454547474fc7473a3391a2682d92f58 size 102400 diff --git a/layers/decoder_0_self_attn_block_attn_w_k.scale_values.f32.bin b/layers/decoder_0_self_attn_block_attn_w_k.scale_values.f32.bin index d93aa49eb53c5e2773e63c30002b775424ff637c..3d61e58da69421a72ab03fbe76d8c14314ddedf1 100644 --- a/layers/decoder_0_self_attn_block_attn_w_k.scale_values.f32.bin +++ b/layers/decoder_0_self_attn_block_attn_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:28cf54f16e3af1f8b4c98f645e3075e9b88f3a87b118056bb1da4c086895bf07 -size 2560 +oid sha256:0e98fb82ceccf1cce50a58a31c2bc5aa778528de7112166fd3a3d9e0d8d160c4 +size 4 diff --git a/layers/decoder_0_self_attn_block_attn_w_o.layout_header.i32.bin b/layers/decoder_0_self_attn_block_attn_w_o.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_0_self_attn_block_attn_w_o.layout_header.i32.bin +++ b/layers/decoder_0_self_attn_block_attn_w_o.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_0_self_attn_block_attn_w_o.packed_weight.u8.bin b/layers/decoder_0_self_attn_block_attn_w_o.packed_weight.u8.bin index dbdf71a36bddbf0756ce1cc4a643e560e13c96e8..e58c243ce38c81ab9ab744ba7e0a4b81cc174afe 100644 --- a/layers/decoder_0_self_attn_block_attn_w_o.packed_weight.u8.bin +++ b/layers/decoder_0_self_attn_block_attn_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b68167c060a0068345304b71046c1b220738cdb1fca03ff28daef70e12414b0a +oid sha256:41d3f58c4e1c71a5e4238ecb90580beb3ecb66d82074d462f6bba66410488ed4 size 102400 diff --git a/layers/decoder_0_self_attn_block_attn_w_o.scale_values.f32.bin b/layers/decoder_0_self_attn_block_attn_w_o.scale_values.f32.bin index 62e3bc365cbc7524e058b83caeff8b6612864572..2317eb184a954eda57d7b43daaabfbe9f0218400 100644 --- a/layers/decoder_0_self_attn_block_attn_w_o.scale_values.f32.bin +++ b/layers/decoder_0_self_attn_block_attn_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3ca8fa5888fb89bbac7e20dbe4a6fc50f040b38977ce0ca892da7464b2e5a8e1 -size 2560 +oid sha256:9335b23e739a7ea4fb3e2a1406ff9a264afc8cb3a6aba655f76ffb98a965e472 +size 4 diff --git a/layers/decoder_0_self_attn_block_attn_w_q.layout_header.i32.bin b/layers/decoder_0_self_attn_block_attn_w_q.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_0_self_attn_block_attn_w_q.layout_header.i32.bin +++ b/layers/decoder_0_self_attn_block_attn_w_q.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_0_self_attn_block_attn_w_q.packed_weight.u8.bin b/layers/decoder_0_self_attn_block_attn_w_q.packed_weight.u8.bin index cbe08f2a7f951e34dfece5fb37392122ba041d2f..00f4de64304e2d48f4ea7d1aa754736334f87ca9 100644 --- a/layers/decoder_0_self_attn_block_attn_w_q.packed_weight.u8.bin +++ b/layers/decoder_0_self_attn_block_attn_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9bffd32c4471bcdfc023a17d068eadf47632e0da196f2de8afb3c0748852ba89 +oid sha256:b69a0802082960964d365f01736cc207853276e8ee31f16a62d67a9e9f6fe4e0 size 102400 diff --git a/layers/decoder_0_self_attn_block_attn_w_q.scale_values.f32.bin b/layers/decoder_0_self_attn_block_attn_w_q.scale_values.f32.bin index 97d02ed31d99f10139ed72baad7e6945f7c6e8b6..e83483419836c028e9e8a70e8c5a5716ded5edb2 100644 --- a/layers/decoder_0_self_attn_block_attn_w_q.scale_values.f32.bin +++ b/layers/decoder_0_self_attn_block_attn_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ace432da1e7b4f9731947428b48cb68caa0a3d9092a9da11dcdb4387fef97048 -size 2560 +oid sha256:cce1c626617073725f601763dca680ec47d2133ea70f7d8e6d2c4834a3534860 +size 4 diff --git a/layers/decoder_0_self_attn_block_attn_w_v.layout_header.i32.bin b/layers/decoder_0_self_attn_block_attn_w_v.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_0_self_attn_block_attn_w_v.layout_header.i32.bin +++ b/layers/decoder_0_self_attn_block_attn_w_v.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_0_self_attn_block_attn_w_v.packed_weight.u8.bin b/layers/decoder_0_self_attn_block_attn_w_v.packed_weight.u8.bin index 07eaa0c40a2cc5479ef392248591f6ab75bffbae..50bff1c85bcee512d5d8c24293b53d79eb89c93c 100644 --- a/layers/decoder_0_self_attn_block_attn_w_v.packed_weight.u8.bin +++ b/layers/decoder_0_self_attn_block_attn_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e8e19b7b1b4afb0ba99f550b05516e6f49b5b717d1f3494c0e2b2e8aa95782ff +oid sha256:4e724fdeaa3bf358ce60a23b5819f16e3d6953d27345b59051bcca52b6d535e2 size 102400 diff --git a/layers/decoder_0_self_attn_block_attn_w_v.scale_values.f32.bin b/layers/decoder_0_self_attn_block_attn_w_v.scale_values.f32.bin index dcb264819c85d74de64eb15b2162e0be51667175..1f47c5fcf0e451bccbce3cffdffd9f8e80caa3f0 100644 --- a/layers/decoder_0_self_attn_block_attn_w_v.scale_values.f32.bin +++ b/layers/decoder_0_self_attn_block_attn_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f7db1205ef1a06954b3ec54f2a6f25c354d2ec62f647087dd59159bd66b5abba -size 2560 +oid sha256:0164f5b76a21689a3217a3a14b333715ba53ff3515d6a47d993062ccf1eec43a +size 4 diff --git a/layers/decoder_0_self_attn_block_mlp_w_in.bias.f32.bin b/layers/decoder_0_self_attn_block_mlp_w_in.bias.f32.bin index b87792c9daee67f259e06811bb3fce0401a3229c..646def13831b267e7bf6b8c66a9075eae5b1d2de 100644 --- a/layers/decoder_0_self_attn_block_mlp_w_in.bias.f32.bin +++ b/layers/decoder_0_self_attn_block_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:03f4c36fe4f7d830223a0f442b9b15a6b82a10dd37f139d1bcf6b67b097b8f5b +oid sha256:e31392b1c36010e0789ec0b99e127aeef5058181d02807917ff9dd091777b9fd size 16384 diff --git a/layers/decoder_0_self_attn_block_mlp_w_in.layout_header.i32.bin b/layers/decoder_0_self_attn_block_mlp_w_in.layout_header.i32.bin index dfb09b60c1a463239bdde81ecc9589c186db51be..4f36c34f219a96fe3e8ec8c03b70d02426e7e7cb 100644 --- a/layers/decoder_0_self_attn_block_mlp_w_in.layout_header.i32.bin +++ b/layers/decoder_0_self_attn_block_mlp_w_in.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f +oid sha256:257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee size 52 diff --git a/layers/decoder_0_self_attn_block_mlp_w_in.packed_weight.u8.bin b/layers/decoder_0_self_attn_block_mlp_w_in.packed_weight.u8.bin index 045b3b72c87b71477b612b35e38cc744cc66f789..48dc364acb8d54be8be37dbd62e4e6ff4af16ecc 100644 --- a/layers/decoder_0_self_attn_block_mlp_w_in.packed_weight.u8.bin +++ b/layers/decoder_0_self_attn_block_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a93390ed156e0b0fe0886c537b4c223efa58119a2d3ef74a509feffb8d3a5faf +oid sha256:9cb2abe959183ae123b07b3ab1db7b98eb21a72e6775282e1793ec1efd6a9f51 size 655360 diff --git a/layers/decoder_0_self_attn_block_mlp_w_in.scale_values.f32.bin b/layers/decoder_0_self_attn_block_mlp_w_in.scale_values.f32.bin index ea28523fe9db27a733617194769e89c460cef8de..1c9f038853d05b20b2b3e3570b56122255a4961d 100644 --- a/layers/decoder_0_self_attn_block_mlp_w_in.scale_values.f32.bin +++ b/layers/decoder_0_self_attn_block_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:42a65fe4d99200f8d73192af4c23ece3b905554d184fb1ff2f245916aa1d00a7 -size 16384 +oid sha256:203c7722acd5a6a17458bcace023040352b430777f2bf1668ec64ef00774bec6 +size 4 diff --git a/layers/decoder_0_self_attn_block_mlp_w_out.bias.f32.bin b/layers/decoder_0_self_attn_block_mlp_w_out.bias.f32.bin index be4c862512c2b7e1962609a39d235c2ab26eef96..abc34761058ba64c824e02d87de6912c1c3b4980 100644 --- a/layers/decoder_0_self_attn_block_mlp_w_out.bias.f32.bin +++ b/layers/decoder_0_self_attn_block_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:65c03a26b3b5cc37f42318ca20e55cdc4fdb3df11b031aa1056c5fb7311717f1 +oid sha256:d483dd0a73a79a2a5a78cdc9629f7658f6e6eecdd50647fbf1df6a7784a48d4c size 2560 diff --git a/layers/decoder_0_self_attn_block_mlp_w_out.layout_header.i32.bin b/layers/decoder_0_self_attn_block_mlp_w_out.layout_header.i32.bin index 0e75d07047a66b2c5fdc1a4889b0f4b64984a9e0..bb2fc38f00bb69d3211700402632c7467e412926 100644 --- a/layers/decoder_0_self_attn_block_mlp_w_out.layout_header.i32.bin +++ b/layers/decoder_0_self_attn_block_mlp_w_out.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311 +oid sha256:d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64 size 52 diff --git a/layers/decoder_0_self_attn_block_mlp_w_out.packed_weight.u8.bin b/layers/decoder_0_self_attn_block_mlp_w_out.packed_weight.u8.bin index f075854127558492a3e521f9e37b5a7c790a9dfe..88654124584cafb53be8b7e7bb2d4c29667b9cd1 100644 --- a/layers/decoder_0_self_attn_block_mlp_w_out.packed_weight.u8.bin +++ b/layers/decoder_0_self_attn_block_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e3ed6900ac4cbfc0c66404135ed3357764c8bb91b14481969406d10651d6a380 +oid sha256:66ebf71cf9aa0930f98edead53d5c6557294117e52c6060d3e515385fb8b7c21 size 327680 diff --git a/layers/decoder_0_self_attn_block_mlp_w_out.scale_values.f32.bin b/layers/decoder_0_self_attn_block_mlp_w_out.scale_values.f32.bin index 7a0a5c229f5702f9d4ee4c0573f350e43125e6ac..c386f8b7fc2cb43426940f632c5b566c7e2bc140 100644 --- a/layers/decoder_0_self_attn_block_mlp_w_out.scale_values.f32.bin +++ b/layers/decoder_0_self_attn_block_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2e1b173e866f97309124e9e65ebfbc84a34e5855125b20ebca2ff54f16b1b793 -size 2560 +oid sha256:2e3753caa7aaccec574fe60f6e7da33de305c0698012ad5f666cb78f7b9a8207 +size 4 diff --git a/layers/decoder_1_cross_block_cross_w_k.layout_header.i32.bin b/layers/decoder_1_cross_block_cross_w_k.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_1_cross_block_cross_w_k.layout_header.i32.bin +++ b/layers/decoder_1_cross_block_cross_w_k.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_1_cross_block_cross_w_k.packed_weight.u8.bin b/layers/decoder_1_cross_block_cross_w_k.packed_weight.u8.bin index 4468bfb413313e6cdaa9579387059ff611dbf100..9489e02ae3b2fd9326fd4616cddbd41a1a229582 100644 --- a/layers/decoder_1_cross_block_cross_w_k.packed_weight.u8.bin +++ b/layers/decoder_1_cross_block_cross_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:32252c6527d271f9dbbd442837e8e20d81077dfedc331500d2a6a58e3a2fe846 +oid sha256:92da8351ea49f3e5e5cac3fa2f3ec616b2ab1f2c2e0590f77c241eeb1edb3d4c size 102400 diff --git a/layers/decoder_1_cross_block_cross_w_k.scale_values.f32.bin b/layers/decoder_1_cross_block_cross_w_k.scale_values.f32.bin index 932e964991ef0353646d1190eb4f1105d4494297..05159fe5aa0d86dd8fda4e39281d8b705776dfa9 100644 --- a/layers/decoder_1_cross_block_cross_w_k.scale_values.f32.bin +++ b/layers/decoder_1_cross_block_cross_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:dd2d3910474cb1007ca2b9982543b5cbb71d8b001752a8838c35fd817d81e01b -size 2560 +oid sha256:48d46cb7803af682dd8b3e6358e5a8829f3031e6051774bd606815dcd32022d7 +size 4 diff --git a/layers/decoder_1_cross_block_cross_w_o.layout_header.i32.bin b/layers/decoder_1_cross_block_cross_w_o.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_1_cross_block_cross_w_o.layout_header.i32.bin +++ b/layers/decoder_1_cross_block_cross_w_o.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_1_cross_block_cross_w_o.packed_weight.u8.bin b/layers/decoder_1_cross_block_cross_w_o.packed_weight.u8.bin index 7d50e4858f2d975c81401cca7c7c45b9b8b27521..92c6c6840b39d383dcb8b0bcf211bf85effcf366 100644 --- a/layers/decoder_1_cross_block_cross_w_o.packed_weight.u8.bin +++ b/layers/decoder_1_cross_block_cross_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:10cffac7ec80a010b58e7ac2c1e528d083b61411bb7adcbc3ed46ac5bbaeeb1a +oid sha256:d40ee2db7dbc602afd3cff0b7046e7571092feb5bd2acab9d751fe39b8f0393a size 102400 diff --git a/layers/decoder_1_cross_block_cross_w_o.scale_values.f32.bin b/layers/decoder_1_cross_block_cross_w_o.scale_values.f32.bin index cd8ec4ac1080074b61a246e5132aa17807fa5fd7..67afdf8413deaac99d01541fdc42c7e05e0eea14 100644 --- a/layers/decoder_1_cross_block_cross_w_o.scale_values.f32.bin +++ b/layers/decoder_1_cross_block_cross_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:56e9ca708e8eab4f2439a734b9a8f20ce70ad57d3a113628e5607d0da9c4daed -size 2560 +oid sha256:19b42d8f06375451e83c749579aabb9e152ed409def93381d8378f2b80ed4bda +size 4 diff --git a/layers/decoder_1_cross_block_cross_w_q.layout_header.i32.bin b/layers/decoder_1_cross_block_cross_w_q.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_1_cross_block_cross_w_q.layout_header.i32.bin +++ b/layers/decoder_1_cross_block_cross_w_q.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_1_cross_block_cross_w_q.packed_weight.u8.bin b/layers/decoder_1_cross_block_cross_w_q.packed_weight.u8.bin index 0657fdaecad961f407d8ef882c1ceb0fc7b11a0d..ed89a4a0f31ae0df1aafc36bc2fe051b98419293 100644 --- a/layers/decoder_1_cross_block_cross_w_q.packed_weight.u8.bin +++ b/layers/decoder_1_cross_block_cross_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:08be78ad3df0180ff637243fbc2ed3ca5e46c1b983ac09530e90f78e68b25379 +oid sha256:fbc0c47e3e99833cfd35d714791c5a20482d1db64a1dd2524f85cbd90a09d5ee size 102400 diff --git a/layers/decoder_1_cross_block_cross_w_q.scale_values.f32.bin b/layers/decoder_1_cross_block_cross_w_q.scale_values.f32.bin index 0b186c16b65ae00510d5c3afc77bad338f69c2b7..bed5c6927d1cbfcdae3f1cf1d54bfc53d360cbaf 100644 --- a/layers/decoder_1_cross_block_cross_w_q.scale_values.f32.bin +++ b/layers/decoder_1_cross_block_cross_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:68798aa8d4fb447fd0540177b3c2b2d5056c3fb17b6262da551a3f821090e174 -size 2560 +oid sha256:22a56325517500e9aa144b6c45c43142c71f2f3785a0ca9f368ba92b33b6a10a +size 4 diff --git a/layers/decoder_1_cross_block_cross_w_v.layout_header.i32.bin b/layers/decoder_1_cross_block_cross_w_v.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_1_cross_block_cross_w_v.layout_header.i32.bin +++ b/layers/decoder_1_cross_block_cross_w_v.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_1_cross_block_cross_w_v.packed_weight.u8.bin b/layers/decoder_1_cross_block_cross_w_v.packed_weight.u8.bin index 6dc3e03c0b585ff036e09a116617166996a3cec7..1245be489494c571a84f1612ce62750a9024fd4c 100644 --- a/layers/decoder_1_cross_block_cross_w_v.packed_weight.u8.bin +++ b/layers/decoder_1_cross_block_cross_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c719a28098be92cc1ff0118fbe3b9bcb49d0f374d06ad4619198bb9f198b6519 +oid sha256:a3d150e880dc3d1e210143ac8f14431ccbb73e26e2182f2695eaa133b01a05de size 102400 diff --git a/layers/decoder_1_cross_block_cross_w_v.scale_values.f32.bin b/layers/decoder_1_cross_block_cross_w_v.scale_values.f32.bin index fb3fcee0d1c2927acbc11a68dc1529a7a9f6efef..157ab04631e046b8b9377a1a24fa36800cb4a107 100644 --- a/layers/decoder_1_cross_block_cross_w_v.scale_values.f32.bin +++ b/layers/decoder_1_cross_block_cross_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:54941c4e0b7edc9d9658ba42cfa5ce0652836fd57a274141bad95df2aafd52df -size 2560 +oid sha256:4f426dc2b506ed8e8b0dfc6436e74d16ab7e2650a494946f7b92c66cb14b8753 +size 4 diff --git a/layers/decoder_1_cross_block_mlp_w_in.bias.f32.bin b/layers/decoder_1_cross_block_mlp_w_in.bias.f32.bin index c71948fffe3e28e399fa842f98c7e696b59dc9bc..ae43fa79b1e3fe251ca64a5de085a3d7083ff967 100644 --- a/layers/decoder_1_cross_block_mlp_w_in.bias.f32.bin +++ b/layers/decoder_1_cross_block_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c12df42bd62e067ab734a5fb22311d1b8e0eadc2a3a8a0d3eacad5d4ba8edbaf +oid sha256:353917073379bcde4b14d13263453d8e1ea0f9efc761a0f5a25c45ca30cdb7e4 size 16384 diff --git a/layers/decoder_1_cross_block_mlp_w_in.layout_header.i32.bin b/layers/decoder_1_cross_block_mlp_w_in.layout_header.i32.bin index dfb09b60c1a463239bdde81ecc9589c186db51be..4f36c34f219a96fe3e8ec8c03b70d02426e7e7cb 100644 --- a/layers/decoder_1_cross_block_mlp_w_in.layout_header.i32.bin +++ b/layers/decoder_1_cross_block_mlp_w_in.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f +oid sha256:257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee size 52 diff --git a/layers/decoder_1_cross_block_mlp_w_in.packed_weight.u8.bin b/layers/decoder_1_cross_block_mlp_w_in.packed_weight.u8.bin index 905456b2036ab35398a6985e92a21fd40b0c5fa0..810c44817253153d017402d8a5d6c9f35ea30830 100644 --- a/layers/decoder_1_cross_block_mlp_w_in.packed_weight.u8.bin +++ b/layers/decoder_1_cross_block_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:147f2cb807148dd9b9903e5aab63602ad272f7c7287d366858e25bb42dffc7a9 +oid sha256:7e6ce561de8adedea09bd594dbf820ff345a4b839d7176158594223c2f23c059 size 655360 diff --git a/layers/decoder_1_cross_block_mlp_w_in.scale_values.f32.bin b/layers/decoder_1_cross_block_mlp_w_in.scale_values.f32.bin index 6403b6decb41c9dd66937b9c0bd46a96b3fa66b8..8fa501ce7547f3873d9d4bd2f1f9e01d0cbe7de7 100644 --- a/layers/decoder_1_cross_block_mlp_w_in.scale_values.f32.bin +++ b/layers/decoder_1_cross_block_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0da7709e16e4c7ca38ffb1d9c3c815e2ddae7b5191c07c107c80646085238205 -size 16384 +oid sha256:5f5bc5b85387c70f0ff0a8a6236137247179cc750539ade22badb819f046a146 +size 4 diff --git a/layers/decoder_1_cross_block_mlp_w_out.bias.f32.bin b/layers/decoder_1_cross_block_mlp_w_out.bias.f32.bin index 7992c808c7122ef0557ab1e1abf9de79fd8d3a6e..274b75aa0a79db9a57a60f8ef4c3588dcaebfb99 100644 --- a/layers/decoder_1_cross_block_mlp_w_out.bias.f32.bin +++ b/layers/decoder_1_cross_block_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:177029674ff23caa5d0f64d5d59ab8c30997300c226e9a1d0769d4198b3bcf9e +oid sha256:5483e84f88674f52dc3f127ace0d01c79d4000fadbc51ebf1567deb2a5c3a617 size 2560 diff --git a/layers/decoder_1_cross_block_mlp_w_out.layout_header.i32.bin b/layers/decoder_1_cross_block_mlp_w_out.layout_header.i32.bin index 0e75d07047a66b2c5fdc1a4889b0f4b64984a9e0..bb2fc38f00bb69d3211700402632c7467e412926 100644 --- a/layers/decoder_1_cross_block_mlp_w_out.layout_header.i32.bin +++ b/layers/decoder_1_cross_block_mlp_w_out.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311 +oid sha256:d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64 size 52 diff --git a/layers/decoder_1_cross_block_mlp_w_out.packed_weight.u8.bin b/layers/decoder_1_cross_block_mlp_w_out.packed_weight.u8.bin index f69fde51e2c2511d1ee3dfb35b0f2bfebe664f68..f5f5b6b5624df7b9a08bc4902786a268d9fd0a16 100644 --- a/layers/decoder_1_cross_block_mlp_w_out.packed_weight.u8.bin +++ b/layers/decoder_1_cross_block_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9ec392d9ebad88b0211e4325a5526cadb95b11687d74c57e375de0f8a05072b2 +oid sha256:388cfedf59b1d4a8a3b3caa5db87ab91b4914351dd5bb0a88488dfcbb24bec4d size 327680 diff --git a/layers/decoder_1_cross_block_mlp_w_out.scale_values.f32.bin b/layers/decoder_1_cross_block_mlp_w_out.scale_values.f32.bin index 50c55c0767d285143b59a2f117292a18ef181337..5e1606468495edc1d33d7832ff6ee1d2ba30cdbd 100644 --- a/layers/decoder_1_cross_block_mlp_w_out.scale_values.f32.bin +++ b/layers/decoder_1_cross_block_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cfbfb56d430de308a8d3ed35905aa51ea32f1cd3aa97942652b43a6add1c3ffd -size 2560 +oid sha256:fac4e93a918e7832ac8e7d7bf7295ef64aa7694f874856f7a931bdee21d2f2c0 +size 4 diff --git a/layers/decoder_1_self_attn_block_attn_w_k.layout_header.i32.bin b/layers/decoder_1_self_attn_block_attn_w_k.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_1_self_attn_block_attn_w_k.layout_header.i32.bin +++ b/layers/decoder_1_self_attn_block_attn_w_k.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_1_self_attn_block_attn_w_k.packed_weight.u8.bin b/layers/decoder_1_self_attn_block_attn_w_k.packed_weight.u8.bin index 5a11b5c3dc2c350d5bbd1c891366126db5d4c9dc..466b2575b354e7427af0dbc322bd6684ac9f91ff 100644 --- a/layers/decoder_1_self_attn_block_attn_w_k.packed_weight.u8.bin +++ b/layers/decoder_1_self_attn_block_attn_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1ef7df6ce7c7cf79e720be6fddd8fb86dacdb6067ce088e981e5cd11c053d588 +oid sha256:6a36f2f65841904629925fbcfa84e126aae8f6e9c8abcd6f72a8ecd7f22ccbd7 size 102400 diff --git a/layers/decoder_1_self_attn_block_attn_w_k.scale_values.f32.bin b/layers/decoder_1_self_attn_block_attn_w_k.scale_values.f32.bin index d29e8bf6faa8220a4609fd10b7c346d03a50bfd1..46ee38ed34a8b14a026e8eea4f63f1010b51bf2c 100644 --- a/layers/decoder_1_self_attn_block_attn_w_k.scale_values.f32.bin +++ b/layers/decoder_1_self_attn_block_attn_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2622bf47efeaa15ebdbb9f9eaa930af498683747212acaee09496955364fe787 -size 2560 +oid sha256:846e22bc9fcb3f7dc3993852f8d0fd8befab13ce081324a3abc1fdc56fea413d +size 4 diff --git a/layers/decoder_1_self_attn_block_attn_w_o.layout_header.i32.bin b/layers/decoder_1_self_attn_block_attn_w_o.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_1_self_attn_block_attn_w_o.layout_header.i32.bin +++ b/layers/decoder_1_self_attn_block_attn_w_o.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_1_self_attn_block_attn_w_o.packed_weight.u8.bin b/layers/decoder_1_self_attn_block_attn_w_o.packed_weight.u8.bin index 813930729416094513321eb6f7ee9a769021fbe7..24b19bb829e7f230b63d91bb022b397316b20079 100644 --- a/layers/decoder_1_self_attn_block_attn_w_o.packed_weight.u8.bin +++ b/layers/decoder_1_self_attn_block_attn_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:04ddf127b2c76986e4d0b3b9c36e1dc8bbf404b314b836958794ab3ba5e198a4 +oid sha256:17b81e31d14fd2377646cc5351be3ff7299c4025b1a65ee0bc0378d6d69ef4ba size 102400 diff --git a/layers/decoder_1_self_attn_block_attn_w_o.scale_values.f32.bin b/layers/decoder_1_self_attn_block_attn_w_o.scale_values.f32.bin index f6d9497416923139d65edad958e0b09adc813f72..06f450f625c6141d67a203ffd6a92c5c467d6c8e 100644 --- a/layers/decoder_1_self_attn_block_attn_w_o.scale_values.f32.bin +++ b/layers/decoder_1_self_attn_block_attn_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7e63be7ea82af79ae38e684120c0ce922ee52f6b2cadbfb11fde9545f5c91a64 -size 2560 +oid sha256:63565a86aae052794d7e726aeb21584a9e39c52a2646ad0454ca7ae4cb1e575c +size 4 diff --git a/layers/decoder_1_self_attn_block_attn_w_q.layout_header.i32.bin b/layers/decoder_1_self_attn_block_attn_w_q.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_1_self_attn_block_attn_w_q.layout_header.i32.bin +++ b/layers/decoder_1_self_attn_block_attn_w_q.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_1_self_attn_block_attn_w_q.packed_weight.u8.bin b/layers/decoder_1_self_attn_block_attn_w_q.packed_weight.u8.bin index 3e395327828b1f708ac2689ed53f7b808d799c4f..9675e33416915d75312999299bde1004c8ea2ccd 100644 --- a/layers/decoder_1_self_attn_block_attn_w_q.packed_weight.u8.bin +++ b/layers/decoder_1_self_attn_block_attn_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d8a8b78ec75e0c333663940e9f8a74b44f7252d399895df9b27da2b4037d157b +oid sha256:f62eead467ee63a5bb17213bd7744956aff491ec56204820143ac249b8a2dd36 size 102400 diff --git a/layers/decoder_1_self_attn_block_attn_w_q.scale_values.f32.bin b/layers/decoder_1_self_attn_block_attn_w_q.scale_values.f32.bin index d20616bf18b5c41254d42e4e98de196c2232dbeb..0a81c0325828426de8da2363ad0019eb5eed3dd4 100644 --- a/layers/decoder_1_self_attn_block_attn_w_q.scale_values.f32.bin +++ b/layers/decoder_1_self_attn_block_attn_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:332eb215c1ba8817f68d134462324f799236b88c7a050bb63ca6bd0d4c0d7753 -size 2560 +oid sha256:49d0d891621d97a6caa308fc53d029f8d89c6437a02014014fcf8198275bf19f +size 4 diff --git a/layers/decoder_1_self_attn_block_attn_w_v.layout_header.i32.bin b/layers/decoder_1_self_attn_block_attn_w_v.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_1_self_attn_block_attn_w_v.layout_header.i32.bin +++ b/layers/decoder_1_self_attn_block_attn_w_v.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_1_self_attn_block_attn_w_v.packed_weight.u8.bin b/layers/decoder_1_self_attn_block_attn_w_v.packed_weight.u8.bin index 31ec657ee940aca4a31c2c49f3d2d0e714f639d0..cbc4b35a60f498c56baa1099481dfc1b5715b17a 100644 --- a/layers/decoder_1_self_attn_block_attn_w_v.packed_weight.u8.bin +++ b/layers/decoder_1_self_attn_block_attn_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1e55dd6de5285a9a895c2fdce7c57f32b37d0882fc31a2ec66c021bb4707886a +oid sha256:306f969e226ee36dc20a66056ac851a449b7810160bee0166aec85710cfd51fc size 102400 diff --git a/layers/decoder_1_self_attn_block_attn_w_v.scale_values.f32.bin b/layers/decoder_1_self_attn_block_attn_w_v.scale_values.f32.bin index 0d7224c39ad8cb44d78aee283ef24e1454a586a2..24d553bfa30f5a840e4daacd2e8602fcb447e942 100644 --- a/layers/decoder_1_self_attn_block_attn_w_v.scale_values.f32.bin +++ b/layers/decoder_1_self_attn_block_attn_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e26e8e075bc0ae64848a79d680a9603d5a67b1319ad22e86613e95c382e37072 -size 2560 +oid sha256:3b2c300fcc22571bc36c6819fb412f49fce02d486d528946416d4e9f7f1b50b3 +size 4 diff --git a/layers/decoder_1_self_attn_block_mlp_w_in.bias.f32.bin b/layers/decoder_1_self_attn_block_mlp_w_in.bias.f32.bin index e0f0a2c2ec1d5839b6fc9c7ae66c6409743013fe..1a9986e7558ac6a5caa93029426404f94dea540f 100644 --- a/layers/decoder_1_self_attn_block_mlp_w_in.bias.f32.bin +++ b/layers/decoder_1_self_attn_block_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:db359faa9d174bff94c2274019c8401c9b9cdd5fec5c3c7da9e7dbe7627723e4 +oid sha256:cf73fdfbe8b4919a8011de646e3cc5a1d8438fc08cc1d70403453f39d8bf5a9b size 16384 diff --git a/layers/decoder_1_self_attn_block_mlp_w_in.layout_header.i32.bin b/layers/decoder_1_self_attn_block_mlp_w_in.layout_header.i32.bin index dfb09b60c1a463239bdde81ecc9589c186db51be..4f36c34f219a96fe3e8ec8c03b70d02426e7e7cb 100644 --- a/layers/decoder_1_self_attn_block_mlp_w_in.layout_header.i32.bin +++ b/layers/decoder_1_self_attn_block_mlp_w_in.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f +oid sha256:257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee size 52 diff --git a/layers/decoder_1_self_attn_block_mlp_w_in.packed_weight.u8.bin b/layers/decoder_1_self_attn_block_mlp_w_in.packed_weight.u8.bin index 4549043cb7d384736d7dfe75053239a45834c976..4a047bbacabb788c138712b407d1f4e0a936585c 100644 --- a/layers/decoder_1_self_attn_block_mlp_w_in.packed_weight.u8.bin +++ b/layers/decoder_1_self_attn_block_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:da5f2bb8654af32349bffb9907ee0db606fa63df16a5802c29700cc33b9de975 +oid sha256:c035ce58f51ad9bdb3869a4b4fc5d49a9fdb3ae922c8748d04d5fcba076eaa0d size 655360 diff --git a/layers/decoder_1_self_attn_block_mlp_w_in.scale_values.f32.bin b/layers/decoder_1_self_attn_block_mlp_w_in.scale_values.f32.bin index 84063f7d831b8492115230e4cb4f9237cd74daf4..eb4eb4fc0824b3f2bddf5e3a364ea7e89d5981d6 100644 --- a/layers/decoder_1_self_attn_block_mlp_w_in.scale_values.f32.bin +++ b/layers/decoder_1_self_attn_block_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8cec28ced33955f68fddbbd870c2a0b0fd969eb6b478b3a4cdba0cbf56a6fd22 -size 16384 +oid sha256:0848c8fa964abf68b054126ff610f8525c1030c0f0c8c061d865dfacd66c938b +size 4 diff --git a/layers/decoder_1_self_attn_block_mlp_w_out.bias.f32.bin b/layers/decoder_1_self_attn_block_mlp_w_out.bias.f32.bin index 89d0c5a6b108d870be2ab77228fe6eecd4a9c038..61dd7f8b4a710c8a8e4e44c223ae93b1c823fae5 100644 --- a/layers/decoder_1_self_attn_block_mlp_w_out.bias.f32.bin +++ b/layers/decoder_1_self_attn_block_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:013cfd5cdffcfff5bc159d970f94d01811f6f3d118fdea9ac821333f2af399b1 +oid sha256:5a1f09f3f10cc9731a269ec34ac6e5f721ae3e6c08e84cb33cc46050de33d962 size 2560 diff --git a/layers/decoder_1_self_attn_block_mlp_w_out.layout_header.i32.bin b/layers/decoder_1_self_attn_block_mlp_w_out.layout_header.i32.bin index 0e75d07047a66b2c5fdc1a4889b0f4b64984a9e0..bb2fc38f00bb69d3211700402632c7467e412926 100644 --- a/layers/decoder_1_self_attn_block_mlp_w_out.layout_header.i32.bin +++ b/layers/decoder_1_self_attn_block_mlp_w_out.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311 +oid sha256:d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64 size 52 diff --git a/layers/decoder_1_self_attn_block_mlp_w_out.packed_weight.u8.bin b/layers/decoder_1_self_attn_block_mlp_w_out.packed_weight.u8.bin index 6bbca6bdd02ef0ee5f7f4ddcc1ddbf6781d09899..c4fd5ec8671a6588d5895f6dfb6bef1f3cc34398 100644 --- a/layers/decoder_1_self_attn_block_mlp_w_out.packed_weight.u8.bin +++ b/layers/decoder_1_self_attn_block_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b4ce6d83159561062230049e832bcca18287dd68f40d60397aa23e6045562bb2 +oid sha256:72b1bf0497c3af46aba032c7fc0225c6bab53539728f100131faf88e474d2424 size 327680 diff --git a/layers/decoder_1_self_attn_block_mlp_w_out.scale_values.f32.bin b/layers/decoder_1_self_attn_block_mlp_w_out.scale_values.f32.bin index c60d243cbfcd023e53efcd8430d9d7a08c892aeb..60154a0769a16bd2433a828414bf64ccc8cf95db 100644 --- a/layers/decoder_1_self_attn_block_mlp_w_out.scale_values.f32.bin +++ b/layers/decoder_1_self_attn_block_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f8a8117d6d4b72628c9ff1d88b3e39800e567f1b816abd017d5531f0a270b26e -size 2560 +oid sha256:5e915f656a0ab9ceeee2f2570b8be4ab2e190c0a7324d2fafe35fefa0d560d1a +size 4 diff --git a/layers/decoder_2_cross_block_cross_w_k.layout_header.i32.bin b/layers/decoder_2_cross_block_cross_w_k.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_2_cross_block_cross_w_k.layout_header.i32.bin +++ b/layers/decoder_2_cross_block_cross_w_k.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_2_cross_block_cross_w_k.packed_weight.u8.bin b/layers/decoder_2_cross_block_cross_w_k.packed_weight.u8.bin index e21e0b088df312af49456ffd2ecff2dbf6fd0a35..ec7378e31101c95588fa6b9db63c6c7b1ea8af54 100644 --- a/layers/decoder_2_cross_block_cross_w_k.packed_weight.u8.bin +++ b/layers/decoder_2_cross_block_cross_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:40bb2ca08a1c0b8dfb988b7e61a5b57aeedc55c20e9d0c35caab4aead2966449 +oid sha256:41e7cb11fe40d3dd71fd9261df9ba5919bfe1e13e81b34feab2ec682a2138d60 size 102400 diff --git a/layers/decoder_2_cross_block_cross_w_k.scale_values.f32.bin b/layers/decoder_2_cross_block_cross_w_k.scale_values.f32.bin index 2544790159458b9bf6239a7264a5ef6e70f446f0..125e0aa007fa73cd193833b146a158953de34fc6 100644 --- a/layers/decoder_2_cross_block_cross_w_k.scale_values.f32.bin +++ b/layers/decoder_2_cross_block_cross_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f07e412aef0bbb6ceafc7c6c99708ccfbc1524e6ce038191e2a4699a415ee870 -size 2560 +oid sha256:75a0324241350114abdff35b66cf04401eae67cceb15c6d94f3ebba0e357b07f +size 4 diff --git a/layers/decoder_2_cross_block_cross_w_o.layout_header.i32.bin b/layers/decoder_2_cross_block_cross_w_o.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_2_cross_block_cross_w_o.layout_header.i32.bin +++ b/layers/decoder_2_cross_block_cross_w_o.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_2_cross_block_cross_w_o.packed_weight.u8.bin b/layers/decoder_2_cross_block_cross_w_o.packed_weight.u8.bin index e87cfc1fca4527b4366b471af53557300cb94312..f22e88eaa4dc6cc88bd9227dd247f5d1bfb46644 100644 --- a/layers/decoder_2_cross_block_cross_w_o.packed_weight.u8.bin +++ b/layers/decoder_2_cross_block_cross_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9f83084ce3d183412dc6709472bc0957af6133a40d678a1be8628213eafb0bf3 +oid sha256:6f4aac9b6307efe0813bb7133ff5d32baaea2aa869e1ce4585bc3253e465cbe9 size 102400 diff --git a/layers/decoder_2_cross_block_cross_w_o.scale_values.f32.bin b/layers/decoder_2_cross_block_cross_w_o.scale_values.f32.bin index 2f911178078709c18ed916491c5ea70136ba8105..fda051e982e4b6601f6ec33f57d29617302780bc 100644 --- a/layers/decoder_2_cross_block_cross_w_o.scale_values.f32.bin +++ b/layers/decoder_2_cross_block_cross_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a5b0e7833c17a2ff33c6f5eb2ed13740aff81b4507ac20975dfd68494df733bc -size 2560 +oid sha256:054938dfb43c4787837f7db97a0a0a40e078b5ef09aeb61720d07085e262a8b9 +size 4 diff --git a/layers/decoder_2_cross_block_cross_w_q.layout_header.i32.bin b/layers/decoder_2_cross_block_cross_w_q.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_2_cross_block_cross_w_q.layout_header.i32.bin +++ b/layers/decoder_2_cross_block_cross_w_q.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_2_cross_block_cross_w_q.packed_weight.u8.bin b/layers/decoder_2_cross_block_cross_w_q.packed_weight.u8.bin index 31d82f6f0027a8353091c3783da8a207532876a3..432110b7771297a850939b5088507d461ee0e259 100644 --- a/layers/decoder_2_cross_block_cross_w_q.packed_weight.u8.bin +++ b/layers/decoder_2_cross_block_cross_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b751950d3a076dc83467a2ec55298c5c9cbfd95dafa26ccbd43d28dec2573c70 +oid sha256:609d07290090c8ef4302591373e4908b287aaa745a422eea94ae9533d36e4233 size 102400 diff --git a/layers/decoder_2_cross_block_cross_w_q.scale_values.f32.bin b/layers/decoder_2_cross_block_cross_w_q.scale_values.f32.bin index 32b7b09b3d66d2c2021f75379bf2712ab3ba108e..94f6b8e1e6f194e495a13576b390f6ce9c36af0c 100644 --- a/layers/decoder_2_cross_block_cross_w_q.scale_values.f32.bin +++ b/layers/decoder_2_cross_block_cross_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:37ed7b5a0e185bc2c19807c5853e907788af50c18a739852d1a6a0d35df1f430 -size 2560 +oid sha256:4d319778f3e29447ddf90f96449fca67c89b32a91d0c812fc37f6a90ccf19765 +size 4 diff --git a/layers/decoder_2_cross_block_cross_w_v.layout_header.i32.bin b/layers/decoder_2_cross_block_cross_w_v.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_2_cross_block_cross_w_v.layout_header.i32.bin +++ b/layers/decoder_2_cross_block_cross_w_v.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_2_cross_block_cross_w_v.packed_weight.u8.bin b/layers/decoder_2_cross_block_cross_w_v.packed_weight.u8.bin index 6312ed36b62976269b36b6a11ceda730fb7948ef..79fd59fa7f06e539be30c158005ffa375db9762a 100644 --- a/layers/decoder_2_cross_block_cross_w_v.packed_weight.u8.bin +++ b/layers/decoder_2_cross_block_cross_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e084d111d06a9a0d76aa499e744722550d05eae2f1772f271811db88098eebac +oid sha256:aa561b95c482d3e84dde5b670b1dccfe3f90f9f54cf5129447cf126ec6d0f0bd size 102400 diff --git a/layers/decoder_2_cross_block_cross_w_v.scale_values.f32.bin b/layers/decoder_2_cross_block_cross_w_v.scale_values.f32.bin index 147e774fba59911e9afdfc40b9ee9c69009283f3..b85b416920ae27b3e78b1a7f3f1e5b1e21ac7dfe 100644 --- a/layers/decoder_2_cross_block_cross_w_v.scale_values.f32.bin +++ b/layers/decoder_2_cross_block_cross_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:155a3ede99090e94a080e9e4264f7a66af48394caac960c0b4ab7f29c1a87f25 -size 2560 +oid sha256:00710a7d695de7913cb4ec8b60882839a999e13a0ff2f7100d17112df55783f8 +size 4 diff --git a/layers/decoder_2_cross_block_mlp_w_in.bias.f32.bin b/layers/decoder_2_cross_block_mlp_w_in.bias.f32.bin index a0fb455899559e5ed5ed02d306a312a7077c5d55..a74d3ad8660b6fa64309419d7147da479c98cbaa 100644 --- a/layers/decoder_2_cross_block_mlp_w_in.bias.f32.bin +++ b/layers/decoder_2_cross_block_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b544ea371ac2c1203d9d2a9c4e5de96cd267bf48e12ab9bc642489d2bfcd35b9 +oid sha256:c215a193ec6d3dacf0e99800d066f1a703f83a25e37cde9eb29cd3c5e98f1089 size 16384 diff --git a/layers/decoder_2_cross_block_mlp_w_in.layout_header.i32.bin b/layers/decoder_2_cross_block_mlp_w_in.layout_header.i32.bin index dfb09b60c1a463239bdde81ecc9589c186db51be..4f36c34f219a96fe3e8ec8c03b70d02426e7e7cb 100644 --- a/layers/decoder_2_cross_block_mlp_w_in.layout_header.i32.bin +++ b/layers/decoder_2_cross_block_mlp_w_in.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f +oid sha256:257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee size 52 diff --git a/layers/decoder_2_cross_block_mlp_w_in.packed_weight.u8.bin b/layers/decoder_2_cross_block_mlp_w_in.packed_weight.u8.bin index d8766bbc490cd3dd3de73ac50a0ae94a2c3a439a..ffdd297757032a3b4b2d0db0562a88075040ee82 100644 --- a/layers/decoder_2_cross_block_mlp_w_in.packed_weight.u8.bin +++ b/layers/decoder_2_cross_block_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f7dfd5b21df56ff51cfd9a989001a8bb84f20a744a16a52444ebc0360fc823e1 +oid sha256:c61cc24ec3441640300dd8819e57df7aee2859e12cf4921e8c927ca73336fd62 size 655360 diff --git a/layers/decoder_2_cross_block_mlp_w_in.scale_values.f32.bin b/layers/decoder_2_cross_block_mlp_w_in.scale_values.f32.bin index a988d9ce0cf4dc42d649ab9dcfe5544568f51241..c19d4783c3dde697c1b61ac3e2aa55f5742398b7 100644 --- a/layers/decoder_2_cross_block_mlp_w_in.scale_values.f32.bin +++ b/layers/decoder_2_cross_block_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:024294b499c04b0f98736ba1cf71a1eaec1569908cc1b7e7e7f29a2e2288e70a -size 16384 +oid sha256:9d8f7893980dca5cb4ea179cca82881fa0a975afc060c7bab202d84b7c26c0a0 +size 4 diff --git a/layers/decoder_2_cross_block_mlp_w_out.bias.f32.bin b/layers/decoder_2_cross_block_mlp_w_out.bias.f32.bin index 458794d227f244bdd4b51ef9f626ae392f01a7b7..3e9caadbc27e4b8e425e368bb7d859f4610c4b1d 100644 --- a/layers/decoder_2_cross_block_mlp_w_out.bias.f32.bin +++ b/layers/decoder_2_cross_block_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7fe1fb1a00d470795ea8ca416523f2b87da5de8f8370035df1f12a9235e93ff9 +oid sha256:dddac929ae3b499247e4babaacaf9085b3b438edc00ecf20b769b87ba906b57d size 2560 diff --git a/layers/decoder_2_cross_block_mlp_w_out.layout_header.i32.bin b/layers/decoder_2_cross_block_mlp_w_out.layout_header.i32.bin index 0e75d07047a66b2c5fdc1a4889b0f4b64984a9e0..bb2fc38f00bb69d3211700402632c7467e412926 100644 --- a/layers/decoder_2_cross_block_mlp_w_out.layout_header.i32.bin +++ b/layers/decoder_2_cross_block_mlp_w_out.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311 +oid sha256:d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64 size 52 diff --git a/layers/decoder_2_cross_block_mlp_w_out.packed_weight.u8.bin b/layers/decoder_2_cross_block_mlp_w_out.packed_weight.u8.bin index 2d7f6cbc0ab25a6ef87de91d426b9bc485e8c8c2..1910fce040cb9add0793d06b6d5d00a19aaf2a08 100644 --- a/layers/decoder_2_cross_block_mlp_w_out.packed_weight.u8.bin +++ b/layers/decoder_2_cross_block_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:84d5e83faf90d19110eeeb505a3036848cb5df357f5cb1bfdf69c4f0b6724bb6 +oid sha256:1a5a777485495e3453ac1efe529125b6e41c41e8c6c91b573891bae2ba664c5c size 327680 diff --git a/layers/decoder_2_cross_block_mlp_w_out.scale_values.f32.bin b/layers/decoder_2_cross_block_mlp_w_out.scale_values.f32.bin index 8287ff292b0ad213c5d84363cf4514391e5ea96a..bbe070c1735bcb59dfd3ef153aa35923ec1fe618 100644 --- a/layers/decoder_2_cross_block_mlp_w_out.scale_values.f32.bin +++ b/layers/decoder_2_cross_block_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6104b6247af8eeb849065c5f9a5c5cd437f68906eed1f755500db50589d9526f -size 2560 +oid sha256:27a4aeebab0d1a35828177169e6f0f6b560ec3e41994baa94cc361357a52f8c0 +size 4 diff --git a/layers/decoder_2_self_attn_block_attn_w_k.layout_header.i32.bin b/layers/decoder_2_self_attn_block_attn_w_k.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_2_self_attn_block_attn_w_k.layout_header.i32.bin +++ b/layers/decoder_2_self_attn_block_attn_w_k.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_2_self_attn_block_attn_w_k.packed_weight.u8.bin b/layers/decoder_2_self_attn_block_attn_w_k.packed_weight.u8.bin index 368d59e4d1ce0b048069053dcce7fe01dc196287..ad22cedc42e619e30849ea6a58058bb3678d3bad 100644 --- a/layers/decoder_2_self_attn_block_attn_w_k.packed_weight.u8.bin +++ b/layers/decoder_2_self_attn_block_attn_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9c5a7b17bef87ae00765b3af4e06e5bc4baa47572a11ff28b4934974f2545872 +oid sha256:8b705241d97aca82476624e41fe3c140ae7d9235f5f3a5b5bb5e12d3b870924c size 102400 diff --git a/layers/decoder_2_self_attn_block_attn_w_k.scale_values.f32.bin b/layers/decoder_2_self_attn_block_attn_w_k.scale_values.f32.bin index b3acc8aa10394e010127f56411587d257b18e888..4ac9dc136e0076c135cdfb1b695ca4ab812e49e6 100644 --- a/layers/decoder_2_self_attn_block_attn_w_k.scale_values.f32.bin +++ b/layers/decoder_2_self_attn_block_attn_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2eb0318a2e6b38b19caf9921aa01fcf72468fde21a11092c82e3b2e01e6bd1de -size 2560 +oid sha256:05bba73e8e543abc881c7eaa776bc92dba6a2ae60242763a4c3dca027fc9bde0 +size 4 diff --git a/layers/decoder_2_self_attn_block_attn_w_o.layout_header.i32.bin b/layers/decoder_2_self_attn_block_attn_w_o.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_2_self_attn_block_attn_w_o.layout_header.i32.bin +++ b/layers/decoder_2_self_attn_block_attn_w_o.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_2_self_attn_block_attn_w_o.packed_weight.u8.bin b/layers/decoder_2_self_attn_block_attn_w_o.packed_weight.u8.bin index f3f12c346fe173bebebcff82d0157bd99617213b..5fd60bc9d64d2e6ac052040f1f780b928b138db2 100644 --- a/layers/decoder_2_self_attn_block_attn_w_o.packed_weight.u8.bin +++ b/layers/decoder_2_self_attn_block_attn_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:24304fd6258f3395e3d0a6de4b278540c71f7c33ed976cfa11f756d19195785b +oid sha256:ca48a2627346da038dcddd11d166de40fb13bef35721e2f145dbbd02f6a812e1 size 102400 diff --git a/layers/decoder_2_self_attn_block_attn_w_o.scale_values.f32.bin b/layers/decoder_2_self_attn_block_attn_w_o.scale_values.f32.bin index 73432389d16dfad7041ee5fa7fcbde0b9b602f4e..79bacd773957daf8c6ab4af187a66e33261417e1 100644 --- a/layers/decoder_2_self_attn_block_attn_w_o.scale_values.f32.bin +++ b/layers/decoder_2_self_attn_block_attn_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:32bc8118f0830b955cb008e5d7e216753b01852f8d26f64dfcd65e11c03192c5 -size 2560 +oid sha256:5f32c56c00f6599aa359c568271168fe2f9b703d3ae525fd6f5c90e9e8fd1101 +size 4 diff --git a/layers/decoder_2_self_attn_block_attn_w_q.layout_header.i32.bin b/layers/decoder_2_self_attn_block_attn_w_q.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_2_self_attn_block_attn_w_q.layout_header.i32.bin +++ b/layers/decoder_2_self_attn_block_attn_w_q.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_2_self_attn_block_attn_w_q.packed_weight.u8.bin b/layers/decoder_2_self_attn_block_attn_w_q.packed_weight.u8.bin index c1e41a28576d7c1b17aa009335832e22845f2859..0acb508a8273b51794a9bff422ea803756179530 100644 --- a/layers/decoder_2_self_attn_block_attn_w_q.packed_weight.u8.bin +++ b/layers/decoder_2_self_attn_block_attn_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ee221a90adfb6b2827509d51b0ce244828bef9e3a9a262f1dace51ebdaeed413 +oid sha256:1d13a29954664d845f2cd98812e1fabee6a9e170375ba2bc45d23c52c54d6451 size 102400 diff --git a/layers/decoder_2_self_attn_block_attn_w_q.scale_values.f32.bin b/layers/decoder_2_self_attn_block_attn_w_q.scale_values.f32.bin index 5ae5cadee07de12c1d6bd61cd32f07e9ebc0d218..745af3f417b2194e5f4e90d0b8940687c631404c 100644 --- a/layers/decoder_2_self_attn_block_attn_w_q.scale_values.f32.bin +++ b/layers/decoder_2_self_attn_block_attn_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b8cf30ab162d8091bf588b85a36a288e2a4ae3b5d045ac7dfbed1a3db6b2161f -size 2560 +oid sha256:47251edd0a08418643195800fecf0e458182321181477a15ab3010913b118b47 +size 4 diff --git a/layers/decoder_2_self_attn_block_attn_w_v.layout_header.i32.bin b/layers/decoder_2_self_attn_block_attn_w_v.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_2_self_attn_block_attn_w_v.layout_header.i32.bin +++ b/layers/decoder_2_self_attn_block_attn_w_v.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_2_self_attn_block_attn_w_v.packed_weight.u8.bin b/layers/decoder_2_self_attn_block_attn_w_v.packed_weight.u8.bin index 35099b5ca290971a71a5a8fe200f32378bcd44fb..c87d39df894d9f7764c78d3481f5075e3d7bbb15 100644 --- a/layers/decoder_2_self_attn_block_attn_w_v.packed_weight.u8.bin +++ b/layers/decoder_2_self_attn_block_attn_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:dce50f6236c1def1d66af65586f306a99d60f81370f6dde81b665f352f15ad30 +oid sha256:063dedadd12036857efe5cf02e6c5f8a72f95955a10f2d505b53f2bf970e2009 size 102400 diff --git a/layers/decoder_2_self_attn_block_attn_w_v.scale_values.f32.bin b/layers/decoder_2_self_attn_block_attn_w_v.scale_values.f32.bin index 6a48d89482397eb23b7b9473c2039422bfd04daa..c53b4062687acc69a12ae535e022e7bebc62191a 100644 --- a/layers/decoder_2_self_attn_block_attn_w_v.scale_values.f32.bin +++ b/layers/decoder_2_self_attn_block_attn_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d54124058055e97d7d177cee143b3d9af8c7ae40eb47052a706db0f21b1613a4 -size 2560 +oid sha256:03d502752c8a6f1756549584a3b7322b0e399d227df984a716fbe9c00489dfde +size 4 diff --git a/layers/decoder_2_self_attn_block_mlp_w_in.bias.f32.bin b/layers/decoder_2_self_attn_block_mlp_w_in.bias.f32.bin index a5a1a7e3174b4ef28fdcb435ca232d827659e68a..dc51cc256a825dd1eb57f21181f763e2546aed2f 100644 --- a/layers/decoder_2_self_attn_block_mlp_w_in.bias.f32.bin +++ b/layers/decoder_2_self_attn_block_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:927295ef6316c7afd4c4d8b8ed649f5b1411fd993e764fe08c896e631c4c9566 +oid sha256:6d2d6bbf68f226d911b8685478969e47862d6c77135f4e59b26a523ad5fc4ba8 size 16384 diff --git a/layers/decoder_2_self_attn_block_mlp_w_in.layout_header.i32.bin b/layers/decoder_2_self_attn_block_mlp_w_in.layout_header.i32.bin index dfb09b60c1a463239bdde81ecc9589c186db51be..4f36c34f219a96fe3e8ec8c03b70d02426e7e7cb 100644 --- a/layers/decoder_2_self_attn_block_mlp_w_in.layout_header.i32.bin +++ b/layers/decoder_2_self_attn_block_mlp_w_in.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f +oid sha256:257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee size 52 diff --git a/layers/decoder_2_self_attn_block_mlp_w_in.packed_weight.u8.bin b/layers/decoder_2_self_attn_block_mlp_w_in.packed_weight.u8.bin index f4bec0e85979430af2109dcf64a3d84a9cb6465c..e236913704893fdbdbb85ac53290d545104ed9b3 100644 --- a/layers/decoder_2_self_attn_block_mlp_w_in.packed_weight.u8.bin +++ b/layers/decoder_2_self_attn_block_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:814fe93187b306522f2e2f44366604c6136ae8e88770e0baf172a0d9f47f8d6a +oid sha256:7ad63162b55e63274c9df645f9cb8f876ebf3f69f3e79b3d89c9e5043f95969f size 655360 diff --git a/layers/decoder_2_self_attn_block_mlp_w_in.scale_values.f32.bin b/layers/decoder_2_self_attn_block_mlp_w_in.scale_values.f32.bin index b46d9bb433ec49b5621f3f75dd8d1045f851a2c7..ae16d627340b45aa3cde403e0bd3517f0fa6b56e 100644 --- a/layers/decoder_2_self_attn_block_mlp_w_in.scale_values.f32.bin +++ b/layers/decoder_2_self_attn_block_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:57659daf026b8a58f21b043009c202151184cf022d11d005d1049f2a953b1719 -size 16384 +oid sha256:c4996743a1807ca846a22787da890efc8acdd1cb2fff49a0bda050d21f60bba2 +size 4 diff --git a/layers/decoder_2_self_attn_block_mlp_w_out.bias.f32.bin b/layers/decoder_2_self_attn_block_mlp_w_out.bias.f32.bin index 739f1d57ec0f60314fd63fd7199debbc59891296..dff0733fe744c409bdf140a7b6cdc4010053c38e 100644 --- a/layers/decoder_2_self_attn_block_mlp_w_out.bias.f32.bin +++ b/layers/decoder_2_self_attn_block_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7120d39a97140da8f52785ce16a5edf7d8584912e24a104d4f70b3b7a0b48ac2 +oid sha256:6630012f9386a03840589168e20887549e8047f3024c6559cd31468e9742490f size 2560 diff --git a/layers/decoder_2_self_attn_block_mlp_w_out.layout_header.i32.bin b/layers/decoder_2_self_attn_block_mlp_w_out.layout_header.i32.bin index 0e75d07047a66b2c5fdc1a4889b0f4b64984a9e0..bb2fc38f00bb69d3211700402632c7467e412926 100644 --- a/layers/decoder_2_self_attn_block_mlp_w_out.layout_header.i32.bin +++ b/layers/decoder_2_self_attn_block_mlp_w_out.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311 +oid sha256:d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64 size 52 diff --git a/layers/decoder_2_self_attn_block_mlp_w_out.packed_weight.u8.bin b/layers/decoder_2_self_attn_block_mlp_w_out.packed_weight.u8.bin index 44d869ed1b38ffc599d21c90492ba47a9a875df0..4ea9970079efae9cdd8ffade57ec0e8b111a852c 100644 --- a/layers/decoder_2_self_attn_block_mlp_w_out.packed_weight.u8.bin +++ b/layers/decoder_2_self_attn_block_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:455d1361f4c8a97e9c2a7fa480b72762655e69fe447b77dbd6defe4637089c7a +oid sha256:e84e1b4da3cbda5ffb8d639a5df25579890f33ec1b9e3533afbe5a8e64b6a9e2 size 327680 diff --git a/layers/decoder_2_self_attn_block_mlp_w_out.scale_values.f32.bin b/layers/decoder_2_self_attn_block_mlp_w_out.scale_values.f32.bin index b247112c7d98d463382ff0ba42f313fbb1208b27..e906a7d6e4e0eb74583554b9b63acb757d8abfd8 100644 --- a/layers/decoder_2_self_attn_block_mlp_w_out.scale_values.f32.bin +++ b/layers/decoder_2_self_attn_block_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3278f0004d71004a3cf57ec8ecd600c7216678e032f239e03f712eff375070fe -size 2560 +oid sha256:80bd2688eb5c2aa9e027729d0ad8228ce2900fd43452341b728ba098c5cecbc3 +size 4 diff --git a/layers/decoder_3_cross_block_cross_w_k.layout_header.i32.bin b/layers/decoder_3_cross_block_cross_w_k.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_3_cross_block_cross_w_k.layout_header.i32.bin +++ b/layers/decoder_3_cross_block_cross_w_k.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_3_cross_block_cross_w_k.packed_weight.u8.bin b/layers/decoder_3_cross_block_cross_w_k.packed_weight.u8.bin index 70a73dd3b6c1661e6d542f89a3f3c7fe6ed4632a..d001a16b0bcb5289be2f0f35a46f1779bfe512db 100644 --- a/layers/decoder_3_cross_block_cross_w_k.packed_weight.u8.bin +++ b/layers/decoder_3_cross_block_cross_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4615506b9de6bf246a308393f0b47bc554a89d0e8a86859f06fb2e9cb5455557 +oid sha256:8105f4ef6ee1fd9bd42f78e0bd9c1f982a2cd3ad899e41826cf0e5bf5ad05007 size 102400 diff --git a/layers/decoder_3_cross_block_cross_w_k.scale_values.f32.bin b/layers/decoder_3_cross_block_cross_w_k.scale_values.f32.bin index cbd1eee1adeb39714d34171f9a06176a80c8049a..09d390f985c96443d518d6c65db0685c6d0dcace 100644 --- a/layers/decoder_3_cross_block_cross_w_k.scale_values.f32.bin +++ b/layers/decoder_3_cross_block_cross_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:98e293a04fcc5eb815240f8620bb42ab961696d25df43a0a1456549121fd1dda -size 2560 +oid sha256:d75a9affb73da4e16bc9a90f247fd084576544b1e658dfdd636fc21eb34c0d2e +size 4 diff --git a/layers/decoder_3_cross_block_cross_w_o.layout_header.i32.bin b/layers/decoder_3_cross_block_cross_w_o.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_3_cross_block_cross_w_o.layout_header.i32.bin +++ b/layers/decoder_3_cross_block_cross_w_o.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_3_cross_block_cross_w_o.packed_weight.u8.bin b/layers/decoder_3_cross_block_cross_w_o.packed_weight.u8.bin index 8c5c650996dd929cb898fe6e680f0bafd1f4dfa9..8fe5c2bc08313cae4ef409c7b39a68f69a69d94d 100644 --- a/layers/decoder_3_cross_block_cross_w_o.packed_weight.u8.bin +++ b/layers/decoder_3_cross_block_cross_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:33e89992827e578d2db3ef7bae29f9ebec8db7b4d5cbca90ac1567824f08d59b +oid sha256:65549080d4995a379029003c546796c5ae914910b0ad1dc250691fd22a4f8417 size 102400 diff --git a/layers/decoder_3_cross_block_cross_w_o.scale_values.f32.bin b/layers/decoder_3_cross_block_cross_w_o.scale_values.f32.bin index 3cd12d6d815576edfe8c79845f5476d365a276f6..c629803658bfdc7226f729385152fa406e6efc79 100644 --- a/layers/decoder_3_cross_block_cross_w_o.scale_values.f32.bin +++ b/layers/decoder_3_cross_block_cross_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f4e26d26400a65d13fd45f45e212c75884fcfceb7d370dd2fb958c66384b6825 -size 2560 +oid sha256:03938795c6cd8f22b6a622f93e244251d3b96dc3ab422a45604eb9c21c7f0d1e +size 4 diff --git a/layers/decoder_3_cross_block_cross_w_q.layout_header.i32.bin b/layers/decoder_3_cross_block_cross_w_q.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_3_cross_block_cross_w_q.layout_header.i32.bin +++ b/layers/decoder_3_cross_block_cross_w_q.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_3_cross_block_cross_w_q.packed_weight.u8.bin b/layers/decoder_3_cross_block_cross_w_q.packed_weight.u8.bin index d41ff3fd88105856a990e910154f2d4a481d16e6..0bd3a721c28a211c5ec459f38df16f2a88b34dee 100644 --- a/layers/decoder_3_cross_block_cross_w_q.packed_weight.u8.bin +++ b/layers/decoder_3_cross_block_cross_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c0c754c1c26de9b5f045269a549c4e78715f400d08a7d5ac2fc3a56f4d7ccb2e +oid sha256:aee3c8de55436c54869b5e2275c9aece2a09a18464b1af113bb0ff8be47f750c size 102400 diff --git a/layers/decoder_3_cross_block_cross_w_q.scale_values.f32.bin b/layers/decoder_3_cross_block_cross_w_q.scale_values.f32.bin index e0fc8283dee88434266778ecefa56e6ff69ae545..1b9f189ef7f75523b2a667faccb48b45ef187a5a 100644 --- a/layers/decoder_3_cross_block_cross_w_q.scale_values.f32.bin +++ b/layers/decoder_3_cross_block_cross_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ed490ffbfaebd2130ba5a0bc7158305fec49152aabf872e11b438cd898ee23e9 -size 2560 +oid sha256:72fb79ed33a2c5752c4eb020474046f673be865b858e0d99c68914d10ac74535 +size 4 diff --git a/layers/decoder_3_cross_block_cross_w_v.layout_header.i32.bin b/layers/decoder_3_cross_block_cross_w_v.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_3_cross_block_cross_w_v.layout_header.i32.bin +++ b/layers/decoder_3_cross_block_cross_w_v.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_3_cross_block_cross_w_v.packed_weight.u8.bin b/layers/decoder_3_cross_block_cross_w_v.packed_weight.u8.bin index 7c7a579529120e8ecdc8e83b61403c054d4edf90..acb421fa91272ba960c7d49031afd7a927ccf715 100644 --- a/layers/decoder_3_cross_block_cross_w_v.packed_weight.u8.bin +++ b/layers/decoder_3_cross_block_cross_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b66c7d11f1d89055a23b186d56e13c83f897838ce3d316fcab2857ac5f14de93 +oid sha256:61023e45baaf3879bf48cea3186a42852bec4ed5f042183803772d7463b70f00 size 102400 diff --git a/layers/decoder_3_cross_block_cross_w_v.scale_values.f32.bin b/layers/decoder_3_cross_block_cross_w_v.scale_values.f32.bin index 54114c3bc2ab9808df4bd8284bb2d39d792e61e0..233709741a5b48b01ef5e7464a59cd769bd1826a 100644 --- a/layers/decoder_3_cross_block_cross_w_v.scale_values.f32.bin +++ b/layers/decoder_3_cross_block_cross_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:61d4936b988663a9b7ff66eaffb0adbb160653377f09b42f03840186374cb111 -size 2560 +oid sha256:49dc0865e16ceee877c011c75f72eadbac2c734c3645fb2ebd9309e61bf6cdaf +size 4 diff --git a/layers/decoder_3_cross_block_mlp_w_in.bias.f32.bin b/layers/decoder_3_cross_block_mlp_w_in.bias.f32.bin index 95b2cf83e785cc6e379c50b64c266c7891e5a68a..51ffb2aa5594ca980899e69462a722e262c5f5c2 100644 --- a/layers/decoder_3_cross_block_mlp_w_in.bias.f32.bin +++ b/layers/decoder_3_cross_block_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2a00b32a39221435a08beb98b5df5a7fef1a9ca45087f09c5dbca2d1ed6fd67f +oid sha256:0d2cf34775e4122f3f773a7000d1e36329f250e8cba0c12154c1287f2ed640c0 size 16384 diff --git a/layers/decoder_3_cross_block_mlp_w_in.layout_header.i32.bin b/layers/decoder_3_cross_block_mlp_w_in.layout_header.i32.bin index dfb09b60c1a463239bdde81ecc9589c186db51be..4f36c34f219a96fe3e8ec8c03b70d02426e7e7cb 100644 --- a/layers/decoder_3_cross_block_mlp_w_in.layout_header.i32.bin +++ b/layers/decoder_3_cross_block_mlp_w_in.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f +oid sha256:257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee size 52 diff --git a/layers/decoder_3_cross_block_mlp_w_in.packed_weight.u8.bin b/layers/decoder_3_cross_block_mlp_w_in.packed_weight.u8.bin index 8d3f2276f325a98e4dba080501882d0c2485c009..b2ca6603068c5c1345b90a9a4fcd367565604a94 100644 --- a/layers/decoder_3_cross_block_mlp_w_in.packed_weight.u8.bin +++ b/layers/decoder_3_cross_block_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9d50b29b673d876e72d051ec8dac1a997b48b6d279c3c0686a15d6d1ca17cc20 +oid sha256:fdbf9731e6997780c963cc037cd8ea297db91d72b9cd75b33e8ea651aee7dc61 size 655360 diff --git a/layers/decoder_3_cross_block_mlp_w_in.scale_values.f32.bin b/layers/decoder_3_cross_block_mlp_w_in.scale_values.f32.bin index 6d374bd3624820e348be20e6c625ff097bfefae4..a5d5fc9a81490baf690f3568774e97fdc2d1581e 100644 --- a/layers/decoder_3_cross_block_mlp_w_in.scale_values.f32.bin +++ b/layers/decoder_3_cross_block_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b2aaf1731428de4dea2b2c94d92be1605a5914147820df01b613bfb938ae2641 -size 16384 +oid sha256:5253e4d1f1d0333ecec00ba3ad5da6c09855b22c2c47d64d3a032c36027b8c13 +size 4 diff --git a/layers/decoder_3_cross_block_mlp_w_out.bias.f32.bin b/layers/decoder_3_cross_block_mlp_w_out.bias.f32.bin index 2f5f4d66573650079344ac2a2a5c2e7f68379534..5cbfc49d5a01a167951eeee6c3cf1c45e141343d 100644 --- a/layers/decoder_3_cross_block_mlp_w_out.bias.f32.bin +++ b/layers/decoder_3_cross_block_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:404606177696da2165733d6f8af43fec6228499443d8c463d17d4888578e8af9 +oid sha256:acc4d0806de36f892e17b7bc0ddccfe679788b28fd05347071aab28246142515 size 2560 diff --git a/layers/decoder_3_cross_block_mlp_w_out.layout_header.i32.bin b/layers/decoder_3_cross_block_mlp_w_out.layout_header.i32.bin index 0e75d07047a66b2c5fdc1a4889b0f4b64984a9e0..bb2fc38f00bb69d3211700402632c7467e412926 100644 --- a/layers/decoder_3_cross_block_mlp_w_out.layout_header.i32.bin +++ b/layers/decoder_3_cross_block_mlp_w_out.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311 +oid sha256:d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64 size 52 diff --git a/layers/decoder_3_cross_block_mlp_w_out.packed_weight.u8.bin b/layers/decoder_3_cross_block_mlp_w_out.packed_weight.u8.bin index ece66d1488fc41431cbe06ce5c070c9f0ea6c1e6..059e5cbc0d7d66b5758ee895c1f87214da72966d 100644 --- a/layers/decoder_3_cross_block_mlp_w_out.packed_weight.u8.bin +++ b/layers/decoder_3_cross_block_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9edee44179fb49efef2f42b3ec5016df1afed8835787720d1191cd4da4ebdcf8 +oid sha256:93bb7dc6c659ed2b3787d09cb0a3b196e5d0fd2965bc269a1bee8dc280d6e6fc size 327680 diff --git a/layers/decoder_3_cross_block_mlp_w_out.scale_values.f32.bin b/layers/decoder_3_cross_block_mlp_w_out.scale_values.f32.bin index bf4d5df69a6ec1374b5b00aa7ee436ad7ddc0771..7ec6c4b98bcededb33965e690cd0e05534a38b8c 100644 --- a/layers/decoder_3_cross_block_mlp_w_out.scale_values.f32.bin +++ b/layers/decoder_3_cross_block_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d16e05105856f137094f69b422ed1c30b9f8eb90bc8a9ff205e9493b0bbe73dc -size 2560 +oid sha256:3b1d604246796ef8e2677732742d85621d7586140406b32fedaca157cc6350c2 +size 4 diff --git a/layers/decoder_3_self_attn_block_attn_w_k.layout_header.i32.bin b/layers/decoder_3_self_attn_block_attn_w_k.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_3_self_attn_block_attn_w_k.layout_header.i32.bin +++ b/layers/decoder_3_self_attn_block_attn_w_k.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_3_self_attn_block_attn_w_k.packed_weight.u8.bin b/layers/decoder_3_self_attn_block_attn_w_k.packed_weight.u8.bin index 4125e0848aac1f1b327b89fdd010893e701ce808..6e906dda2ca4b31256d6a6d09560b01c9af3f5e7 100644 --- a/layers/decoder_3_self_attn_block_attn_w_k.packed_weight.u8.bin +++ b/layers/decoder_3_self_attn_block_attn_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8d0ab575d0b279fa4474d7b9f00647929f35685ab76cd3643c6433a46e8ed4de +oid sha256:bace7d74ed3d9800393c16f73dc1d5edfc7e335e80b25862492756f04efeded2 size 102400 diff --git a/layers/decoder_3_self_attn_block_attn_w_k.scale_values.f32.bin b/layers/decoder_3_self_attn_block_attn_w_k.scale_values.f32.bin index cd4cdfcdaa754d9628b0adfef1c5148bd6685b5d..235f3f8f265afd4a9fd7009de7afd394d41c2122 100644 --- a/layers/decoder_3_self_attn_block_attn_w_k.scale_values.f32.bin +++ b/layers/decoder_3_self_attn_block_attn_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:71249b7aaf64de63e50bf8f046bd46570d7e95512373946b35ae69230d0f7ff6 -size 2560 +oid sha256:e4adf7959163fd8a9fbd35076cf99bf292ebd9fbf10db3aab0363f335a43ad80 +size 4 diff --git a/layers/decoder_3_self_attn_block_attn_w_o.layout_header.i32.bin b/layers/decoder_3_self_attn_block_attn_w_o.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_3_self_attn_block_attn_w_o.layout_header.i32.bin +++ b/layers/decoder_3_self_attn_block_attn_w_o.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_3_self_attn_block_attn_w_o.packed_weight.u8.bin b/layers/decoder_3_self_attn_block_attn_w_o.packed_weight.u8.bin index ff3cf004097b0cc375b2ae0cf1bfbe509a713dd0..1ad5fc13a9dad707f9b8e9653022ccea43c46ba4 100644 --- a/layers/decoder_3_self_attn_block_attn_w_o.packed_weight.u8.bin +++ b/layers/decoder_3_self_attn_block_attn_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:baa3747fd7115ae1207676b6f0b7a24c143394c391efcde887fd7d04535c04e6 +oid sha256:b03dadf7d238896ba81b0778ad41d57be94c7dafa18a0eed2bcf083d333344ce size 102400 diff --git a/layers/decoder_3_self_attn_block_attn_w_o.scale_values.f32.bin b/layers/decoder_3_self_attn_block_attn_w_o.scale_values.f32.bin index 8acf871263ae6cc99f506b7706906abf41a81550..06dbfd420a25ab4323c9304401393cfa549ef4c9 100644 --- a/layers/decoder_3_self_attn_block_attn_w_o.scale_values.f32.bin +++ b/layers/decoder_3_self_attn_block_attn_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3bbcce09479da4f651ffaeaa820380ac3d06546fbf304dc3da300953c27c1d06 -size 2560 +oid sha256:f4187a6eefd5fdd64919509ea071d950e1747c9546ab9fa69d1caa234c175c81 +size 4 diff --git a/layers/decoder_3_self_attn_block_attn_w_q.layout_header.i32.bin b/layers/decoder_3_self_attn_block_attn_w_q.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_3_self_attn_block_attn_w_q.layout_header.i32.bin +++ b/layers/decoder_3_self_attn_block_attn_w_q.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_3_self_attn_block_attn_w_q.packed_weight.u8.bin b/layers/decoder_3_self_attn_block_attn_w_q.packed_weight.u8.bin index 288ad448f23f3ff895d3adcddf479c9f0bbf9623..0eda57f18e868b9a63d31445a19e8774249d3825 100644 --- a/layers/decoder_3_self_attn_block_attn_w_q.packed_weight.u8.bin +++ b/layers/decoder_3_self_attn_block_attn_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5492c34a0278505bdc4e822ac0189fcca8b8d729015236b78ae9fd1ddd8784af +oid sha256:8e60525417ba8a8826caa9835f1c73c530c8fa0e6c371461165809f230528161 size 102400 diff --git a/layers/decoder_3_self_attn_block_attn_w_q.scale_values.f32.bin b/layers/decoder_3_self_attn_block_attn_w_q.scale_values.f32.bin index 9009641eca0b4bcf18157dac74e95db02b460f78..6b6e46b0c58428598729cffe0fa26dfb29a5800d 100644 --- a/layers/decoder_3_self_attn_block_attn_w_q.scale_values.f32.bin +++ b/layers/decoder_3_self_attn_block_attn_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:80a3ad5ecce3023ac262c8972e0ae7c26da488b4efbc97d9d37a1e2f69e1ee30 -size 2560 +oid sha256:391c8ae81bf21ea2bcb1244cf9e9ad32d873c5c06b83a7fa75da229fde0fc411 +size 4 diff --git a/layers/decoder_3_self_attn_block_attn_w_v.layout_header.i32.bin b/layers/decoder_3_self_attn_block_attn_w_v.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_3_self_attn_block_attn_w_v.layout_header.i32.bin +++ b/layers/decoder_3_self_attn_block_attn_w_v.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_3_self_attn_block_attn_w_v.packed_weight.u8.bin b/layers/decoder_3_self_attn_block_attn_w_v.packed_weight.u8.bin index 99c698b926b1e518b1326c3e8c4922316fd281cf..e136f13ce5d3b372f89cbd1357e613364d3a8672 100644 --- a/layers/decoder_3_self_attn_block_attn_w_v.packed_weight.u8.bin +++ b/layers/decoder_3_self_attn_block_attn_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1372ee94bdd78746b74f299fadfdb2542584b82e774f2897213c2f80c3d97b0a +oid sha256:9282bfc70ccf622291e17fe2b9d1cee2812e73a66fa8f3aba79369541bff4841 size 102400 diff --git a/layers/decoder_3_self_attn_block_attn_w_v.scale_values.f32.bin b/layers/decoder_3_self_attn_block_attn_w_v.scale_values.f32.bin index 677952efd7436d340d6704c9872fba8fe8c1fdfc..32eb3950f47fcd8fd5570abdc7adf675b6fcc899 100644 --- a/layers/decoder_3_self_attn_block_attn_w_v.scale_values.f32.bin +++ b/layers/decoder_3_self_attn_block_attn_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:39b616adaf778fb8765fa0d429aef8dcaca66563ec1a9bd7b101db0a3ec08ec6 -size 2560 +oid sha256:0564851be9a55276d9a60a6784b8674feaf663ac7fb071f027caa0f244c97071 +size 4 diff --git a/layers/decoder_3_self_attn_block_mlp_w_in.bias.f32.bin b/layers/decoder_3_self_attn_block_mlp_w_in.bias.f32.bin index 3e183e45cd791e50841d6abf2e20156c0dbd2e39..870007d22c818c5257c7fbc8ce6748057fb8690f 100644 --- a/layers/decoder_3_self_attn_block_mlp_w_in.bias.f32.bin +++ b/layers/decoder_3_self_attn_block_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e7fa2b9db048551c93fa33e511d2a04b57b1b699e3c567d7c2013b9acf0fe5c2 +oid sha256:c6f37b9c581395a6b65481f3f77556e773d35842ede2ada8a98604a0b670f648 size 16384 diff --git a/layers/decoder_3_self_attn_block_mlp_w_in.layout_header.i32.bin b/layers/decoder_3_self_attn_block_mlp_w_in.layout_header.i32.bin index dfb09b60c1a463239bdde81ecc9589c186db51be..4f36c34f219a96fe3e8ec8c03b70d02426e7e7cb 100644 --- a/layers/decoder_3_self_attn_block_mlp_w_in.layout_header.i32.bin +++ b/layers/decoder_3_self_attn_block_mlp_w_in.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f +oid sha256:257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee size 52 diff --git a/layers/decoder_3_self_attn_block_mlp_w_in.packed_weight.u8.bin b/layers/decoder_3_self_attn_block_mlp_w_in.packed_weight.u8.bin index 374daf0644bd777daef24f8041525d7078e2df76..262a4c2607f2a8475858c3e33f6de21ac70a435e 100644 --- a/layers/decoder_3_self_attn_block_mlp_w_in.packed_weight.u8.bin +++ b/layers/decoder_3_self_attn_block_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ed0f958756cbd0c9eeb7c7ffab33a2de6bddf84d8d9482d7ca640dde9e1d6dbd +oid sha256:52bff5aede2592e837d1cb076af815d440b21210b384f4cfaab5998155008af1 size 655360 diff --git a/layers/decoder_3_self_attn_block_mlp_w_in.scale_values.f32.bin b/layers/decoder_3_self_attn_block_mlp_w_in.scale_values.f32.bin index 1adf9d0de2092f8c7be8d7cbc3708f308ac322e3..79537db40f8eeea171022e2978c6c4d4d378ca10 100644 --- a/layers/decoder_3_self_attn_block_mlp_w_in.scale_values.f32.bin +++ b/layers/decoder_3_self_attn_block_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f46afa8863a3d2d1734daa2ffefb013a0e16e3d996c118ac27f4d40713a4bfc3 -size 16384 +oid sha256:93bd0593493ea584d8263a622757475f44d54afc26c7e3c8ec3f2be2c6d65e56 +size 4 diff --git a/layers/decoder_3_self_attn_block_mlp_w_out.bias.f32.bin b/layers/decoder_3_self_attn_block_mlp_w_out.bias.f32.bin index 29a7dd53bd67308537d0efd30b0fb15bb6a295f9..f420e3c7a1623ed88dc20ad2d429c014424d642b 100644 --- a/layers/decoder_3_self_attn_block_mlp_w_out.bias.f32.bin +++ b/layers/decoder_3_self_attn_block_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9ef4e426cc678bdc2145f566ca1b752cb5126a1cee5ba1596670727c07102551 +oid sha256:f68950966a1c83f11814cb0f919e4bcef8566c7756be781c635f4042b80cdaa1 size 2560 diff --git a/layers/decoder_3_self_attn_block_mlp_w_out.layout_header.i32.bin b/layers/decoder_3_self_attn_block_mlp_w_out.layout_header.i32.bin index 0e75d07047a66b2c5fdc1a4889b0f4b64984a9e0..bb2fc38f00bb69d3211700402632c7467e412926 100644 --- a/layers/decoder_3_self_attn_block_mlp_w_out.layout_header.i32.bin +++ b/layers/decoder_3_self_attn_block_mlp_w_out.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311 +oid sha256:d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64 size 52 diff --git a/layers/decoder_3_self_attn_block_mlp_w_out.packed_weight.u8.bin b/layers/decoder_3_self_attn_block_mlp_w_out.packed_weight.u8.bin index d3fb65fe202e2040ea04d2443e82af7bf3362798..fdbce64ab054962c80bfaa26a8d158394dccd961 100644 --- a/layers/decoder_3_self_attn_block_mlp_w_out.packed_weight.u8.bin +++ b/layers/decoder_3_self_attn_block_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9add00e6c4822b6e42e9fe755d1e64de6581345ef650c5c3997ffcd5f28972db +oid sha256:b833a34b79e1a6e90a9d5738edc0fd96058669853377212d0b6854f7a115e421 size 327680 diff --git a/layers/decoder_3_self_attn_block_mlp_w_out.scale_values.f32.bin b/layers/decoder_3_self_attn_block_mlp_w_out.scale_values.f32.bin index 89df340e47f4d505d3c4545e49c49fdcad485835..8cbc386e78e0131ce7afe05949f7b39558415644 100644 --- a/layers/decoder_3_self_attn_block_mlp_w_out.scale_values.f32.bin +++ b/layers/decoder_3_self_attn_block_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bd1ba26139a6268ff548cf38f4254585c7cf9705fe8e98e3e466060f130251ae -size 2560 +oid sha256:b660f513eabe0896e1eae74471316b75cf882f2b2ebc96b5d96dc48b117f9b68 +size 4 diff --git a/layers/decoder_4_cross_block_cross_w_k.layout_header.i32.bin b/layers/decoder_4_cross_block_cross_w_k.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_4_cross_block_cross_w_k.layout_header.i32.bin +++ b/layers/decoder_4_cross_block_cross_w_k.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_4_cross_block_cross_w_k.packed_weight.u8.bin b/layers/decoder_4_cross_block_cross_w_k.packed_weight.u8.bin index 53ea465be629dc84fe105b5d1c1f29568c32c9c8..ae057db93f9fef13d40f4e60f542a751b75915ef 100644 --- a/layers/decoder_4_cross_block_cross_w_k.packed_weight.u8.bin +++ b/layers/decoder_4_cross_block_cross_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4c3875278ad62825f74504bb5c9cfbdb3c707607219de5000eb33d8d4bd93523 +oid sha256:31524643e06ef3020f262caef697c874b75e408d9c2f11b749d8a9b1b7e9b843 size 102400 diff --git a/layers/decoder_4_cross_block_cross_w_k.scale_values.f32.bin b/layers/decoder_4_cross_block_cross_w_k.scale_values.f32.bin index 124b87a7a5592ad5fe0da200b76b51e99512fac1..84cec959864c75a0405df0d3d0dc59911d0afc2c 100644 --- a/layers/decoder_4_cross_block_cross_w_k.scale_values.f32.bin +++ b/layers/decoder_4_cross_block_cross_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:33667cf828fc4b0223668f61a4d19df07fc65412645b23d9608986fae8f8299d -size 2560 +oid sha256:3f488d0b11a99264984291678bcb679df9190a00385e4b73e46790555073e217 +size 4 diff --git a/layers/decoder_4_cross_block_cross_w_o.layout_header.i32.bin b/layers/decoder_4_cross_block_cross_w_o.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_4_cross_block_cross_w_o.layout_header.i32.bin +++ b/layers/decoder_4_cross_block_cross_w_o.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_4_cross_block_cross_w_o.packed_weight.u8.bin b/layers/decoder_4_cross_block_cross_w_o.packed_weight.u8.bin index a0c591695cf1d0718147f87d177020cd19caf9eb..acfd9e5773996646fa9dd22bae4f18cd461b673b 100644 --- a/layers/decoder_4_cross_block_cross_w_o.packed_weight.u8.bin +++ b/layers/decoder_4_cross_block_cross_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d779dce49505f8f4796061d9c48b8952f8a2744ef886baaa84762cd1e22e110d +oid sha256:0a03bbbb018fbbb45c3d7587aa68c507ebf5befaf82759c55cf15878a1b17065 size 102400 diff --git a/layers/decoder_4_cross_block_cross_w_o.scale_values.f32.bin b/layers/decoder_4_cross_block_cross_w_o.scale_values.f32.bin index 197080419f051c28d7091b4a0354b17ba4eb60e1..ad6fcff873847a78ee6f54096bd5f4e256fd159e 100644 --- a/layers/decoder_4_cross_block_cross_w_o.scale_values.f32.bin +++ b/layers/decoder_4_cross_block_cross_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f45aba4aa8b028ac833a520a51e9152f61408b8d644cc8be7263db6920f07784 -size 2560 +oid sha256:1da26be124ad087738062d6177cc05257be78c2d2a956abd0bb3b161e7d8b0db +size 4 diff --git a/layers/decoder_4_cross_block_cross_w_q.layout_header.i32.bin b/layers/decoder_4_cross_block_cross_w_q.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_4_cross_block_cross_w_q.layout_header.i32.bin +++ b/layers/decoder_4_cross_block_cross_w_q.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_4_cross_block_cross_w_q.packed_weight.u8.bin b/layers/decoder_4_cross_block_cross_w_q.packed_weight.u8.bin index 0ebb5fae4bf50eadc146eec065cc1ae17b18e491..e7d450850a241ce67774c7c4e48f86bf3131024c 100644 --- a/layers/decoder_4_cross_block_cross_w_q.packed_weight.u8.bin +++ b/layers/decoder_4_cross_block_cross_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ce1a77e60422d32c2f46934a766d426bf038344f2e7ea0c5b0dd7c5c7617aeff +oid sha256:4616bfc7b4ee6594a074bf87afe0b3de1aee8ec0467067e68a90cdb55e4b0893 size 102400 diff --git a/layers/decoder_4_cross_block_cross_w_q.scale_values.f32.bin b/layers/decoder_4_cross_block_cross_w_q.scale_values.f32.bin index 28aa19120209a74431b58da8624f8dc8bc95bc87..800e44df66dc41cb352e8521c2c5f6414dc9e9a6 100644 --- a/layers/decoder_4_cross_block_cross_w_q.scale_values.f32.bin +++ b/layers/decoder_4_cross_block_cross_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bf0662981cf96dd423851b49062f15376ae4902938808056f0d0fbfa35c0e0ad -size 2560 +oid sha256:3a2e3d1ba069ade3259a5f99d9b0bf9224de6ece09c62beea206b23d7b9b1fb7 +size 4 diff --git a/layers/decoder_4_cross_block_cross_w_v.layout_header.i32.bin b/layers/decoder_4_cross_block_cross_w_v.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_4_cross_block_cross_w_v.layout_header.i32.bin +++ b/layers/decoder_4_cross_block_cross_w_v.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_4_cross_block_cross_w_v.packed_weight.u8.bin b/layers/decoder_4_cross_block_cross_w_v.packed_weight.u8.bin index 0e211ede293fd377769cdddfc5583dd4015f2db5..f83ecfc2f8f5a817b13300b8caf1b06115901176 100644 --- a/layers/decoder_4_cross_block_cross_w_v.packed_weight.u8.bin +++ b/layers/decoder_4_cross_block_cross_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:691ee8830941075f454a8bc70497aab974a86e2faa7ec004d05be1b460d26faa +oid sha256:bf7de31509287e5e5fd652f3e15f78ab4fdaa35dc31007011ef6d13d4a78ec3a size 102400 diff --git a/layers/decoder_4_cross_block_cross_w_v.scale_values.f32.bin b/layers/decoder_4_cross_block_cross_w_v.scale_values.f32.bin index 7144b08a95a1c27e359489fe40462a6b9e56c14b..b2be2099ecbb0224ae0cfde5a83813be0b3c98c8 100644 --- a/layers/decoder_4_cross_block_cross_w_v.scale_values.f32.bin +++ b/layers/decoder_4_cross_block_cross_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:756df02cb043bf56b2b6a6c2b49f91415b744a8d9dc48398081f26d671bff9ff -size 2560 +oid sha256:529c7e330c43ee50eead8d189012170c1ec46fb4e33389e614e40ff8f6c36d85 +size 4 diff --git a/layers/decoder_4_cross_block_mlp_w_in.bias.f32.bin b/layers/decoder_4_cross_block_mlp_w_in.bias.f32.bin index c0d18e48edf6a14a4fcc44def5da16643751f77b..0e819d5aecb8fdf306fc78cc4546e0116ccfb1a8 100644 --- a/layers/decoder_4_cross_block_mlp_w_in.bias.f32.bin +++ b/layers/decoder_4_cross_block_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:99c2ddd2ef7cfe781327186d74be769db274772bd22ec56ef8dd2e4d93f2ce20 +oid sha256:1a42e9a422a18d500744229a74c9f4e5d29cbe5f5c29e827ab99eadeb9a4316c size 16384 diff --git a/layers/decoder_4_cross_block_mlp_w_in.layout_header.i32.bin b/layers/decoder_4_cross_block_mlp_w_in.layout_header.i32.bin index dfb09b60c1a463239bdde81ecc9589c186db51be..4f36c34f219a96fe3e8ec8c03b70d02426e7e7cb 100644 --- a/layers/decoder_4_cross_block_mlp_w_in.layout_header.i32.bin +++ b/layers/decoder_4_cross_block_mlp_w_in.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f +oid sha256:257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee size 52 diff --git a/layers/decoder_4_cross_block_mlp_w_in.packed_weight.u8.bin b/layers/decoder_4_cross_block_mlp_w_in.packed_weight.u8.bin index 34822d8a16fbbb99462906ff863ce2d3bed37de3..4d265b1d1cb5fa291ee65906ac0f2810a11689f2 100644 --- a/layers/decoder_4_cross_block_mlp_w_in.packed_weight.u8.bin +++ b/layers/decoder_4_cross_block_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:64bdf33d4af3bb01b77e21ce7b6878be698ade724636a6fa6ebc7af697eb9bc4 +oid sha256:e5dd270c2a9e69b837cfb0bab4b43c57989bf83ce6c15f7b9cca27a32fedacb7 size 655360 diff --git a/layers/decoder_4_cross_block_mlp_w_in.scale_values.f32.bin b/layers/decoder_4_cross_block_mlp_w_in.scale_values.f32.bin index eb1943292c6fdab5bb2e17cbb24fed1f8f9f9838..fce2e910e9522cc6dc5bce98d8e524b32148895e 100644 --- a/layers/decoder_4_cross_block_mlp_w_in.scale_values.f32.bin +++ b/layers/decoder_4_cross_block_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c9ea4cc4f63e9e30e08037ec2717237a21ee76d7382aa25d823713ed9afbe238 -size 16384 +oid sha256:cbd99c99c9af6c3112db595ea710801a67c3b231c89ed68ccd1e211660bf58de +size 4 diff --git a/layers/decoder_4_cross_block_mlp_w_out.bias.f32.bin b/layers/decoder_4_cross_block_mlp_w_out.bias.f32.bin index b676daa3aba3d67d8d4d790cb91c22a7be5fd4da..220c27f6dc5a84ab0a97b31b5e5904aecd79b19b 100644 --- a/layers/decoder_4_cross_block_mlp_w_out.bias.f32.bin +++ b/layers/decoder_4_cross_block_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7698c41fa41db9e931e0866ba25316c02da7112774a03e79089e70b405fd1856 +oid sha256:9e5fd75ca05f0cff37991d42a5a50a5de092708bdeb663d2a9d074fb6e2603a2 size 2560 diff --git a/layers/decoder_4_cross_block_mlp_w_out.layout_header.i32.bin b/layers/decoder_4_cross_block_mlp_w_out.layout_header.i32.bin index 0e75d07047a66b2c5fdc1a4889b0f4b64984a9e0..bb2fc38f00bb69d3211700402632c7467e412926 100644 --- a/layers/decoder_4_cross_block_mlp_w_out.layout_header.i32.bin +++ b/layers/decoder_4_cross_block_mlp_w_out.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311 +oid sha256:d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64 size 52 diff --git a/layers/decoder_4_cross_block_mlp_w_out.packed_weight.u8.bin b/layers/decoder_4_cross_block_mlp_w_out.packed_weight.u8.bin index 302ae9cb4ffeb46619ac6c857900ce8afc6c0260..1d732bf5349f525afd09b52e48f2a87ee524425b 100644 --- a/layers/decoder_4_cross_block_mlp_w_out.packed_weight.u8.bin +++ b/layers/decoder_4_cross_block_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2a9e4d3d7740d4bc4d0bf9c8268544f28dae5c5cfa56120c3566c26c7391afd5 +oid sha256:7ce2e9e96e8008fe75b033c97729382205c3985799b6cd344012cc9273796ff6 size 327680 diff --git a/layers/decoder_4_cross_block_mlp_w_out.scale_values.f32.bin b/layers/decoder_4_cross_block_mlp_w_out.scale_values.f32.bin index 8efc0a13d79280104f420fa03795ce03fd4a65dd..82f20d8400773281e90fb18c93328a07d93043b6 100644 --- a/layers/decoder_4_cross_block_mlp_w_out.scale_values.f32.bin +++ b/layers/decoder_4_cross_block_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a07ee9fa0e3d703f194c12d30d48c1ed2966c42260413329a52a5bd06d31f82a -size 2560 +oid sha256:328ff35703d7b9a3c5c531efc74c40d7e5f0bc5d6590f58974752967e569406e +size 4 diff --git a/layers/decoder_4_self_attn_block_attn_w_k.layout_header.i32.bin b/layers/decoder_4_self_attn_block_attn_w_k.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_4_self_attn_block_attn_w_k.layout_header.i32.bin +++ b/layers/decoder_4_self_attn_block_attn_w_k.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_4_self_attn_block_attn_w_k.packed_weight.u8.bin b/layers/decoder_4_self_attn_block_attn_w_k.packed_weight.u8.bin index 210e5f4909bfb2346dafbe1d52ecaee733dd2e6e..f377e81fc2e2d90b025dd3fdce230c3cd8a8c94b 100644 --- a/layers/decoder_4_self_attn_block_attn_w_k.packed_weight.u8.bin +++ b/layers/decoder_4_self_attn_block_attn_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2c5749cb807ddcc419546bc4eaf90e08426c81bafc0d08f988bb5a0864058884 +oid sha256:91ba999d8060f5a3081c848f64e8b14a7dec437ed842962ede41d18dd1c210aa size 102400 diff --git a/layers/decoder_4_self_attn_block_attn_w_k.scale_values.f32.bin b/layers/decoder_4_self_attn_block_attn_w_k.scale_values.f32.bin index c0a719d92f4e198ad6a7352df82c2c416c2da1db..cce37c1e1beca5f288ddc7a6b740d90c9d5c54ce 100644 --- a/layers/decoder_4_self_attn_block_attn_w_k.scale_values.f32.bin +++ b/layers/decoder_4_self_attn_block_attn_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:54dd0e2297946d77d8c8b5f3dcd7f3c116d90a5b7ed4fe5404e7de7bb749922d -size 2560 +oid sha256:4f2f42b8ce0a5ff7a5211a44e6f071a777df886ba6cfa87b941a3c3ea57048de +size 4 diff --git a/layers/decoder_4_self_attn_block_attn_w_o.layout_header.i32.bin b/layers/decoder_4_self_attn_block_attn_w_o.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_4_self_attn_block_attn_w_o.layout_header.i32.bin +++ b/layers/decoder_4_self_attn_block_attn_w_o.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_4_self_attn_block_attn_w_o.packed_weight.u8.bin b/layers/decoder_4_self_attn_block_attn_w_o.packed_weight.u8.bin index 6008f38b50be67f02353ea427d86889991a7d187..a0d3bc2e0ee7e946a42fed36b5a984022b084d05 100644 --- a/layers/decoder_4_self_attn_block_attn_w_o.packed_weight.u8.bin +++ b/layers/decoder_4_self_attn_block_attn_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:de4d3f36dddec5d85edbd1eea9336de4b84d347253de4e759c539e25e9007040 +oid sha256:a4c4f008decffa7ee25bc837ee608ff3020d840dab661d75ddf158e59ea0c1d8 size 102400 diff --git a/layers/decoder_4_self_attn_block_attn_w_o.scale_values.f32.bin b/layers/decoder_4_self_attn_block_attn_w_o.scale_values.f32.bin index 0008db861ba65f0fb673e9bdec3fc208a818b1d6..7f26cbc651bc872a8288c81f7487c571aa0728ab 100644 --- a/layers/decoder_4_self_attn_block_attn_w_o.scale_values.f32.bin +++ b/layers/decoder_4_self_attn_block_attn_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:dc479e96cc27e74edb0cfb05c035f6c6f135e64e52b61a26b3515a5aa7cd196a -size 2560 +oid sha256:703dc8c734ebcc942733bb5d6e2dde21b48df4829a2c2bf654947ed4dd2e7cd4 +size 4 diff --git a/layers/decoder_4_self_attn_block_attn_w_q.layout_header.i32.bin b/layers/decoder_4_self_attn_block_attn_w_q.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_4_self_attn_block_attn_w_q.layout_header.i32.bin +++ b/layers/decoder_4_self_attn_block_attn_w_q.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_4_self_attn_block_attn_w_q.packed_weight.u8.bin b/layers/decoder_4_self_attn_block_attn_w_q.packed_weight.u8.bin index 74fd33e96f668c18c9a655cc5d0d4617abfacd27..efabe4a820ef9bf2f97cce0f47039e117fdcb4f6 100644 --- a/layers/decoder_4_self_attn_block_attn_w_q.packed_weight.u8.bin +++ b/layers/decoder_4_self_attn_block_attn_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6fddf10d6206a2fda4146574c6e35aafde38ce57ac9d944e8776e45b38640d02 +oid sha256:705018b26a50bfd8f8db2543ba218eee04659da2bd2f670029751cd846a4da00 size 102400 diff --git a/layers/decoder_4_self_attn_block_attn_w_q.scale_values.f32.bin b/layers/decoder_4_self_attn_block_attn_w_q.scale_values.f32.bin index a2b93ff8b6fc2fd34312fdbddfd61ecbf09fa6dd..073b189a93e46f6b2625b673fe8a4b5c3effa999 100644 --- a/layers/decoder_4_self_attn_block_attn_w_q.scale_values.f32.bin +++ b/layers/decoder_4_self_attn_block_attn_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:365d59cde5cde0d76ae1056f9b6f9a7062ea4298ad7846db9ecd6e30fd63a19b -size 2560 +oid sha256:ae7f62151c5884804a9eaddd9fa36f5b4c457d092aba8d78d8154b8eb1ad188d +size 4 diff --git a/layers/decoder_4_self_attn_block_attn_w_v.layout_header.i32.bin b/layers/decoder_4_self_attn_block_attn_w_v.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_4_self_attn_block_attn_w_v.layout_header.i32.bin +++ b/layers/decoder_4_self_attn_block_attn_w_v.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_4_self_attn_block_attn_w_v.packed_weight.u8.bin b/layers/decoder_4_self_attn_block_attn_w_v.packed_weight.u8.bin index dbbd2118eb0812b8cdc9c7699c5f31cd3927dc34..7cbcebe6c0ea1e02bd0d2d540303b8c6af805217 100644 --- a/layers/decoder_4_self_attn_block_attn_w_v.packed_weight.u8.bin +++ b/layers/decoder_4_self_attn_block_attn_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5f0b5bee4f6752aa8804110605497b301456328c3fd8f92f800e5aceb2b58ac8 +oid sha256:b1682806f928cfe008f5ad7cf8a62ff8f31312ee864685836db9469f6e536fe5 size 102400 diff --git a/layers/decoder_4_self_attn_block_attn_w_v.scale_values.f32.bin b/layers/decoder_4_self_attn_block_attn_w_v.scale_values.f32.bin index 81dc626123f993b901a1695c38cfc85f3f471ad1..cabf4cdc1e42e0e336dfc899db90b2be9966365f 100644 --- a/layers/decoder_4_self_attn_block_attn_w_v.scale_values.f32.bin +++ b/layers/decoder_4_self_attn_block_attn_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:34685d4ff05fb0c35a230447f75d913faeae21a103c8bc3731d1f628dc27ceb1 -size 2560 +oid sha256:471259b8b6c1958cdcaf03f3d889ed4269ac077a514397511f7a6826a5dba552 +size 4 diff --git a/layers/decoder_4_self_attn_block_mlp_w_in.bias.f32.bin b/layers/decoder_4_self_attn_block_mlp_w_in.bias.f32.bin index c3509d7399502fd3918466716da3860c3274318e..b17a86b4dcc628512fb5b995f371c8c3ce3d4a8a 100644 --- a/layers/decoder_4_self_attn_block_mlp_w_in.bias.f32.bin +++ b/layers/decoder_4_self_attn_block_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8b0d86432bf25ca0274aea9be29ee3dc8867e07e7cc6fd60373ca8829f0e929b +oid sha256:5548b21f0b218bc045dd0c1ec40ece79f43064b71830d6b91a8e075f07fb9339 size 16384 diff --git a/layers/decoder_4_self_attn_block_mlp_w_in.layout_header.i32.bin b/layers/decoder_4_self_attn_block_mlp_w_in.layout_header.i32.bin index dfb09b60c1a463239bdde81ecc9589c186db51be..4f36c34f219a96fe3e8ec8c03b70d02426e7e7cb 100644 --- a/layers/decoder_4_self_attn_block_mlp_w_in.layout_header.i32.bin +++ b/layers/decoder_4_self_attn_block_mlp_w_in.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f +oid sha256:257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee size 52 diff --git a/layers/decoder_4_self_attn_block_mlp_w_in.packed_weight.u8.bin b/layers/decoder_4_self_attn_block_mlp_w_in.packed_weight.u8.bin index d42bfa82e1ccca729e832b36187ebe1a81a51b3e..04f45bc4ff503fd56457783df83074c31451df80 100644 --- a/layers/decoder_4_self_attn_block_mlp_w_in.packed_weight.u8.bin +++ b/layers/decoder_4_self_attn_block_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:39887530c7398e4ba170dba80b6425c9aed66e6acd35b5364c872f1821263579 +oid sha256:4020ba9b97b8a890b0dee73ef2f31ca49dbb4ad2d80e8498c71e2753c1663876 size 655360 diff --git a/layers/decoder_4_self_attn_block_mlp_w_in.scale_values.f32.bin b/layers/decoder_4_self_attn_block_mlp_w_in.scale_values.f32.bin index ad76bdc44fc2c22ce52bad1694ec5d3e290c072f..65b8b6db89743476ca1cffe61e507218c900ff74 100644 --- a/layers/decoder_4_self_attn_block_mlp_w_in.scale_values.f32.bin +++ b/layers/decoder_4_self_attn_block_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c5e055cd129678d616322fb600fc710f0453ea70c6befb41f6f666dcd898da94 -size 16384 +oid sha256:41f956e7d96fa10803a64f37e87d3c384ce48e2efcd7785468eac768fd0085ae +size 4 diff --git a/layers/decoder_4_self_attn_block_mlp_w_out.bias.f32.bin b/layers/decoder_4_self_attn_block_mlp_w_out.bias.f32.bin index 3a046276a18ff9bd7087875ae858b80f56aaa037..d8a73e644dd09a0b3419746851c5fd72411e722a 100644 --- a/layers/decoder_4_self_attn_block_mlp_w_out.bias.f32.bin +++ b/layers/decoder_4_self_attn_block_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ee2de22f8151f93d09c7d09fc3b523ae0b62a9602b5f06332e3f1b24c56115ba +oid sha256:060cbb3793b9dc02486280df05b2b834e626637b4dfe7838d4b4f159b84f01c0 size 2560 diff --git a/layers/decoder_4_self_attn_block_mlp_w_out.layout_header.i32.bin b/layers/decoder_4_self_attn_block_mlp_w_out.layout_header.i32.bin index 0e75d07047a66b2c5fdc1a4889b0f4b64984a9e0..bb2fc38f00bb69d3211700402632c7467e412926 100644 --- a/layers/decoder_4_self_attn_block_mlp_w_out.layout_header.i32.bin +++ b/layers/decoder_4_self_attn_block_mlp_w_out.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311 +oid sha256:d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64 size 52 diff --git a/layers/decoder_4_self_attn_block_mlp_w_out.packed_weight.u8.bin b/layers/decoder_4_self_attn_block_mlp_w_out.packed_weight.u8.bin index 30c6af5ba62937b620242af07fe37f9db8b73d46..e3fc04e6ef82ebfb1250ff67b60e584d3c2b1748 100644 --- a/layers/decoder_4_self_attn_block_mlp_w_out.packed_weight.u8.bin +++ b/layers/decoder_4_self_attn_block_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:701990d2141da402c51f03194222e1d7260ab6011e694ff0e61fb4eb93ebd6b6 +oid sha256:38cdbedb4b51266fbb4422fc7a9fa03ce073ef2234d51f2f46396bf2ff99520a size 327680 diff --git a/layers/decoder_4_self_attn_block_mlp_w_out.scale_values.f32.bin b/layers/decoder_4_self_attn_block_mlp_w_out.scale_values.f32.bin index 34abb4df0d751d4714b359c1bf531b279d8798e1..98b9e652290c95e2be8b59c42966219d884bc888 100644 --- a/layers/decoder_4_self_attn_block_mlp_w_out.scale_values.f32.bin +++ b/layers/decoder_4_self_attn_block_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8a52afa4fe59d22780b74a03679c037bb852d1136808c38c6f65f1211b4a4911 -size 2560 +oid sha256:1f5504e7f4c1c0adf3cb757f77667111ddec260d2f98562ef5f07124f3bfc39a +size 4 diff --git a/layers/decoder_5_cross_block_cross_w_k.layout_header.i32.bin b/layers/decoder_5_cross_block_cross_w_k.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_5_cross_block_cross_w_k.layout_header.i32.bin +++ b/layers/decoder_5_cross_block_cross_w_k.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_5_cross_block_cross_w_k.packed_weight.u8.bin b/layers/decoder_5_cross_block_cross_w_k.packed_weight.u8.bin index 4f4e9208e1015c248115704eace7e9e4dc67b6d4..03be026eb79efc2a86e477fadb139c429c541145 100644 --- a/layers/decoder_5_cross_block_cross_w_k.packed_weight.u8.bin +++ b/layers/decoder_5_cross_block_cross_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ff57e7d933af1dbeb6ff7608257112e011ef1bb58c1e4550834b4374f300ad80 +oid sha256:8342ee2946efbf8358c5ac1084462bf9bc205d8ba3a861a8e9fc0b0ca27727a4 size 102400 diff --git a/layers/decoder_5_cross_block_cross_w_k.scale_values.f32.bin b/layers/decoder_5_cross_block_cross_w_k.scale_values.f32.bin index 15505467ce2a5b7a0f6766a4dce2535f0b5ffbec..eb12d6b03e8d0805e00c81f719733db7fd9ea6d9 100644 --- a/layers/decoder_5_cross_block_cross_w_k.scale_values.f32.bin +++ b/layers/decoder_5_cross_block_cross_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:eeb881a1d106ad608534ca10ca458ae0abf9e2cac941bfdafe380686025013d6 -size 2560 +oid sha256:57a1556ffa48c12c84a3673f0909b63d09dcc23e63ad61b108718ce87697a20a +size 4 diff --git a/layers/decoder_5_cross_block_cross_w_o.layout_header.i32.bin b/layers/decoder_5_cross_block_cross_w_o.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_5_cross_block_cross_w_o.layout_header.i32.bin +++ b/layers/decoder_5_cross_block_cross_w_o.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_5_cross_block_cross_w_o.packed_weight.u8.bin b/layers/decoder_5_cross_block_cross_w_o.packed_weight.u8.bin index acf052845f8b7853c704d9a808aac96581436df5..68318cbe82e7af1be77d4f848260caf8e013a7c1 100644 --- a/layers/decoder_5_cross_block_cross_w_o.packed_weight.u8.bin +++ b/layers/decoder_5_cross_block_cross_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e267d346a55332f235a935d667179f493c829e90d09a7b2e667452667832d14c +oid sha256:dd328e224e0ced6111c0f60827a3d64cbabd59082f1f45483271d0f73a287aca size 102400 diff --git a/layers/decoder_5_cross_block_cross_w_o.scale_values.f32.bin b/layers/decoder_5_cross_block_cross_w_o.scale_values.f32.bin index 0ad2aff55517a947c5f4176216e4d062cbf01626..7975dd72b4b4d166278027a97665b48fdbf7a3df 100644 --- a/layers/decoder_5_cross_block_cross_w_o.scale_values.f32.bin +++ b/layers/decoder_5_cross_block_cross_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f319c054716b93dce66b0908086acf3c1a07ba5ebc55d15a45a7d54c92050513 -size 2560 +oid sha256:50c843aedcc684ba0a5d6541d3d7a431502dcea46994c8374269112970727833 +size 4 diff --git a/layers/decoder_5_cross_block_cross_w_q.layout_header.i32.bin b/layers/decoder_5_cross_block_cross_w_q.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_5_cross_block_cross_w_q.layout_header.i32.bin +++ b/layers/decoder_5_cross_block_cross_w_q.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_5_cross_block_cross_w_q.packed_weight.u8.bin b/layers/decoder_5_cross_block_cross_w_q.packed_weight.u8.bin index 0f91a6843b4f214ae948f4ca578ad9fac3b5d87c..43c9265aa562e1c6556f62eb507706e5fe62639e 100644 --- a/layers/decoder_5_cross_block_cross_w_q.packed_weight.u8.bin +++ b/layers/decoder_5_cross_block_cross_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c5dcd16f7f9ab08348414c39abab26115e8ff33e36fb7348a2c62b5c413de00b +oid sha256:7b975bb3aa36faa59373a89a11ce871ea2286260d6285d40814516b9e1993580 size 102400 diff --git a/layers/decoder_5_cross_block_cross_w_q.scale_values.f32.bin b/layers/decoder_5_cross_block_cross_w_q.scale_values.f32.bin index 55175ee345dee0b7b017ccc3ab13a6b385a78658..27c07d2e98e612278be442d95cce427c0d19e693 100644 --- a/layers/decoder_5_cross_block_cross_w_q.scale_values.f32.bin +++ b/layers/decoder_5_cross_block_cross_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:22cbf5b9acb47633ab9cb6ad7de2b7165f0c15ee371d274a23b0d2f0203afa34 -size 2560 +oid sha256:7f0e41304cbfd55072ad386c5da6970259e29bd09325c00ea3da3bc9704ee52c +size 4 diff --git a/layers/decoder_5_cross_block_cross_w_v.layout_header.i32.bin b/layers/decoder_5_cross_block_cross_w_v.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_5_cross_block_cross_w_v.layout_header.i32.bin +++ b/layers/decoder_5_cross_block_cross_w_v.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_5_cross_block_cross_w_v.packed_weight.u8.bin b/layers/decoder_5_cross_block_cross_w_v.packed_weight.u8.bin index 11cc5b512208b6a061863a7e75dc769364ee458e..ab40c0ce19a7be6b60ef2eda92d10535a8d1a490 100644 --- a/layers/decoder_5_cross_block_cross_w_v.packed_weight.u8.bin +++ b/layers/decoder_5_cross_block_cross_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e9784b965d55e41ea7f9a3214632e6408dfcbe021404905bdf787e579660e2a4 +oid sha256:9f9eb5e98403ef2ba3df649c0670bf1e3bd7e456b7ec9fe6ff6ae63a546d100d size 102400 diff --git a/layers/decoder_5_cross_block_cross_w_v.scale_values.f32.bin b/layers/decoder_5_cross_block_cross_w_v.scale_values.f32.bin index 655024145b3b4db27cd5f18fa6062a2eb0c8415f..00747fc6de4b4a0b903890bdf4888d48ea800f5f 100644 --- a/layers/decoder_5_cross_block_cross_w_v.scale_values.f32.bin +++ b/layers/decoder_5_cross_block_cross_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:071b5dab363a13142def242b7cb5bd90039646344b14258cdb807ad2cfd50624 -size 2560 +oid sha256:5a2b1b58e2a938ffac91f830ffe24d862d2d1a3f641796a9cccc73871cd89498 +size 4 diff --git a/layers/decoder_5_cross_block_mlp_w_in.bias.f32.bin b/layers/decoder_5_cross_block_mlp_w_in.bias.f32.bin index 93673c9df9b2096e3b032a22715130cca701a4ec..ffe7b063b6e6ae3fdc1a9a93735d41cdeff1c80f 100644 --- a/layers/decoder_5_cross_block_mlp_w_in.bias.f32.bin +++ b/layers/decoder_5_cross_block_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7adbf3be58996a63513302c855e26b50ca5e09f71be5e024856660126d8d18e1 +oid sha256:ebfe00189def83024b2f04f083dc0ca6effe5dcdd379970582cdce4b7461786e size 16384 diff --git a/layers/decoder_5_cross_block_mlp_w_in.layout_header.i32.bin b/layers/decoder_5_cross_block_mlp_w_in.layout_header.i32.bin index dfb09b60c1a463239bdde81ecc9589c186db51be..4f36c34f219a96fe3e8ec8c03b70d02426e7e7cb 100644 --- a/layers/decoder_5_cross_block_mlp_w_in.layout_header.i32.bin +++ b/layers/decoder_5_cross_block_mlp_w_in.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f +oid sha256:257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee size 52 diff --git a/layers/decoder_5_cross_block_mlp_w_in.packed_weight.u8.bin b/layers/decoder_5_cross_block_mlp_w_in.packed_weight.u8.bin index 368344940058d0a31111e7365e077cdf7a80d6e1..ad5cea4bea74bbf40b1f8f03bca71b01d0b74640 100644 --- a/layers/decoder_5_cross_block_mlp_w_in.packed_weight.u8.bin +++ b/layers/decoder_5_cross_block_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4f0b7415b003709bdaadbdad025c40e417708947587b419b4608c51bc954d81d +oid sha256:25d3fdd07478a9fbd57e57775db0038bfa039b15fe323bb8373e5d3d76bf8ec7 size 655360 diff --git a/layers/decoder_5_cross_block_mlp_w_in.scale_values.f32.bin b/layers/decoder_5_cross_block_mlp_w_in.scale_values.f32.bin index 1d53b534ed01bd05ea10af5ef138f2b479262afa..a158a3b47cfb9b8934c9d4a1d42cd7e01823e8ef 100644 --- a/layers/decoder_5_cross_block_mlp_w_in.scale_values.f32.bin +++ b/layers/decoder_5_cross_block_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b6adeb822555f5aa9a5c40afdc2c2189444f687d97124f9d32b4f4f498796b52 -size 16384 +oid sha256:cd530857b08c9fe35b573115654d2b23ab3c2a93b39f9238ca420b40f42ae569 +size 4 diff --git a/layers/decoder_5_cross_block_mlp_w_out.bias.f32.bin b/layers/decoder_5_cross_block_mlp_w_out.bias.f32.bin index c98223723f8758c6333c876b4ca1af5c3d4c04f4..f2535b5051895f59623c07d7300766850cd6d1c9 100644 --- a/layers/decoder_5_cross_block_mlp_w_out.bias.f32.bin +++ b/layers/decoder_5_cross_block_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a01b04fdfe3e63d331eea3a1fdd245621e69e3dee97d9eb4d0df7a4a747c7a1a +oid sha256:9d635dbdf18da4b8934862a8e5105e8056b0dea0d0883c365964d94b1270a236 size 2560 diff --git a/layers/decoder_5_cross_block_mlp_w_out.layout_header.i32.bin b/layers/decoder_5_cross_block_mlp_w_out.layout_header.i32.bin index 0e75d07047a66b2c5fdc1a4889b0f4b64984a9e0..bb2fc38f00bb69d3211700402632c7467e412926 100644 --- a/layers/decoder_5_cross_block_mlp_w_out.layout_header.i32.bin +++ b/layers/decoder_5_cross_block_mlp_w_out.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311 +oid sha256:d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64 size 52 diff --git a/layers/decoder_5_cross_block_mlp_w_out.packed_weight.u8.bin b/layers/decoder_5_cross_block_mlp_w_out.packed_weight.u8.bin index e7baeae971371e4866e9dc4c419eefe5aad93ba2..ea5fe27508bc332b6a72969f18131dd8704f2ab1 100644 --- a/layers/decoder_5_cross_block_mlp_w_out.packed_weight.u8.bin +++ b/layers/decoder_5_cross_block_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fb30694fbf89d6dfa78ccc0bd167365c8264a8aa6988dd4c5cddc872c73e243f +oid sha256:177d7c4bad958d79e536ba68d66d66d0971834ed869f1e5ca49040db4610d56a size 327680 diff --git a/layers/decoder_5_cross_block_mlp_w_out.scale_values.f32.bin b/layers/decoder_5_cross_block_mlp_w_out.scale_values.f32.bin index 939f3ff09ccf46fee2e3de36d3415d716c235799..a57930f3bc1a9a478879ddddf332b5fe2a9b86fe 100644 --- a/layers/decoder_5_cross_block_mlp_w_out.scale_values.f32.bin +++ b/layers/decoder_5_cross_block_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7027d96b72a45c6e83a44a76fc6743262877e6783c965d7b8ba82aaee34fd446 -size 2560 +oid sha256:78c2bae093d73a281404ef5e8e0c1c441f2a4a97e560ef68a4af4c73aee4cc04 +size 4 diff --git a/layers/decoder_5_self_attn_block_attn_w_k.layout_header.i32.bin b/layers/decoder_5_self_attn_block_attn_w_k.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_5_self_attn_block_attn_w_k.layout_header.i32.bin +++ b/layers/decoder_5_self_attn_block_attn_w_k.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_5_self_attn_block_attn_w_k.packed_weight.u8.bin b/layers/decoder_5_self_attn_block_attn_w_k.packed_weight.u8.bin index 109d2a3b8c575cc2993a092494dee323f13718cf..4381eb58247163469cdcd6d80b2d73f92805eb70 100644 --- a/layers/decoder_5_self_attn_block_attn_w_k.packed_weight.u8.bin +++ b/layers/decoder_5_self_attn_block_attn_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c3ef72c857d0463d779455d464cceca3556a5308c6b5cefa85b4e5d2b7036ba4 +oid sha256:43946fb26e7fa4fe90888545317f91ce7dd7dc80339271914038eb7a8a6534e9 size 102400 diff --git a/layers/decoder_5_self_attn_block_attn_w_k.scale_values.f32.bin b/layers/decoder_5_self_attn_block_attn_w_k.scale_values.f32.bin index babf0b9ed205a05ec52c5b7ebcb625e4aa7ce2ab..bc3346e0cfa0916ed7fafc65df035967d80f4cab 100644 --- a/layers/decoder_5_self_attn_block_attn_w_k.scale_values.f32.bin +++ b/layers/decoder_5_self_attn_block_attn_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1696afaa802b7df890080fab4b2148db46aac451061ca56d67971f7eb15ed9ed -size 2560 +oid sha256:a8a5b74730bc699c1734b0f115c2665213f0b9b22f30a3345001554da141996e +size 4 diff --git a/layers/decoder_5_self_attn_block_attn_w_o.layout_header.i32.bin b/layers/decoder_5_self_attn_block_attn_w_o.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_5_self_attn_block_attn_w_o.layout_header.i32.bin +++ b/layers/decoder_5_self_attn_block_attn_w_o.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_5_self_attn_block_attn_w_o.packed_weight.u8.bin b/layers/decoder_5_self_attn_block_attn_w_o.packed_weight.u8.bin index 5fded03dccfb7008e8ef48a4dc81badbae0a0be2..95b3d44fb1ee3285bccf333678035cb7ba3d0358 100644 --- a/layers/decoder_5_self_attn_block_attn_w_o.packed_weight.u8.bin +++ b/layers/decoder_5_self_attn_block_attn_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:67b98a2983d6281d356e2bdee9c55c93ab827279c23438508d8af4f37b78929e +oid sha256:c76e70f5dd66747c201dd205fbbe05881d7f49346e32c6156fc708d13c8c3340 size 102400 diff --git a/layers/decoder_5_self_attn_block_attn_w_o.scale_values.f32.bin b/layers/decoder_5_self_attn_block_attn_w_o.scale_values.f32.bin index 58ed74d49132e351901c366eafed62340d4a4e5a..1d29e357096cffde145217756cec75b6a98d55ff 100644 --- a/layers/decoder_5_self_attn_block_attn_w_o.scale_values.f32.bin +++ b/layers/decoder_5_self_attn_block_attn_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:41f4fe30c5f18229023424b02acfbc5aeca6a33406c3d4102ffe57f437b392cd -size 2560 +oid sha256:959180edcc34bc6313cc1b8af6ec69ff1b5ec9e43a6ad6f0e0af7cd39f2a9cb9 +size 4 diff --git a/layers/decoder_5_self_attn_block_attn_w_q.layout_header.i32.bin b/layers/decoder_5_self_attn_block_attn_w_q.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_5_self_attn_block_attn_w_q.layout_header.i32.bin +++ b/layers/decoder_5_self_attn_block_attn_w_q.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_5_self_attn_block_attn_w_q.packed_weight.u8.bin b/layers/decoder_5_self_attn_block_attn_w_q.packed_weight.u8.bin index 482fb745858e5883d73b41e72366fc5b44479e33..c1227124e45c5d7695d0a4de1afb2e53010189b7 100644 --- a/layers/decoder_5_self_attn_block_attn_w_q.packed_weight.u8.bin +++ b/layers/decoder_5_self_attn_block_attn_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0823d35b6cfc35c11009c68fe3583c980e3a51b6d473194d11e2f378b508ba33 +oid sha256:820c8b917dedfa7b94fd8168a696940b32885dc20a6fb0423506e773efc2284a size 102400 diff --git a/layers/decoder_5_self_attn_block_attn_w_q.scale_values.f32.bin b/layers/decoder_5_self_attn_block_attn_w_q.scale_values.f32.bin index 552428d19163d284b567c8a2d1fb96dcef1dfea0..f2e41ddb42f554622a4b9746e0d8e2491460528d 100644 --- a/layers/decoder_5_self_attn_block_attn_w_q.scale_values.f32.bin +++ b/layers/decoder_5_self_attn_block_attn_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:811c5513fb65eb2a4aa83753c9c60b7201c7e47eae248153fbfce96540ec12f8 -size 2560 +oid sha256:de28049a482ce86e09aae54b4037fb595650cd33e7947abb29e9528019872250 +size 4 diff --git a/layers/decoder_5_self_attn_block_attn_w_v.layout_header.i32.bin b/layers/decoder_5_self_attn_block_attn_w_v.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/decoder_5_self_attn_block_attn_w_v.layout_header.i32.bin +++ b/layers/decoder_5_self_attn_block_attn_w_v.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/decoder_5_self_attn_block_attn_w_v.packed_weight.u8.bin b/layers/decoder_5_self_attn_block_attn_w_v.packed_weight.u8.bin index a95c04753210031b71d4464022fba173271fc101..91b58f38a74494ae63d83bef83bf6c7b288cfbae 100644 --- a/layers/decoder_5_self_attn_block_attn_w_v.packed_weight.u8.bin +++ b/layers/decoder_5_self_attn_block_attn_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:71df327a240d414357000156bc4ce569ccdf02203a8f6c2997c3e994a424fbd3 +oid sha256:e9cd3f10c5ca5524ad7916a8bac067ef9898cf9f53a9b6a6ae15c190a0d71a4e size 102400 diff --git a/layers/decoder_5_self_attn_block_attn_w_v.scale_values.f32.bin b/layers/decoder_5_self_attn_block_attn_w_v.scale_values.f32.bin index 95b601c905b5782aa376b78a099b7fdf50080478..94490ebe6427f4adfd1bd6fd7de54848d6dc5e20 100644 --- a/layers/decoder_5_self_attn_block_attn_w_v.scale_values.f32.bin +++ b/layers/decoder_5_self_attn_block_attn_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7fd4d47d4be6dc31c2add3f32ba8b2d2dd25cd2ba65a472dfc88404dab1e60d8 -size 2560 +oid sha256:dc59d8f713e7157ea3221dba1f622b898c0245dd4d0d34327d920006e3ba09f1 +size 4 diff --git a/layers/decoder_5_self_attn_block_mlp_w_in.bias.f32.bin b/layers/decoder_5_self_attn_block_mlp_w_in.bias.f32.bin index cef8bf9cce1e0cb03d816135a0e61a74bd1efd51..158deee54726481d7861336871fd05f7fd6ed712 100644 --- a/layers/decoder_5_self_attn_block_mlp_w_in.bias.f32.bin +++ b/layers/decoder_5_self_attn_block_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cc2627ea7e1f20f1f0bd4dd22c40a0676b93389dced88ec93f076c04d2977e75 +oid sha256:9c011e158b3eedac0e294b2ded17297c587a790c50b6dc0c5bfdd795fce6e431 size 16384 diff --git a/layers/decoder_5_self_attn_block_mlp_w_in.layout_header.i32.bin b/layers/decoder_5_self_attn_block_mlp_w_in.layout_header.i32.bin index dfb09b60c1a463239bdde81ecc9589c186db51be..4f36c34f219a96fe3e8ec8c03b70d02426e7e7cb 100644 --- a/layers/decoder_5_self_attn_block_mlp_w_in.layout_header.i32.bin +++ b/layers/decoder_5_self_attn_block_mlp_w_in.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f +oid sha256:257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee size 52 diff --git a/layers/decoder_5_self_attn_block_mlp_w_in.packed_weight.u8.bin b/layers/decoder_5_self_attn_block_mlp_w_in.packed_weight.u8.bin index 3b33206cf7ebd9b462e9b566d50b956aacbbc387..832a9a421d490be70771bf56cd26d611c07e35a2 100644 --- a/layers/decoder_5_self_attn_block_mlp_w_in.packed_weight.u8.bin +++ b/layers/decoder_5_self_attn_block_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9f332a3be87df814615bd0c5076861d892480726ae149562978734a69cd89eb5 +oid sha256:324d5b0baa2bd143549f6b876e4847bfb14df87e6f4c5f2ed8c38f80f7a1bd60 size 655360 diff --git a/layers/decoder_5_self_attn_block_mlp_w_in.scale_values.f32.bin b/layers/decoder_5_self_attn_block_mlp_w_in.scale_values.f32.bin index e43d0046ed7efacd331d77d0757024611c73b852..ee693394235eb7d21a74ed038edf4f691edbd89e 100644 --- a/layers/decoder_5_self_attn_block_mlp_w_in.scale_values.f32.bin +++ b/layers/decoder_5_self_attn_block_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:269e730c81acfe542eefe0157297240e1f909ca448d555e6aebf0ec2d22e6d55 -size 16384 +oid sha256:ff71e0cb9e0cbd714cfe53000e4c6693e243b3a528dbea9bbde5a9791fb76cd1 +size 4 diff --git a/layers/decoder_5_self_attn_block_mlp_w_out.bias.f32.bin b/layers/decoder_5_self_attn_block_mlp_w_out.bias.f32.bin index 0b80bc5db5b5e6b5693c5ba1136b4e87e73dd67c..b0922ad50c244aa5fcdcddd24040cd1a3a60a00a 100644 --- a/layers/decoder_5_self_attn_block_mlp_w_out.bias.f32.bin +++ b/layers/decoder_5_self_attn_block_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9ce93bf1e56f8944815bc3feeacd388fae0f0d65a826beacd5f4dbe652ae0a17 +oid sha256:934ef203f64706d6f3980935dca28accf5fff8c05d3595244f878091ea0ef1a7 size 2560 diff --git a/layers/decoder_5_self_attn_block_mlp_w_out.layout_header.i32.bin b/layers/decoder_5_self_attn_block_mlp_w_out.layout_header.i32.bin index 0e75d07047a66b2c5fdc1a4889b0f4b64984a9e0..bb2fc38f00bb69d3211700402632c7467e412926 100644 --- a/layers/decoder_5_self_attn_block_mlp_w_out.layout_header.i32.bin +++ b/layers/decoder_5_self_attn_block_mlp_w_out.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311 +oid sha256:d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64 size 52 diff --git a/layers/decoder_5_self_attn_block_mlp_w_out.packed_weight.u8.bin b/layers/decoder_5_self_attn_block_mlp_w_out.packed_weight.u8.bin index 628e23bbbcba373011f9ec382e935391ad964b44..9d0acdbf898f0fa7396eea1bd867054ae7a4a07c 100644 --- a/layers/decoder_5_self_attn_block_mlp_w_out.packed_weight.u8.bin +++ b/layers/decoder_5_self_attn_block_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c1ee787f01158b228e633fab235a13aed3ab1ef306930d66f5374f1f3639495f +oid sha256:d11e2e2807b998655988a6994f40b12f1147bfcb09e1d212a6ceddf86a8b9d70 size 327680 diff --git a/layers/decoder_5_self_attn_block_mlp_w_out.scale_values.f32.bin b/layers/decoder_5_self_attn_block_mlp_w_out.scale_values.f32.bin index 7030070b8522d1b07a115c11440fb6e1683e425f..6df5f9bef45621e7fc215f785435813fa4e6ddcd 100644 --- a/layers/decoder_5_self_attn_block_mlp_w_out.scale_values.f32.bin +++ b/layers/decoder_5_self_attn_block_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:87656f15f2449f30ce1a19ea2b83134086f71bed5d05923029fae7baff63275c -size 2560 +oid sha256:e57b7781511191ee1c6211206145643aecfeed5fd10e2be8ba5d4a79fda582e9 +size 4 diff --git a/layers/encoder_0_attn_w_k.layout_header.i32.bin b/layers/encoder_0_attn_w_k.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/encoder_0_attn_w_k.layout_header.i32.bin +++ b/layers/encoder_0_attn_w_k.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/encoder_0_attn_w_k.packed_weight.u8.bin b/layers/encoder_0_attn_w_k.packed_weight.u8.bin index b86780633408b85f8070796e5abdfeff72d28edd..8f3b423d761e0c3db15e146655c3d68183ee4101 100644 --- a/layers/encoder_0_attn_w_k.packed_weight.u8.bin +++ b/layers/encoder_0_attn_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d52f992b0910b497849db037dcd3b211399dde003b3d5dc1c4243030aba97bcf +oid sha256:0d358351e42a919e6f41efc8d3d8220d202c7a2592a36b18b1e4039c0312c49d size 102400 diff --git a/layers/encoder_0_attn_w_k.scale_values.f32.bin b/layers/encoder_0_attn_w_k.scale_values.f32.bin index b755ea94953fab31d4fca33000968e4797473dea..3de43f1952844bb84ee9816cc53603efdd46a457 100644 --- a/layers/encoder_0_attn_w_k.scale_values.f32.bin +++ b/layers/encoder_0_attn_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cb8a7e3e25b769081f540e81ace05f88ab7e7bdfe6369c062c4287b4dec83362 -size 2560 +oid sha256:363a2535ff463d2406751ad619b676aaf8f5043f972b10829d70e5c5370541e4 +size 4 diff --git a/layers/encoder_0_attn_w_o.layout_header.i32.bin b/layers/encoder_0_attn_w_o.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/encoder_0_attn_w_o.layout_header.i32.bin +++ b/layers/encoder_0_attn_w_o.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/encoder_0_attn_w_o.packed_weight.u8.bin b/layers/encoder_0_attn_w_o.packed_weight.u8.bin index e902e893d500b68bbe4f8bc5a0d4d852218d022a..32a9b9c7f0841c180d5cd02ee95f1c7044a018b0 100644 --- a/layers/encoder_0_attn_w_o.packed_weight.u8.bin +++ b/layers/encoder_0_attn_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:150c446d048f21dc70c7bf8257c066c366b16c66fbdb6e2e1a1696a7f825f07d +oid sha256:83c19e24982850a0703bc51352e8d2dcf2d9c58cac17c3fb58815327b0117251 size 102400 diff --git a/layers/encoder_0_attn_w_o.scale_values.f32.bin b/layers/encoder_0_attn_w_o.scale_values.f32.bin index 4f716b5c75a67f2b6ff87bdda3306eea6e9adee4..ca77e93d137926244e618da59bdd3524f8b81537 100644 --- a/layers/encoder_0_attn_w_o.scale_values.f32.bin +++ b/layers/encoder_0_attn_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c4ca4bd42c680d34759243aa28d4287d7b9ea25b33cd612cffcf186773e64fe7 -size 2560 +oid sha256:92e6c93ca7bf5dfca57fdc636156023c476dba44daa150855c770b191b2812d0 +size 4 diff --git a/layers/encoder_0_attn_w_q.layout_header.i32.bin b/layers/encoder_0_attn_w_q.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/encoder_0_attn_w_q.layout_header.i32.bin +++ b/layers/encoder_0_attn_w_q.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/encoder_0_attn_w_q.packed_weight.u8.bin b/layers/encoder_0_attn_w_q.packed_weight.u8.bin index 207c1c4e1641f458ad5398e21a49757a19ac6341..407c189ecfda62da8e5c9a963e5bc4e4930bccad 100644 --- a/layers/encoder_0_attn_w_q.packed_weight.u8.bin +++ b/layers/encoder_0_attn_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d7ab06bc015f2be6319e3507d9bc4fc481ee92c5cc2c7c27c42f2fddfdd33497 +oid sha256:951c976f47b39ba620a2703f97b02ed8e753ccd8bb95a9c61ed0911139dd9009 size 102400 diff --git a/layers/encoder_0_attn_w_q.scale_values.f32.bin b/layers/encoder_0_attn_w_q.scale_values.f32.bin index af9b1c9f59b2b89e9b236cfac7113eb4534d1598..41703350a4f30bc5604f9e9327cf4f77bb7928e0 100644 --- a/layers/encoder_0_attn_w_q.scale_values.f32.bin +++ b/layers/encoder_0_attn_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:dff7f19bccf1d55789a281957b398f254a65589e6cb304eb7281f66da102a1ec -size 2560 +oid sha256:58f656d894a6673181860f8ec88093f0a6254b00ce39b1cb1e108f1615e638ab +size 4 diff --git a/layers/encoder_0_attn_w_v.layout_header.i32.bin b/layers/encoder_0_attn_w_v.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/encoder_0_attn_w_v.layout_header.i32.bin +++ b/layers/encoder_0_attn_w_v.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/encoder_0_attn_w_v.packed_weight.u8.bin b/layers/encoder_0_attn_w_v.packed_weight.u8.bin index 4a4a300b0fa9e776626c6f5fbe3bb1dd03bd2f3d..5eaeed3f134d620ed27227299e63407b97918e4f 100644 --- a/layers/encoder_0_attn_w_v.packed_weight.u8.bin +++ b/layers/encoder_0_attn_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:108581897257e33bb4fbc1e55704ca7764944271553d0ddfcc722a18a112521d +oid sha256:5f2fd0f6297addda94dfd003cc2902fbce3b926e9d3ccb9fbf56f118ba987bc8 size 102400 diff --git a/layers/encoder_0_attn_w_v.scale_values.f32.bin b/layers/encoder_0_attn_w_v.scale_values.f32.bin index a9b8cd8f95c02a1e7c43dc04f7eb3f033853a1e9..25372cd53fa79954dcb28ffdc0ca963dcd4ea49f 100644 --- a/layers/encoder_0_attn_w_v.scale_values.f32.bin +++ b/layers/encoder_0_attn_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c7271620555a6f171073cc1282d421ce99c44ac9320608a8eb146546ddc0fa4d -size 2560 +oid sha256:834cb863484c883b449cc141b0d11a1441c8d5d4c6c00b76092e54b1b9726ffd +size 4 diff --git a/layers/encoder_0_mlp_w_in.bias.f32.bin b/layers/encoder_0_mlp_w_in.bias.f32.bin index 08168feb30ef8891883a7702a54fd793eef17eb6..ead6960de9171ec5fae21b03b26f1ea5257adcff 100644 --- a/layers/encoder_0_mlp_w_in.bias.f32.bin +++ b/layers/encoder_0_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0c76a21f7135f7f72f7c900a5774522e72fe8ab934d5ab5fccf1dfc79eca530a +oid sha256:3a2cab48442eaf53044fbe153c8e3688fdd3ec3c035f8edeeaf67d3bcddaf4ff size 16384 diff --git a/layers/encoder_0_mlp_w_in.layout_header.i32.bin b/layers/encoder_0_mlp_w_in.layout_header.i32.bin index dfb09b60c1a463239bdde81ecc9589c186db51be..4f36c34f219a96fe3e8ec8c03b70d02426e7e7cb 100644 --- a/layers/encoder_0_mlp_w_in.layout_header.i32.bin +++ b/layers/encoder_0_mlp_w_in.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f +oid sha256:257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee size 52 diff --git a/layers/encoder_0_mlp_w_in.packed_weight.u8.bin b/layers/encoder_0_mlp_w_in.packed_weight.u8.bin index 8bf292f5322d61f951de17116af14e894dcb5568..674fa3acf782c8c9f2b0ae9df6ba757a5693c249 100644 --- a/layers/encoder_0_mlp_w_in.packed_weight.u8.bin +++ b/layers/encoder_0_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:004d7e5054f2c9e259a2c13919c8df7f5b111c7ee22acca01a704acdd021471c +oid sha256:8084c90cad779fcfbf3a68dd3d751dab75a495d6798f8d125b67ee076582c72a size 655360 diff --git a/layers/encoder_0_mlp_w_in.scale_values.f32.bin b/layers/encoder_0_mlp_w_in.scale_values.f32.bin index 88d4016d846741c30fb087ae565319648fae43d0..02c1c819a6ad7e2fcca6b7dd8d1dd8e28ec4e422 100644 --- a/layers/encoder_0_mlp_w_in.scale_values.f32.bin +++ b/layers/encoder_0_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4214d23605eea19d324210ad68ada5225528050abb903d19acc8a0e3268db8f1 -size 16384 +oid sha256:fc25f4d74c3d8a0be61dd9b7b006c93e806bc6dc048c05e98596e8542c1327c8 +size 4 diff --git a/layers/encoder_0_mlp_w_out.bias.f32.bin b/layers/encoder_0_mlp_w_out.bias.f32.bin index d41da85f468fd006f939063138cd3c9a9dd43158..527e989d1ef91566d8c228d161341c0c2c446b25 100644 --- a/layers/encoder_0_mlp_w_out.bias.f32.bin +++ b/layers/encoder_0_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3645d2a14f59327bfdb2fdb9a25d1fd73f210eb0d09d4ff9c1282216684f8411 +oid sha256:6d95b0054d8d8c155e33665b1fb3c0dd454478ad2a95eba4316160883bdefd47 size 2560 diff --git a/layers/encoder_0_mlp_w_out.layout_header.i32.bin b/layers/encoder_0_mlp_w_out.layout_header.i32.bin index 0e75d07047a66b2c5fdc1a4889b0f4b64984a9e0..bb2fc38f00bb69d3211700402632c7467e412926 100644 --- a/layers/encoder_0_mlp_w_out.layout_header.i32.bin +++ b/layers/encoder_0_mlp_w_out.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311 +oid sha256:d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64 size 52 diff --git a/layers/encoder_0_mlp_w_out.packed_weight.u8.bin b/layers/encoder_0_mlp_w_out.packed_weight.u8.bin index 60fa66021a0b61006e4046860dad277888be378d..1eb16bb162078c0bb7e09a0459bca264ca14790b 100644 --- a/layers/encoder_0_mlp_w_out.packed_weight.u8.bin +++ b/layers/encoder_0_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d1834b3a1cfd59a330317fc20b6e5175e8efbdfb49d0cafe2187bda3da18151b +oid sha256:2b475a637893e79948117383cd9138d44690a04653e49985b355e6e63693a783 size 327680 diff --git a/layers/encoder_0_mlp_w_out.scale_values.f32.bin b/layers/encoder_0_mlp_w_out.scale_values.f32.bin index b3a36bd96875d9fe1d9dac1677840589c3b3e459..45d2f02ce80d6ec51eeb85f00c39c315907dc5de 100644 --- a/layers/encoder_0_mlp_w_out.scale_values.f32.bin +++ b/layers/encoder_0_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:55ae56768383392cdb0ce3dc1cb7e328065bac7b4d564636675908f7c7e2b5dc -size 2560 +oid sha256:827241212e161c00a58bf08aeb8e001a475599cfb6786c2945b15dc39afe3dc7 +size 4 diff --git a/layers/encoder_1_attn_w_k.layout_header.i32.bin b/layers/encoder_1_attn_w_k.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/encoder_1_attn_w_k.layout_header.i32.bin +++ b/layers/encoder_1_attn_w_k.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/encoder_1_attn_w_k.packed_weight.u8.bin b/layers/encoder_1_attn_w_k.packed_weight.u8.bin index 46af50b60eed4aa2b9720ce65d6024518514c788..59fe38d9c74b082bc5a522f1457d54fcf7da91f0 100644 --- a/layers/encoder_1_attn_w_k.packed_weight.u8.bin +++ b/layers/encoder_1_attn_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ab05a077baeb46cdcc1d4aababdf59b5bea3aeffa68d20649de0e9fba1c37655 +oid sha256:27b7e94565efaf4b3c1518f3862c56328a9e2ecb594cdd76f52e8ecd87cbaeb2 size 102400 diff --git a/layers/encoder_1_attn_w_k.scale_values.f32.bin b/layers/encoder_1_attn_w_k.scale_values.f32.bin index 9c3deec55839041658c02f5b4f50784d172132c6..b605d00d3609e305f1c23a2aa45416d677d4b097 100644 --- a/layers/encoder_1_attn_w_k.scale_values.f32.bin +++ b/layers/encoder_1_attn_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5cbbafe639997041e3d9f1af4841ad61ce3fb4a01051527147ffb82ca3d7be5d -size 2560 +oid sha256:8e90310d7f602900c61d1ec0029aa69460d20598de178d6755dd8b6c42b109ba +size 4 diff --git a/layers/encoder_1_attn_w_o.layout_header.i32.bin b/layers/encoder_1_attn_w_o.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/encoder_1_attn_w_o.layout_header.i32.bin +++ b/layers/encoder_1_attn_w_o.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/encoder_1_attn_w_o.packed_weight.u8.bin b/layers/encoder_1_attn_w_o.packed_weight.u8.bin index 11f9f439d44f8c0cd482feca1c8e1a4f7a2da493..b04d79240c774e6da71d3af2b012e6050d4d2a9d 100644 --- a/layers/encoder_1_attn_w_o.packed_weight.u8.bin +++ b/layers/encoder_1_attn_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8983ff941314f11b1763fcf4151acf8b5f253e1edaa1af513393064e51170db2 +oid sha256:e1d4ba087cb7fd9337ad647b9ef35af6ef83ef1a9e2611f177e7e76cec268d67 size 102400 diff --git a/layers/encoder_1_attn_w_o.scale_values.f32.bin b/layers/encoder_1_attn_w_o.scale_values.f32.bin index 810652ecd0e9e7b729deabc164ef0567448113d0..a9c317936a7ae2dffdf4f62434397553bea772f7 100644 --- a/layers/encoder_1_attn_w_o.scale_values.f32.bin +++ b/layers/encoder_1_attn_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:33dbe8951b3b693cdb8142d6eb69c78b4e8759f288cc4a5318104ac02c80b843 -size 2560 +oid sha256:94401ac4905ab9a6a51cd297f505caa81434ed03ba406ef6a8cc3e1759b2dbcd +size 4 diff --git a/layers/encoder_1_attn_w_q.layout_header.i32.bin b/layers/encoder_1_attn_w_q.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/encoder_1_attn_w_q.layout_header.i32.bin +++ b/layers/encoder_1_attn_w_q.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/encoder_1_attn_w_q.packed_weight.u8.bin b/layers/encoder_1_attn_w_q.packed_weight.u8.bin index 988ef5dc11a7868bca5a9b0b5c75c930aaeeac28..3ea902f4dabf0a83eee3730cbf16def49b2f83ca 100644 --- a/layers/encoder_1_attn_w_q.packed_weight.u8.bin +++ b/layers/encoder_1_attn_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:243e87c08f505a34c72a257c31da63f389f0dc9e7709c1f3993b621936c1c5c6 +oid sha256:abe92f5a662e92da5725883968212a2e90a77f05e8499dd0eb5c3134279535cb size 102400 diff --git a/layers/encoder_1_attn_w_q.scale_values.f32.bin b/layers/encoder_1_attn_w_q.scale_values.f32.bin index b2ff700e4a4facd93faef860360194f9b741d19c..49bb85e3b3606634a2c6700ae93891f9e0532836 100644 --- a/layers/encoder_1_attn_w_q.scale_values.f32.bin +++ b/layers/encoder_1_attn_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6c3176454b5a9bc79ffa3a5b1426854dde1075fc8e95df718dbbf1e74c6a1a7d -size 2560 +oid sha256:f92420a0087a6ad79021a64f1300eeb7d53c4146df1e5f92c339fdd606d4808b +size 4 diff --git a/layers/encoder_1_attn_w_v.layout_header.i32.bin b/layers/encoder_1_attn_w_v.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/encoder_1_attn_w_v.layout_header.i32.bin +++ b/layers/encoder_1_attn_w_v.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/encoder_1_attn_w_v.packed_weight.u8.bin b/layers/encoder_1_attn_w_v.packed_weight.u8.bin index 1a2b51145d15cbac4aa869039054f990b1891edd..01936bbb65b84db4afec8ea43805531459cd63a9 100644 --- a/layers/encoder_1_attn_w_v.packed_weight.u8.bin +++ b/layers/encoder_1_attn_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6ba47a4c2c9493d604c2deccdf301f26327fd24aa4f8dea97ad227e1f6079297 +oid sha256:fe4fc47da4a97ad0fd49c5dcbb7175aec7a0d2f7fa4f9f82c2703ca88cd13b76 size 102400 diff --git a/layers/encoder_1_attn_w_v.scale_values.f32.bin b/layers/encoder_1_attn_w_v.scale_values.f32.bin index fa5d295f83a2a90112dc52849153d943574d6e4a..41ea50bb3c825bae6a05b3f44f9f7f6f2a9706a6 100644 --- a/layers/encoder_1_attn_w_v.scale_values.f32.bin +++ b/layers/encoder_1_attn_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7c225f027928a3506f88c02591bdf37ef8024f3facede11ed9b6cca961e01252 -size 2560 +oid sha256:b2efaab082de4926716917ed6472d67ead22eaf2c71ebdcae672069a4acdf9fe +size 4 diff --git a/layers/encoder_1_mlp_w_in.bias.f32.bin b/layers/encoder_1_mlp_w_in.bias.f32.bin index 80369e71c89e88730436b45984efd7865bbefd0a..f26d9732d3acdfc366b610a5e0da1a31654bcd26 100644 --- a/layers/encoder_1_mlp_w_in.bias.f32.bin +++ b/layers/encoder_1_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c0f7ec6b18dc60d7e34e54202e2dfa23161d0d1f9f236dc3793175b36787c33f +oid sha256:025bae5bd7c6d3874c23d1348d4d32d7a5c399e719416f1b22112784599348f0 size 16384 diff --git a/layers/encoder_1_mlp_w_in.layout_header.i32.bin b/layers/encoder_1_mlp_w_in.layout_header.i32.bin index dfb09b60c1a463239bdde81ecc9589c186db51be..4f36c34f219a96fe3e8ec8c03b70d02426e7e7cb 100644 --- a/layers/encoder_1_mlp_w_in.layout_header.i32.bin +++ b/layers/encoder_1_mlp_w_in.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f +oid sha256:257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee size 52 diff --git a/layers/encoder_1_mlp_w_in.packed_weight.u8.bin b/layers/encoder_1_mlp_w_in.packed_weight.u8.bin index d511f861b8671444bb2fbda4305d0c07e63c9a95..b96adf9c5b5efbf5874c691042f4fc8689ef5039 100644 --- a/layers/encoder_1_mlp_w_in.packed_weight.u8.bin +++ b/layers/encoder_1_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2bb3428b472adfc90eb54828a2ead8b0ad6fdf2cc7b66675380493c22b20a62f +oid sha256:97ff605bae210a9b872523f788aa25bf06ae8da80eb62537ac6ba898ab0cd4aa size 655360 diff --git a/layers/encoder_1_mlp_w_in.scale_values.f32.bin b/layers/encoder_1_mlp_w_in.scale_values.f32.bin index 3445e7c1e960e6d82a0abd91ec0d65f933537822..7872341c42242375f88cf68f62c1ca20961c3e98 100644 --- a/layers/encoder_1_mlp_w_in.scale_values.f32.bin +++ b/layers/encoder_1_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f9da662769353c2563a0ede9f3d0c1f5a2c555ba0e0fa7fc44e3e618bd84c67c -size 16384 +oid sha256:b14e688ad3655e5d1c26fc671f68d4911632515459181f058a45f5cc218a7973 +size 4 diff --git a/layers/encoder_1_mlp_w_out.bias.f32.bin b/layers/encoder_1_mlp_w_out.bias.f32.bin index d07015e8f4f863da40418e78939837ba878672f9..5db7d2719241d4114d8d5952b61e9b6037069824 100644 --- a/layers/encoder_1_mlp_w_out.bias.f32.bin +++ b/layers/encoder_1_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:03b3887ae51c6b0037db1fd1f0de55da60433531a813d71fbde60aad3999a919 +oid sha256:44d5985a564ba0032aee0a81b081ba706266d8e085a12c7f44d688918c8f4811 size 2560 diff --git a/layers/encoder_1_mlp_w_out.layout_header.i32.bin b/layers/encoder_1_mlp_w_out.layout_header.i32.bin index 0e75d07047a66b2c5fdc1a4889b0f4b64984a9e0..bb2fc38f00bb69d3211700402632c7467e412926 100644 --- a/layers/encoder_1_mlp_w_out.layout_header.i32.bin +++ b/layers/encoder_1_mlp_w_out.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311 +oid sha256:d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64 size 52 diff --git a/layers/encoder_1_mlp_w_out.packed_weight.u8.bin b/layers/encoder_1_mlp_w_out.packed_weight.u8.bin index eaa78a7491234cb44c3f69639128e20c25a8bd56..dd0edfa94b369b394a9c753ea3ea370d12dd9c4c 100644 --- a/layers/encoder_1_mlp_w_out.packed_weight.u8.bin +++ b/layers/encoder_1_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5f22a3ff9267da588582fb278a582b05fe01b82db9926673cdac0ed2365c01c5 +oid sha256:7742ee5975e591618aabc5105a207b0f78065d02ee41cc6b45ac88df12bb4c1c size 327680 diff --git a/layers/encoder_1_mlp_w_out.scale_values.f32.bin b/layers/encoder_1_mlp_w_out.scale_values.f32.bin index 2aae18031e2b338920b9be1d685ddbb2f834705c..4ea101333c51488f29697b1dc117b2b5fc6e176b 100644 --- a/layers/encoder_1_mlp_w_out.scale_values.f32.bin +++ b/layers/encoder_1_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:87b9271c50947f716a47673bc3d02148b87b5b907984913150bafd5fe213fdbc -size 2560 +oid sha256:d4519cac1203163e20411c81058fcc9e15b2715b873377d9867a23f75a878b8a +size 4 diff --git a/layers/encoder_2_attn_w_k.layout_header.i32.bin b/layers/encoder_2_attn_w_k.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/encoder_2_attn_w_k.layout_header.i32.bin +++ b/layers/encoder_2_attn_w_k.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/encoder_2_attn_w_k.packed_weight.u8.bin b/layers/encoder_2_attn_w_k.packed_weight.u8.bin index db35181baf788b27d4b83fa67ab400231703aa3b..106b3a270000a0faaaa4590c06d703fd1eaf3713 100644 --- a/layers/encoder_2_attn_w_k.packed_weight.u8.bin +++ b/layers/encoder_2_attn_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b3969a8412ef274fdd8d1cdc0e717e65f093fea4b81ea1e4b86946396353282a +oid sha256:32ed7fb622aff2cf751fbd3986344f581380fc2d004517e2b3b7ae111fd31bca size 102400 diff --git a/layers/encoder_2_attn_w_k.scale_values.f32.bin b/layers/encoder_2_attn_w_k.scale_values.f32.bin index 67d45e82a452afca99cffe78cdcb8abd968075c9..57a0e0131721803e5756cdd97818510711560ae8 100644 --- a/layers/encoder_2_attn_w_k.scale_values.f32.bin +++ b/layers/encoder_2_attn_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:23558f8ad5065804514f605ae8632576452de53ce75d1ec1b8dc407891c59f84 -size 2560 +oid sha256:8607a763ae93991b49232ae2fd052fc67c7709ef43d9074d8bd91c940a2f4217 +size 4 diff --git a/layers/encoder_2_attn_w_o.layout_header.i32.bin b/layers/encoder_2_attn_w_o.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/encoder_2_attn_w_o.layout_header.i32.bin +++ b/layers/encoder_2_attn_w_o.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/encoder_2_attn_w_o.packed_weight.u8.bin b/layers/encoder_2_attn_w_o.packed_weight.u8.bin index 842d703e30dc6f6ff65597a5905ab2cfef61d65c..38068583e6fe1a3a7cb2acf7bcfec3f331fdff67 100644 --- a/layers/encoder_2_attn_w_o.packed_weight.u8.bin +++ b/layers/encoder_2_attn_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:47d3496f29a2bd312b933e603109579534f189ac81bb9b85df90ca5489ba1b42 +oid sha256:4cd3154e5a261d3671f9255147f5c7c123b89e391fa8d95d0e0d8f0aee5b6824 size 102400 diff --git a/layers/encoder_2_attn_w_o.scale_values.f32.bin b/layers/encoder_2_attn_w_o.scale_values.f32.bin index c23d5f58003a302eab089a31ed1775d5298cee74..a0c421e751599cc645b9ae2bba873e00846a61c0 100644 --- a/layers/encoder_2_attn_w_o.scale_values.f32.bin +++ b/layers/encoder_2_attn_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f4af4886a665b8eef127c37bed55363902266d84244dccf22aba98b57944a36c -size 2560 +oid sha256:bd285179d72698f1f3ec0a18f279f4656df36d31c859f2b106ec8b01caa99dad +size 4 diff --git a/layers/encoder_2_attn_w_q.layout_header.i32.bin b/layers/encoder_2_attn_w_q.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/encoder_2_attn_w_q.layout_header.i32.bin +++ b/layers/encoder_2_attn_w_q.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/encoder_2_attn_w_q.packed_weight.u8.bin b/layers/encoder_2_attn_w_q.packed_weight.u8.bin index 883ad638becfe6c9a54cedd68a0a7d6d70337a6b..03d05c49bd7d34feb561a56a1b739891d070fcec 100644 --- a/layers/encoder_2_attn_w_q.packed_weight.u8.bin +++ b/layers/encoder_2_attn_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6eb5f07dfaf3775aff9c4d2b6401f2a03dc1d62d7860673cfbbc4503a67ffdf8 +oid sha256:4046b1503f400adae06277ce337563059601462ea3ed824adc1143d2bbae8d25 size 102400 diff --git a/layers/encoder_2_attn_w_q.scale_values.f32.bin b/layers/encoder_2_attn_w_q.scale_values.f32.bin index 231c3983b89cfa09ecb9a9337a204f4c4a449015..62a113a5d7d3b0078f34722db50d5a3ae92f38bd 100644 --- a/layers/encoder_2_attn_w_q.scale_values.f32.bin +++ b/layers/encoder_2_attn_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:35f7c5b339f31018f1c2f6bc9d3d4fc7f583f3bf363748d5c2d0fb2b65358293 -size 2560 +oid sha256:b6a2a79210118706fe89b4ddb96a41eb06075852ab1c209cdcab1652caa3907c +size 4 diff --git a/layers/encoder_2_attn_w_v.layout_header.i32.bin b/layers/encoder_2_attn_w_v.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/encoder_2_attn_w_v.layout_header.i32.bin +++ b/layers/encoder_2_attn_w_v.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/encoder_2_attn_w_v.packed_weight.u8.bin b/layers/encoder_2_attn_w_v.packed_weight.u8.bin index 36301da6c68a4e9b76af962ba789d4ee6e3bc05f..f52d34fe92db33b36e95f94923b12428033f7154 100644 --- a/layers/encoder_2_attn_w_v.packed_weight.u8.bin +++ b/layers/encoder_2_attn_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:df51d4bc08980ab65070ea27f26c7214cf85772646fe3c012d5abb2a38c18c1c +oid sha256:64940ce687d9f5cac4bc5c0ebeedaecb3e8551bfaf05135a27c04b4158b9b9f2 size 102400 diff --git a/layers/encoder_2_attn_w_v.scale_values.f32.bin b/layers/encoder_2_attn_w_v.scale_values.f32.bin index f5a8d8e89a0c853596811d2ac5474577e7945929..ac6c7558323da05185f80c170e42f0442efbd692 100644 --- a/layers/encoder_2_attn_w_v.scale_values.f32.bin +++ b/layers/encoder_2_attn_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9ccbe7a70a3661ec2f4759630383a3d9a55580a8d06df0e9cfecd64fecfc8558 -size 2560 +oid sha256:17eb0fc4ae802ce844e776193fc48d96664c74682bd8ed65f0659401c25ccee2 +size 4 diff --git a/layers/encoder_2_mlp_w_in.bias.f32.bin b/layers/encoder_2_mlp_w_in.bias.f32.bin index c55300e5cfdf44f45c4269b3d01f3969f3d22043..3054fd42dd7aa5be5fd0480dbb4b1a8f60518951 100644 --- a/layers/encoder_2_mlp_w_in.bias.f32.bin +++ b/layers/encoder_2_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5ae3330307450ac03ac34415b7644e09a0e2cb7ad403d1b5f12ab901de109998 +oid sha256:756a058396dc773b98e7fb45c72299bb1402b3a7f4ff319a435fdae1a5a14a0d size 16384 diff --git a/layers/encoder_2_mlp_w_in.layout_header.i32.bin b/layers/encoder_2_mlp_w_in.layout_header.i32.bin index dfb09b60c1a463239bdde81ecc9589c186db51be..4f36c34f219a96fe3e8ec8c03b70d02426e7e7cb 100644 --- a/layers/encoder_2_mlp_w_in.layout_header.i32.bin +++ b/layers/encoder_2_mlp_w_in.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f +oid sha256:257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee size 52 diff --git a/layers/encoder_2_mlp_w_in.packed_weight.u8.bin b/layers/encoder_2_mlp_w_in.packed_weight.u8.bin index 9c45493cbfb0f8f410f4a7200da6dfdf7708baff..9500d132ade6955a2a2e5f95c4f8510968a6094c 100644 --- a/layers/encoder_2_mlp_w_in.packed_weight.u8.bin +++ b/layers/encoder_2_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b786e18f9b0969d9582a9d7ab2c068409064ac30d1ec2233973ff0d7f5348772 +oid sha256:5c27668c24ade7f4989551e3a23c729512fa3399126e8131a9a7c3b7beba93f2 size 655360 diff --git a/layers/encoder_2_mlp_w_in.scale_values.f32.bin b/layers/encoder_2_mlp_w_in.scale_values.f32.bin index 02a5f88b4bc0d4c53b972ffbc09aceffc06354bc..6f92fef71e02546b77917aadc78aba2f48a49c13 100644 --- a/layers/encoder_2_mlp_w_in.scale_values.f32.bin +++ b/layers/encoder_2_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7a8be72029c197396595545fb4c87c3a9537fc1806948f07ab10435af3f6b728 -size 16384 +oid sha256:ea11ebc8e04d3fa09dad49efbb2465b461308a8353d1fddf1008c25cf47b1f49 +size 4 diff --git a/layers/encoder_2_mlp_w_out.bias.f32.bin b/layers/encoder_2_mlp_w_out.bias.f32.bin index aeacc9d27c3dc420e0b2b1835efa5421b0198ac4..14ac064beb110180f59f52f5a214b82f72a0ceb2 100644 --- a/layers/encoder_2_mlp_w_out.bias.f32.bin +++ b/layers/encoder_2_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d8dc575af7db2cc39fdf5088a8b3ddb2ffe120ce316e80589f7d67b39aa626ad +oid sha256:1a85a10eac9d0a55eec02edf2e3b706e87066e836808c100715b883e65689cc5 size 2560 diff --git a/layers/encoder_2_mlp_w_out.layout_header.i32.bin b/layers/encoder_2_mlp_w_out.layout_header.i32.bin index 0e75d07047a66b2c5fdc1a4889b0f4b64984a9e0..bb2fc38f00bb69d3211700402632c7467e412926 100644 --- a/layers/encoder_2_mlp_w_out.layout_header.i32.bin +++ b/layers/encoder_2_mlp_w_out.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311 +oid sha256:d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64 size 52 diff --git a/layers/encoder_2_mlp_w_out.packed_weight.u8.bin b/layers/encoder_2_mlp_w_out.packed_weight.u8.bin index 8d5fa9d5ef91790a57a64b8dcf6a1481fa476773..370f4a15fd7cd6ffa63037c4e215d072e9ec8ea0 100644 --- a/layers/encoder_2_mlp_w_out.packed_weight.u8.bin +++ b/layers/encoder_2_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6575ab2984c61b415323a968cf2ccf84721f33259e0d940a8a6d79a082daecfe +oid sha256:dd26321691449af82d643801b9262dff7365260cc32b665c25dee5889cd4df69 size 327680 diff --git a/layers/encoder_2_mlp_w_out.scale_values.f32.bin b/layers/encoder_2_mlp_w_out.scale_values.f32.bin index dffeb9f2867e372d5fea62fb97cda14ba8a3c373..5142ca31d8f0bd31a7defcfbd69d5fbf269cd7f7 100644 --- a/layers/encoder_2_mlp_w_out.scale_values.f32.bin +++ b/layers/encoder_2_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7db5cc7f85da5f79e2937f9bc4fc646bca21ed4baf75f566ae9cfe7b8105f202 -size 2560 +oid sha256:ca2d4e4c3da8b0e7a0ab688a4883b2040bebf1e22d545576a795c847e5ea2b28 +size 4 diff --git a/layers/encoder_3_attn_w_k.layout_header.i32.bin b/layers/encoder_3_attn_w_k.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/encoder_3_attn_w_k.layout_header.i32.bin +++ b/layers/encoder_3_attn_w_k.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/encoder_3_attn_w_k.packed_weight.u8.bin b/layers/encoder_3_attn_w_k.packed_weight.u8.bin index 9bce889970c0ed1ec6811909961e80f033ee79d2..6c34082e9155ab1deb5db7313ff629f5e453e078 100644 --- a/layers/encoder_3_attn_w_k.packed_weight.u8.bin +++ b/layers/encoder_3_attn_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:60c7759210f429d911ecc35e4b8713aaae9dfd8633f7346bae24f736500afe35 +oid sha256:5a9a3e87cb0ccf9381821b2c13cd09a88996d04fcd808ae3b6313622c9986444 size 102400 diff --git a/layers/encoder_3_attn_w_k.scale_values.f32.bin b/layers/encoder_3_attn_w_k.scale_values.f32.bin index 3372545682072b434d2aaf937e245470d6caa201..8a8df4be3be301eafe1381a75835ee842e1cf042 100644 --- a/layers/encoder_3_attn_w_k.scale_values.f32.bin +++ b/layers/encoder_3_attn_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:896f661939f2fe43a62b13be603f2596dc3df6dd6cd9c0cad1fb2f13105184de -size 2560 +oid sha256:c94e97d5feb0a8acb690700c648981cd8ddadef54399a0a263cb112141cea08d +size 4 diff --git a/layers/encoder_3_attn_w_o.layout_header.i32.bin b/layers/encoder_3_attn_w_o.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/encoder_3_attn_w_o.layout_header.i32.bin +++ b/layers/encoder_3_attn_w_o.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/encoder_3_attn_w_o.packed_weight.u8.bin b/layers/encoder_3_attn_w_o.packed_weight.u8.bin index 0d350e87388ef752feb281e056c6be6e6272ba99..f0c35cdd2bf2b90cbd53dca3c281ae5be4e86b1b 100644 --- a/layers/encoder_3_attn_w_o.packed_weight.u8.bin +++ b/layers/encoder_3_attn_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:de6d38106a582dfc0845e37d832281ca3ec94c62c1a935b35277ad2a793879ca +oid sha256:6291c1abeaaea0b97649438a296d76ceb106575b71884102d3542b00ef05e8c6 size 102400 diff --git a/layers/encoder_3_attn_w_o.scale_values.f32.bin b/layers/encoder_3_attn_w_o.scale_values.f32.bin index e0696fe1d31b8638ba9debf38b4ceafe2446edeb..23db519bde52fa46c457011b541cb878898665e8 100644 --- a/layers/encoder_3_attn_w_o.scale_values.f32.bin +++ b/layers/encoder_3_attn_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1fc6de6742fae87884a5e630e7c409fb39c9d4420875236665543be890a0740e -size 2560 +oid sha256:bd39061fcce791e35176cff9de492ef93343a6c39e27730e241ddedfb549a768 +size 4 diff --git a/layers/encoder_3_attn_w_q.layout_header.i32.bin b/layers/encoder_3_attn_w_q.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/encoder_3_attn_w_q.layout_header.i32.bin +++ b/layers/encoder_3_attn_w_q.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/encoder_3_attn_w_q.packed_weight.u8.bin b/layers/encoder_3_attn_w_q.packed_weight.u8.bin index 4c8199556a25e90d209c3844a6266760d8776a8e..146eae7ebac54fabc69dc5f3e51d63d970eb95c7 100644 --- a/layers/encoder_3_attn_w_q.packed_weight.u8.bin +++ b/layers/encoder_3_attn_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:43c4f0d6d23b5af6fe7c2c3e1b109c2055490098b3fc31683a550a43f059e298 +oid sha256:baa0d119c263884f0022dff7e7e4020996ea2c91c9912f568f2ede5559432027 size 102400 diff --git a/layers/encoder_3_attn_w_q.scale_values.f32.bin b/layers/encoder_3_attn_w_q.scale_values.f32.bin index 410a325cf4428aecce777f069faca21d90eeb525..97adbdcf542f508c8ec04808da791726834f9055 100644 --- a/layers/encoder_3_attn_w_q.scale_values.f32.bin +++ b/layers/encoder_3_attn_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f63de5f104f49da4f9ad4b052a01e94ab70ac250f4ebfc81dfb804932d434cec -size 2560 +oid sha256:adad57af78e9167da8b4e5855e46083456100ffd1ed101e0f84074e9496c7d27 +size 4 diff --git a/layers/encoder_3_attn_w_v.layout_header.i32.bin b/layers/encoder_3_attn_w_v.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/encoder_3_attn_w_v.layout_header.i32.bin +++ b/layers/encoder_3_attn_w_v.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/encoder_3_attn_w_v.packed_weight.u8.bin b/layers/encoder_3_attn_w_v.packed_weight.u8.bin index ee44903b3096239a39fc1c8b39feda06f3fe6b54..89249e1ebb56c4eaaa06506998507590c473691a 100644 --- a/layers/encoder_3_attn_w_v.packed_weight.u8.bin +++ b/layers/encoder_3_attn_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4a6340999dbfd52b72ac1c8ab26ea8981e2d66638afde19e3498caff88eb74e8 +oid sha256:2bd7d1359728efce205ef25d36c8d47b7ded204343a3074ca03ad64bb485ae42 size 102400 diff --git a/layers/encoder_3_attn_w_v.scale_values.f32.bin b/layers/encoder_3_attn_w_v.scale_values.f32.bin index 4dc3e3190dce004e2f9d6cfdd7520d51651e2bc7..2a0e6d3bd5e2711d87bbc687e872d8a14f01d5f0 100644 --- a/layers/encoder_3_attn_w_v.scale_values.f32.bin +++ b/layers/encoder_3_attn_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b02dd07f237f832e50c41bd2e400e30bf13f7dccea1ab1befef78c76d342da95 -size 2560 +oid sha256:f7b3d178706d789bfbc5ed3419c8abdfce30d733cd967d5a7ce3f92560ecb7aa +size 4 diff --git a/layers/encoder_3_mlp_w_in.bias.f32.bin b/layers/encoder_3_mlp_w_in.bias.f32.bin index ddc96725b3c5b60a668ba055616a2885a245d6db..091b4f43a2dd2592cbf03a05b7f5856080a4ec53 100644 --- a/layers/encoder_3_mlp_w_in.bias.f32.bin +++ b/layers/encoder_3_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:92a57bf5d82d7f0babb971567adbc2dfef3ca28e891a80ee8ac7813419886e91 +oid sha256:fd93590315d0550dadb82709589d499011558085fe7f42aa87a41a87c2742e9f size 16384 diff --git a/layers/encoder_3_mlp_w_in.layout_header.i32.bin b/layers/encoder_3_mlp_w_in.layout_header.i32.bin index dfb09b60c1a463239bdde81ecc9589c186db51be..4f36c34f219a96fe3e8ec8c03b70d02426e7e7cb 100644 --- a/layers/encoder_3_mlp_w_in.layout_header.i32.bin +++ b/layers/encoder_3_mlp_w_in.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f +oid sha256:257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee size 52 diff --git a/layers/encoder_3_mlp_w_in.packed_weight.u8.bin b/layers/encoder_3_mlp_w_in.packed_weight.u8.bin index 67921b1d32b2e7be3ca9e9869d0e53b779e40025..af94632008d6de220aaef5f6a1bbe835009ef1d7 100644 --- a/layers/encoder_3_mlp_w_in.packed_weight.u8.bin +++ b/layers/encoder_3_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:11aae0a6d3a6390a198d014591584419c976d321d86324e2289c322c061878dd +oid sha256:8b117e51f471d478c8c5da5e498e0635c1ce74b32e75e4d923b6485ea87353da size 655360 diff --git a/layers/encoder_3_mlp_w_in.scale_values.f32.bin b/layers/encoder_3_mlp_w_in.scale_values.f32.bin index 6d21b4727411baa85d3ddba4ebd14cffcc6ef970..be020300e1942af581af12a50b581bceb9568add 100644 --- a/layers/encoder_3_mlp_w_in.scale_values.f32.bin +++ b/layers/encoder_3_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:68a6035063d24067df5d569aa4702b2ec33e402ac4396206eba32bbebacefcdf -size 16384 +oid sha256:49e75f99e2d5f25276cbb411044e6acc42c8b520b449a0e88d0f36927fdb3b9b +size 4 diff --git a/layers/encoder_3_mlp_w_out.bias.f32.bin b/layers/encoder_3_mlp_w_out.bias.f32.bin index 8e92628434c19bfc384565bdb13b4b96193289c9..15296d365e08149f63b4e1c52b9b26b81c3beb79 100644 --- a/layers/encoder_3_mlp_w_out.bias.f32.bin +++ b/layers/encoder_3_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:28cb43daae4e8a25875c6cda35e6386f889703430a87333fae4bd8be9dea69b4 +oid sha256:0f4777ca7ed1def47f66c0c13245e859f585b3401bff9b2fc0692869bcf6c3b8 size 2560 diff --git a/layers/encoder_3_mlp_w_out.layout_header.i32.bin b/layers/encoder_3_mlp_w_out.layout_header.i32.bin index 0e75d07047a66b2c5fdc1a4889b0f4b64984a9e0..bb2fc38f00bb69d3211700402632c7467e412926 100644 --- a/layers/encoder_3_mlp_w_out.layout_header.i32.bin +++ b/layers/encoder_3_mlp_w_out.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311 +oid sha256:d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64 size 52 diff --git a/layers/encoder_3_mlp_w_out.packed_weight.u8.bin b/layers/encoder_3_mlp_w_out.packed_weight.u8.bin index 23a4c79caf5dd70b4f1b510d04f4fcfaccc7ba9e..ccda21a748c8a50b99ad56bfbf253c7d2bc0cd68 100644 --- a/layers/encoder_3_mlp_w_out.packed_weight.u8.bin +++ b/layers/encoder_3_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e9b02f483fb6df052ea1fcb6ff5d088de525d94cf94fe964839eaaf7926c400e +oid sha256:3ddab3f329beb5d19a28e69aef00ac69b708a6696f78e84254033d362b4cff02 size 327680 diff --git a/layers/encoder_3_mlp_w_out.scale_values.f32.bin b/layers/encoder_3_mlp_w_out.scale_values.f32.bin index 2b81725c83fe6efc65b9992ecfc46c995106537b..4a38596d5943df0453ebbc2f9b781eb520713c3c 100644 --- a/layers/encoder_3_mlp_w_out.scale_values.f32.bin +++ b/layers/encoder_3_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:37e993462b64df0e8a791fc642c905c6cd95740fcbe052de7b27df97e5808bb7 -size 2560 +oid sha256:fc14d3937542e30e559658d7b9bb2377fd78c81771e3f3e7cc20c690648ea7b4 +size 4 diff --git a/layers/encoder_4_attn_w_k.layout_header.i32.bin b/layers/encoder_4_attn_w_k.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/encoder_4_attn_w_k.layout_header.i32.bin +++ b/layers/encoder_4_attn_w_k.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/encoder_4_attn_w_k.packed_weight.u8.bin b/layers/encoder_4_attn_w_k.packed_weight.u8.bin index 35c4d414597a3f7ca94cafe4802c80f344b66c11..d2f093e15c6e353dc8b83af106c28a0c2328d39f 100644 --- a/layers/encoder_4_attn_w_k.packed_weight.u8.bin +++ b/layers/encoder_4_attn_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c8d53dfc417dbd95009affeda84ee76f88467621e5a13e4057ff3345ff818c87 +oid sha256:10a703b02e24bbfaf3495bc1425befd4a89e9c6f09744e2a1c0706355cbcbeec size 102400 diff --git a/layers/encoder_4_attn_w_k.scale_values.f32.bin b/layers/encoder_4_attn_w_k.scale_values.f32.bin index 9c9fe80d1c8941f943878c45addfca8d4721cd71..a97e498f52d4a7da74bf2b0fca9354aa4499e506 100644 --- a/layers/encoder_4_attn_w_k.scale_values.f32.bin +++ b/layers/encoder_4_attn_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a9089ee1b7185ccabf994b5f70eab40a93fb3ddc973499c59cd11aa34519029e -size 2560 +oid sha256:531f130bb155c8228c57f8775050b5bc55fe608c07b428bc621c7a2397638773 +size 4 diff --git a/layers/encoder_4_attn_w_o.layout_header.i32.bin b/layers/encoder_4_attn_w_o.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/encoder_4_attn_w_o.layout_header.i32.bin +++ b/layers/encoder_4_attn_w_o.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/encoder_4_attn_w_o.packed_weight.u8.bin b/layers/encoder_4_attn_w_o.packed_weight.u8.bin index 0d269006e91ff2776966b3c04ee6a8eaca0539b6..a5b339ca826767360de5a5f1791b61a844413b2d 100644 --- a/layers/encoder_4_attn_w_o.packed_weight.u8.bin +++ b/layers/encoder_4_attn_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1ff8d4a4f1b91665ca3a74d58fb90619d67a383655a392ab2d1402ab4584af26 +oid sha256:a94d196e77a98f4ed95df7a9102b2991e536dc5f3071302b1a497fce6d5de673 size 102400 diff --git a/layers/encoder_4_attn_w_o.scale_values.f32.bin b/layers/encoder_4_attn_w_o.scale_values.f32.bin index 0c1b94e8af853f0b39f6260ec3ac315162cd781c..e9eeaababd7734f88d760050e13a6636c7a2d271 100644 --- a/layers/encoder_4_attn_w_o.scale_values.f32.bin +++ b/layers/encoder_4_attn_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7900c5f4c08328434107eeb6a977d3e52e24d2e6e03ddd12ff960db27586c30b -size 2560 +oid sha256:65dafd5676fdc4978472be0e5ffecd6e5ec5549fb6d5664b79e8d02e4cd0878d +size 4 diff --git a/layers/encoder_4_attn_w_q.layout_header.i32.bin b/layers/encoder_4_attn_w_q.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/encoder_4_attn_w_q.layout_header.i32.bin +++ b/layers/encoder_4_attn_w_q.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/encoder_4_attn_w_q.packed_weight.u8.bin b/layers/encoder_4_attn_w_q.packed_weight.u8.bin index d785afdb23152d83ed03a0383222e327cdcdf1ab..955fcac36dc7a86e2c89681ad42885cbd1d9b5a9 100644 --- a/layers/encoder_4_attn_w_q.packed_weight.u8.bin +++ b/layers/encoder_4_attn_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d13a5cc5326e6b273e9af183087beca2cb322d8116c7424480aee6bb815b79f4 +oid sha256:728a805cfca6f97949f88c31871ef1be00603a46d9bf20fbbeaf9a63ecd92167 size 102400 diff --git a/layers/encoder_4_attn_w_q.scale_values.f32.bin b/layers/encoder_4_attn_w_q.scale_values.f32.bin index 730e506ce54c8f26f66522d439b3171f689b8365..e9a3646a8d1b5d8f2d87659a5c9ec939943a804f 100644 --- a/layers/encoder_4_attn_w_q.scale_values.f32.bin +++ b/layers/encoder_4_attn_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2eb000a73abd37c474f2fa50f53e25d2d44c91929890d30b919c9ec8539a688c -size 2560 +oid sha256:3b9e454e60a6a13e5102da4c03d527762bcf2b9bf12d486e799d61c3658c8dcd +size 4 diff --git a/layers/encoder_4_attn_w_v.layout_header.i32.bin b/layers/encoder_4_attn_w_v.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/encoder_4_attn_w_v.layout_header.i32.bin +++ b/layers/encoder_4_attn_w_v.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/encoder_4_attn_w_v.packed_weight.u8.bin b/layers/encoder_4_attn_w_v.packed_weight.u8.bin index d1946e1e8bd04b127feb63c8f8d682cd405286d1..5e5368031d058d5a3fcb4cf3ea1b7790598bb355 100644 --- a/layers/encoder_4_attn_w_v.packed_weight.u8.bin +++ b/layers/encoder_4_attn_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:02584e448294863bcbe19188adf9a6674b1428b823a0c8711bb88de01091c1ce +oid sha256:e5d4f475baae4060d3cc5a3a82f3a52ad92447d23710c3bb3577d99a02ce890d size 102400 diff --git a/layers/encoder_4_attn_w_v.scale_values.f32.bin b/layers/encoder_4_attn_w_v.scale_values.f32.bin index 64f691cb0931f2c0b2a54e5475e771a0e7be4cec..c827aba161ebb721e9f4aaca18371927139c793a 100644 --- a/layers/encoder_4_attn_w_v.scale_values.f32.bin +++ b/layers/encoder_4_attn_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:460bbf25434d9c7ad6edfed3c3c4f1f5ad70c7062666f2348fbd85b16932a5ff -size 2560 +oid sha256:8dc5c14c4a1ce0a7eda48fedb3496c154e2fd035b372b8c1fbb67ebfcbc3ad95 +size 4 diff --git a/layers/encoder_4_mlp_w_in.bias.f32.bin b/layers/encoder_4_mlp_w_in.bias.f32.bin index c1a3bf8af5e0aa53a67aadd9ee060fb2fd1dd4f0..817eab5b9e864a0732342b106f564fba6bb651e7 100644 --- a/layers/encoder_4_mlp_w_in.bias.f32.bin +++ b/layers/encoder_4_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:99053239c0447eb027095c62e66ac96c7ff6ff914c491bafb83b114bc3733c19 +oid sha256:1895bd3a783cadcce33598fd40adbec1468989bfb911673a0fb315883e21647e size 16384 diff --git a/layers/encoder_4_mlp_w_in.layout_header.i32.bin b/layers/encoder_4_mlp_w_in.layout_header.i32.bin index dfb09b60c1a463239bdde81ecc9589c186db51be..4f36c34f219a96fe3e8ec8c03b70d02426e7e7cb 100644 --- a/layers/encoder_4_mlp_w_in.layout_header.i32.bin +++ b/layers/encoder_4_mlp_w_in.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f +oid sha256:257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee size 52 diff --git a/layers/encoder_4_mlp_w_in.packed_weight.u8.bin b/layers/encoder_4_mlp_w_in.packed_weight.u8.bin index 4c82cea64ae0fc435ff15182877f5660bfc5cd38..cf712baca10739bafafaa4a76c6b14e53827f5b5 100644 --- a/layers/encoder_4_mlp_w_in.packed_weight.u8.bin +++ b/layers/encoder_4_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e7149c7d3ff509391cdba5af5d102429a7d235e1d41d582ea3565dabc7fee453 +oid sha256:9d3742046e3c417116c43c76a09c313d31979170bd39d42a5dde6f0a7e9ad08c size 655360 diff --git a/layers/encoder_4_mlp_w_in.scale_values.f32.bin b/layers/encoder_4_mlp_w_in.scale_values.f32.bin index 1cd103d9678b0e535fb09680adf8ae49e08c4baf..d32625fc5f2f3f0a530a7ccfbe38eab8b31c9c9a 100644 --- a/layers/encoder_4_mlp_w_in.scale_values.f32.bin +++ b/layers/encoder_4_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:493293bce6191f6df816e466933ff0c061273c1cec8d0fdd103131507cb21591 -size 16384 +oid sha256:88b516eb6de001eed4819d59a8e8af51f48eabf45e0e08400cf7351198e404b8 +size 4 diff --git a/layers/encoder_4_mlp_w_out.bias.f32.bin b/layers/encoder_4_mlp_w_out.bias.f32.bin index b4d9cdc69c742c027cae840353786b480ec0a7b8..dbca2910dc95108914a5b0077c0b13030b088ce6 100644 --- a/layers/encoder_4_mlp_w_out.bias.f32.bin +++ b/layers/encoder_4_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:37d72c03868b46c203a0550dc208cfc4fc89cfc963272e602a9f9114749453a2 +oid sha256:a37f53e3778a72816f2020f1e2e74ce0387bf8f7f1894bcb5e21337b17a975a5 size 2560 diff --git a/layers/encoder_4_mlp_w_out.layout_header.i32.bin b/layers/encoder_4_mlp_w_out.layout_header.i32.bin index 0e75d07047a66b2c5fdc1a4889b0f4b64984a9e0..bb2fc38f00bb69d3211700402632c7467e412926 100644 --- a/layers/encoder_4_mlp_w_out.layout_header.i32.bin +++ b/layers/encoder_4_mlp_w_out.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311 +oid sha256:d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64 size 52 diff --git a/layers/encoder_4_mlp_w_out.packed_weight.u8.bin b/layers/encoder_4_mlp_w_out.packed_weight.u8.bin index d1e42a364de20961da530bf18388291303f7fd47..c2a9c68c43d6f25321cdb1fb34e5ba70354d0391 100644 --- a/layers/encoder_4_mlp_w_out.packed_weight.u8.bin +++ b/layers/encoder_4_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:97c0df1606d2c2170c3fc4a0fa68777a6be93cc63d11641a113ddd144a69a803 +oid sha256:cb2919b644968c18f3d8d07f4a7c2dff37300f3a19ca9252d608515e27356843 size 327680 diff --git a/layers/encoder_4_mlp_w_out.scale_values.f32.bin b/layers/encoder_4_mlp_w_out.scale_values.f32.bin index 310e7ce6a185eefbd7569b48cb100953fbf49288..f7f323a381aa3ac52b0d7b3d205a6a7f15366c10 100644 --- a/layers/encoder_4_mlp_w_out.scale_values.f32.bin +++ b/layers/encoder_4_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9183e05de7aa601048f5715c1e04220ef4509b9db1a48afff7ed161c1f2fc910 -size 2560 +oid sha256:acf932162b73f02f4dac3a61e9fbb063804e282e457542dcb81087ac0288e496 +size 4 diff --git a/layers/encoder_5_attn_w_k.layout_header.i32.bin b/layers/encoder_5_attn_w_k.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/encoder_5_attn_w_k.layout_header.i32.bin +++ b/layers/encoder_5_attn_w_k.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/encoder_5_attn_w_k.packed_weight.u8.bin b/layers/encoder_5_attn_w_k.packed_weight.u8.bin index cf76f94d6c85052018f00b70a40a99aa29d69bbc..9e971bef6e84cdb081824c50b26dfc985588739b 100644 --- a/layers/encoder_5_attn_w_k.packed_weight.u8.bin +++ b/layers/encoder_5_attn_w_k.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:033c651731ecdcf3c309d6473c4f1597fa590b092540f0cefdca861befe49eed +oid sha256:6050252cdefae7097fef44b72a46832ef84555bf3129e31fb1706699b54fb993 size 102400 diff --git a/layers/encoder_5_attn_w_k.scale_values.f32.bin b/layers/encoder_5_attn_w_k.scale_values.f32.bin index 5704848c572032a1dd481dca79d5f591df1eed79..c6d644ed0cf339dbbfdd8a8172434fa07c87fcc6 100644 --- a/layers/encoder_5_attn_w_k.scale_values.f32.bin +++ b/layers/encoder_5_attn_w_k.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:796fd982b5307ac8adc45a87b35fedf54cfa422ccc8e3e41b60f8009e45e3697 -size 2560 +oid sha256:821f63202f456185ca334f8df5549720d54d696d62ed9ae84dfe0ba200913545 +size 4 diff --git a/layers/encoder_5_attn_w_o.layout_header.i32.bin b/layers/encoder_5_attn_w_o.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/encoder_5_attn_w_o.layout_header.i32.bin +++ b/layers/encoder_5_attn_w_o.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/encoder_5_attn_w_o.packed_weight.u8.bin b/layers/encoder_5_attn_w_o.packed_weight.u8.bin index e20059ff160da09ceb34cdc696d3c01430c4ce28..a1c66e5c74c1848af40fb2a84780d3fe9563cc9f 100644 --- a/layers/encoder_5_attn_w_o.packed_weight.u8.bin +++ b/layers/encoder_5_attn_w_o.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a443fcae9400696e87049635cedfec342aee78caa3c2c4a773c23bc7554c9324 +oid sha256:0c9021bc8c3337e9e07cdeac52581df7895492820dd4c39aa2a8fa0a170e21a0 size 102400 diff --git a/layers/encoder_5_attn_w_o.scale_values.f32.bin b/layers/encoder_5_attn_w_o.scale_values.f32.bin index 2d725eb7372bf1b67cc93ded6cc4e9fbfb1fee15..68e2d3326ac37d4723994c0f19cdcdfeb4485358 100644 --- a/layers/encoder_5_attn_w_o.scale_values.f32.bin +++ b/layers/encoder_5_attn_w_o.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1dcb875baa0c7acf4f19cec6638a5f604f16fef674780d3a5fd83fabda38a5b1 -size 2560 +oid sha256:79dcab88153ccd85a92bf06a820212da7514276d13c9d246b383731a60ad4278 +size 4 diff --git a/layers/encoder_5_attn_w_q.layout_header.i32.bin b/layers/encoder_5_attn_w_q.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/encoder_5_attn_w_q.layout_header.i32.bin +++ b/layers/encoder_5_attn_w_q.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/encoder_5_attn_w_q.packed_weight.u8.bin b/layers/encoder_5_attn_w_q.packed_weight.u8.bin index 6fee44dc4acd5c7215d8edbe3072f4ff53c73e23..9dd19d1e9c4174eb503bdb0a49ff96d4a3788806 100644 --- a/layers/encoder_5_attn_w_q.packed_weight.u8.bin +++ b/layers/encoder_5_attn_w_q.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b99d0e715a452c6efce69fcbdb8eceade7864e7d19c189fc55a4f0ef614e593b +oid sha256:7dd4d44c1ffabf832cb1a2de16b9fe41eda6fdab014995e14d8e985656429fef size 102400 diff --git a/layers/encoder_5_attn_w_q.scale_values.f32.bin b/layers/encoder_5_attn_w_q.scale_values.f32.bin index da8b59742067936dc8607adee7dd89c3c894163e..a1aba102d49f63b0d05cb0c644bf47da788f2dd7 100644 --- a/layers/encoder_5_attn_w_q.scale_values.f32.bin +++ b/layers/encoder_5_attn_w_q.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4f9b137787662c0645bf2d15231874a41d42101fb6c753ff543f1b4a06c598d0 -size 2560 +oid sha256:7624e04915864961ee93653aa33a552ae72de0f333aac4bb5070ee12d3164a02 +size 4 diff --git a/layers/encoder_5_attn_w_v.layout_header.i32.bin b/layers/encoder_5_attn_w_v.layout_header.i32.bin index 9a0728fafd35754a01b6a5aeff5ba28a8013c582..b8ef9620a421174f06ae9d2e7db8bfca8a867811 100644 --- a/layers/encoder_5_attn_w_v.layout_header.i32.bin +++ b/layers/encoder_5_attn_w_v.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4 +oid sha256:849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914 size 52 diff --git a/layers/encoder_5_attn_w_v.packed_weight.u8.bin b/layers/encoder_5_attn_w_v.packed_weight.u8.bin index 8fd07695677ee6f19da142400118cf5388033b61..fb5c4e96283d2cc70e57df639e252be4bb9b04b4 100644 --- a/layers/encoder_5_attn_w_v.packed_weight.u8.bin +++ b/layers/encoder_5_attn_w_v.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d87031bdf3e41ea52362d83567809bff5110295124ee8e91f5f6e5a1e35645ed +oid sha256:e53e30cf99dfb375124f09e4aafd8f94d002f350320d64ed184535c6494d67f7 size 102400 diff --git a/layers/encoder_5_attn_w_v.scale_values.f32.bin b/layers/encoder_5_attn_w_v.scale_values.f32.bin index 13baee15f7290d6fdfecf013fed3e71b52befb30..2a44d74577bec42cff67d3c5674b384936944eab 100644 --- a/layers/encoder_5_attn_w_v.scale_values.f32.bin +++ b/layers/encoder_5_attn_w_v.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:03788514329cad1f28970b717a4d43ef4a85e0278ed0dd885fe9d756ecfffb88 -size 2560 +oid sha256:f76061e291a207776605c5ad3c7d62fe4d33568ecc9033af6c0b627e411b3c11 +size 4 diff --git a/layers/encoder_5_mlp_w_in.bias.f32.bin b/layers/encoder_5_mlp_w_in.bias.f32.bin index cb1a6b4d70cad740c3766d7edda48722ef3a92de..31b38c4cf5cb94634720199810e01f2a45fc6849 100644 --- a/layers/encoder_5_mlp_w_in.bias.f32.bin +++ b/layers/encoder_5_mlp_w_in.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:191a36a424ec4dee9cbafac1f3fd69e4123c65e4bed4688de86a7c9b1a0406ef +oid sha256:84867af91e82c506906ddb71b0a230680dd925d90773bb297b7fd5b0b7713542 size 16384 diff --git a/layers/encoder_5_mlp_w_in.layout_header.i32.bin b/layers/encoder_5_mlp_w_in.layout_header.i32.bin index dfb09b60c1a463239bdde81ecc9589c186db51be..4f36c34f219a96fe3e8ec8c03b70d02426e7e7cb 100644 --- a/layers/encoder_5_mlp_w_in.layout_header.i32.bin +++ b/layers/encoder_5_mlp_w_in.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f +oid sha256:257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee size 52 diff --git a/layers/encoder_5_mlp_w_in.packed_weight.u8.bin b/layers/encoder_5_mlp_w_in.packed_weight.u8.bin index 74cc8521b334ed99d8cf2e74c0c2fe380c2f0422..b8c7d948dfdb1eca98787185b824be07d2910d47 100644 --- a/layers/encoder_5_mlp_w_in.packed_weight.u8.bin +++ b/layers/encoder_5_mlp_w_in.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0b00064f3d22bdd64802c393149373738a78e7c5a24ac297fcee3b165acda3e8 +oid sha256:93f7b29f255947dd72d7a5ad15b60f2c68c4b3e148b922f4794bcf96bf7aef87 size 655360 diff --git a/layers/encoder_5_mlp_w_in.scale_values.f32.bin b/layers/encoder_5_mlp_w_in.scale_values.f32.bin index d08647056d4db60ee1c97512a0b9e33ba58f4fb6..11fc70f486ba838449022e432eb6512876ed62c8 100644 --- a/layers/encoder_5_mlp_w_in.scale_values.f32.bin +++ b/layers/encoder_5_mlp_w_in.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7452e6a08f8d28e1a2f4f84ea908a32bf76fb480751d5ece73faa33490950cd3 -size 16384 +oid sha256:07471f0e22ba2cd8c2c7b735c203d91c874fc834b4209788a236fc9529247943 +size 4 diff --git a/layers/encoder_5_mlp_w_out.bias.f32.bin b/layers/encoder_5_mlp_w_out.bias.f32.bin index 2c7051f0d3fcecbd95b0a4f355b544ccd11641bb..15e444acd5d5c5778f3a1400a024662f3cd1ebde 100644 --- a/layers/encoder_5_mlp_w_out.bias.f32.bin +++ b/layers/encoder_5_mlp_w_out.bias.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cb7da7b400d0281d2afa3b758997e2af9ef546bcaeedb7d7adbdbf012699d243 +oid sha256:d1ccf0c6e752d23d27842dde01b4bc430190dab45e3bfa8dd8417dfe4c13cb15 size 2560 diff --git a/layers/encoder_5_mlp_w_out.layout_header.i32.bin b/layers/encoder_5_mlp_w_out.layout_header.i32.bin index 0e75d07047a66b2c5fdc1a4889b0f4b64984a9e0..bb2fc38f00bb69d3211700402632c7467e412926 100644 --- a/layers/encoder_5_mlp_w_out.layout_header.i32.bin +++ b/layers/encoder_5_mlp_w_out.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311 +oid sha256:d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64 size 52 diff --git a/layers/encoder_5_mlp_w_out.packed_weight.u8.bin b/layers/encoder_5_mlp_w_out.packed_weight.u8.bin index e814433f45f1481c805075d61762221d6755ae5e..19ed6f7000c2a203819a43b518bbf4ac91c3da6b 100644 --- a/layers/encoder_5_mlp_w_out.packed_weight.u8.bin +++ b/layers/encoder_5_mlp_w_out.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:62ba8a94c88e14d9cfdafd791553656c8391223f1adfdeff3d7c6d73aa461d57 +oid sha256:5c8cf16a336ac7618477e7a52f8eb8b12d5bbd7004f961745f08abfb3f36039d size 327680 diff --git a/layers/encoder_5_mlp_w_out.scale_values.f32.bin b/layers/encoder_5_mlp_w_out.scale_values.f32.bin index ae945f896476c75bbe179064503cb0cc7a49575f..19b9b7a341a8f59419a3b10d69e9672da97e2386 100644 --- a/layers/encoder_5_mlp_w_out.scale_values.f32.bin +++ b/layers/encoder_5_mlp_w_out.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bdd75db75a35624ce71b7c3a0f77e2d2e7123f619afa3f2e3f5247f72bb9e9a2 -size 2560 +oid sha256:4587070b10b62cb7687541b3e9946824e292b8f024c39b9d388202d61a5244b4 +size 4 diff --git a/layers/lm_head.layout_header.i32.bin b/layers/lm_head.layout_header.i32.bin index 73be774e6577bc924fbb984a60c069ac3caf2081..bb2db38d06881bf318279c4ce2d32d979c4fc207 100644 --- a/layers/lm_head.layout_header.i32.bin +++ b/layers/lm_head.layout_header.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6dbbe0f59e755d0a0ffc98bab96786a9a069a30db90c05011423767b48beca7a +oid sha256:1fdaf7af8cb18524a77d5a37d5265646c10d5d352a2eb3fc83b596fa4fb3a2c5 size 52 diff --git a/layers/lm_head.packed_weight.u8.bin b/layers/lm_head.packed_weight.u8.bin index 489063cdb017df0d4d8550e7d9e5eeaa185e4bfe..a5966cc8d7458cbda0e92bb841c58776ee3a96b5 100644 --- a/layers/lm_head.packed_weight.u8.bin +++ b/layers/lm_head.packed_weight.u8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2dda08a6b9c24d9bb30cd0e09147bd5720f6cdd8633b022afaa8a9b1c2946bb4 -size 1318400 +oid sha256:411e858d2476c7d4e8bce21dfdc58a7e4936a9fca18d822cd4f5cf2e2e8386f0 +size 1313280 diff --git a/layers/lm_head.scale_values.f32.bin b/layers/lm_head.scale_values.f32.bin index b3443a08891a1da67e3da9414a535cf0bc9d5ad2..0418e7c8159578c4cc934e38fe0f994b5ef9dfde 100644 --- a/layers/lm_head.scale_values.f32.bin +++ b/layers/lm_head.scale_values.f32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:26b1d8c807dad42bfd8cc1c0b084cb3292b232e0882285c72043c118a9368bca -size 32916 +oid sha256:f82895d1075ca96401b23568c539ac8944e0264adf62d8567dce2611e02587df +size 4 diff --git a/layers/lm_head.segment_offsets.i32.bin b/layers/lm_head.segment_offsets.i32.bin index ca7ae0ded31bc7ecd8535cf9c6c046db2589ae68..1e153c0fa1c6fbe15b018889f65bd6b8050dfd24 100644 --- a/layers/lm_head.segment_offsets.i32.bin +++ b/layers/lm_head.segment_offsets.i32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6a39e27878282be9d58d21a86fb95117d07c03a87a9919d24a86cbabe1597463 +oid sha256:77df73d01a55e70e6fe3ae9d1e3e1608045918c29f804021326ebd3337636ed0 size 8 diff --git a/manifest.json b/manifest.json index bb98f8bc699bfca87fa5b3dfac051b7f4f05cf31..0943cc922ce0846678c4428bf80104edfc2a6a1e 100644 --- a/manifest.json +++ b/manifest.json @@ -1,14 +1,152 @@ { + "agentkernel_lite": { + "chat_contract": { + "code_execution": false, + "extensions_may_be_suggested": true, + "primary_action": "respond", + "structured_decision": true + }, + "model_family": "agentkernel_lite_encdec_v1", + "parameter_count": 113507328, + "source_bundle_manifest_path": "/data/agentkernel/artifacts/agentkernel_lite_encdec/recommendation_answer_v11_exact_twopass_from_v9_train_00200_lr2e6/agentkernel_lite_encdec_manifest.json", + "source_model_dir": "/data/agentkernel/artifacts/agentkernel_lite_encdec/recommendation_answer_v11_exact_twopass_from_v9_train_00200_lr2e6/model", + "source_tokenizer_dir": "/data/agentkernel/artifacts/agentkernel_lite_encdec/recommendation_answer_v11_exact_twopass_from_v9_train_00200_lr2e6/tokenizer" + }, + "compression": { + "dense_dtype": "float32", + "dense_float32_include": [], + "quant_exclude": [], + "quant_include": [], + "quantization": { + "activation_quant": "none", + "modules": [ + "encoder.0.attn.w_q", + "encoder.0.attn.w_k", + "encoder.0.attn.w_v", + "encoder.0.attn.w_o", + "encoder.0.mlp.w_in", + "encoder.0.mlp.w_out", + "encoder.1.attn.w_q", + "encoder.1.attn.w_k", + "encoder.1.attn.w_v", + "encoder.1.attn.w_o", + "encoder.1.mlp.w_in", + "encoder.1.mlp.w_out", + "encoder.2.attn.w_q", + "encoder.2.attn.w_k", + "encoder.2.attn.w_v", + "encoder.2.attn.w_o", + "encoder.2.mlp.w_in", + "encoder.2.mlp.w_out", + "encoder.3.attn.w_q", + "encoder.3.attn.w_k", + "encoder.3.attn.w_v", + "encoder.3.attn.w_o", + "encoder.3.mlp.w_in", + "encoder.3.mlp.w_out", + "encoder.4.attn.w_q", + "encoder.4.attn.w_k", + "encoder.4.attn.w_v", + "encoder.4.attn.w_o", + "encoder.4.mlp.w_in", + "encoder.4.mlp.w_out", + "encoder.5.attn.w_q", + "encoder.5.attn.w_k", + "encoder.5.attn.w_v", + "encoder.5.attn.w_o", + "encoder.5.mlp.w_in", + "encoder.5.mlp.w_out", + "decoder.0.self_attn_block.mlp.w_in", + "decoder.0.self_attn_block.mlp.w_out", + "decoder.0.self_attn_block.attn.w_q", + "decoder.0.self_attn_block.attn.w_k", + "decoder.0.self_attn_block.attn.w_v", + "decoder.0.self_attn_block.attn.w_o", + "decoder.0.cross_block.cross.w_q", + "decoder.0.cross_block.cross.w_k", + "decoder.0.cross_block.cross.w_v", + "decoder.0.cross_block.cross.w_o", + "decoder.0.cross_block.mlp.w_in", + "decoder.0.cross_block.mlp.w_out", + "decoder.1.self_attn_block.mlp.w_in", + "decoder.1.self_attn_block.mlp.w_out", + "decoder.1.self_attn_block.attn.w_q", + "decoder.1.self_attn_block.attn.w_k", + "decoder.1.self_attn_block.attn.w_v", + "decoder.1.self_attn_block.attn.w_o", + "decoder.1.cross_block.cross.w_q", + "decoder.1.cross_block.cross.w_k", + "decoder.1.cross_block.cross.w_v", + "decoder.1.cross_block.cross.w_o", + "decoder.1.cross_block.mlp.w_in", + "decoder.1.cross_block.mlp.w_out", + "decoder.2.self_attn_block.mlp.w_in", + "decoder.2.self_attn_block.mlp.w_out", + "decoder.2.self_attn_block.attn.w_q", + "decoder.2.self_attn_block.attn.w_k", + "decoder.2.self_attn_block.attn.w_v", + "decoder.2.self_attn_block.attn.w_o", + "decoder.2.cross_block.cross.w_q", + "decoder.2.cross_block.cross.w_k", + "decoder.2.cross_block.cross.w_v", + "decoder.2.cross_block.cross.w_o", + "decoder.2.cross_block.mlp.w_in", + "decoder.2.cross_block.mlp.w_out", + "decoder.3.self_attn_block.mlp.w_in", + "decoder.3.self_attn_block.mlp.w_out", + "decoder.3.self_attn_block.attn.w_q", + "decoder.3.self_attn_block.attn.w_k", + "decoder.3.self_attn_block.attn.w_v", + "decoder.3.self_attn_block.attn.w_o", + "decoder.3.cross_block.cross.w_q", + "decoder.3.cross_block.cross.w_k", + "decoder.3.cross_block.cross.w_v", + "decoder.3.cross_block.cross.w_o", + "decoder.3.cross_block.mlp.w_in", + "decoder.3.cross_block.mlp.w_out", + "decoder.4.self_attn_block.mlp.w_in", + "decoder.4.self_attn_block.mlp.w_out", + "decoder.4.self_attn_block.attn.w_q", + "decoder.4.self_attn_block.attn.w_k", + "decoder.4.self_attn_block.attn.w_v", + "decoder.4.self_attn_block.attn.w_o", + "decoder.4.cross_block.cross.w_q", + "decoder.4.cross_block.cross.w_k", + "decoder.4.cross_block.cross.w_v", + "decoder.4.cross_block.cross.w_o", + "decoder.4.cross_block.mlp.w_in", + "decoder.4.cross_block.mlp.w_out", + "decoder.5.self_attn_block.mlp.w_in", + "decoder.5.self_attn_block.mlp.w_out", + "decoder.5.self_attn_block.attn.w_q", + "decoder.5.self_attn_block.attn.w_k", + "decoder.5.self_attn_block.attn.w_v", + "decoder.5.self_attn_block.attn.w_o", + "decoder.5.cross_block.cross.w_q", + "decoder.5.cross_block.cross.w_k", + "decoder.5.cross_block.cross.w_v", + "decoder.5.cross_block.cross.w_o", + "decoder.5.cross_block.mlp.w_in", + "decoder.5.cross_block.mlp.w_out", + "lm_head" + ], + "num": 109, + "scheme": "bitnet", + "spin": false, + "weight_opt": "none" + }, + "quantize_bitnet": true + }, "dense_dtype": "float32", "dense_float32_patterns": [], "dense_tensors": { "dec_embed.weight": { - "bytes": 21066240, + "bytes": 21009920, "dtype": "float32", "path": "dense/dec_embed_weight.f32.bin", - "sha256": "d0b2d9d06dc96048cff8f30867bc4c520bcb7586df46a0325c95b6a93a84aeeb", + "sha256": "78c2a80005b8926af3752edc2ab4c56399688951a282a6b85bf9edbf917fe6df", "shape": [ - 8229, + 8207, 640 ] }, @@ -16,7 +154,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/dec_norm_bias.f32.bin", - "sha256": "bc56aaf3ca92b1288564ce350a4714e94a6021ab1a54402de1644d717312a755", + "sha256": "5b5e96cac42589a663a9f5682082013889507d15b2134376aa286c1c002b7fcf", "shape": [ 640 ] @@ -25,7 +163,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/dec_norm_weight.f32.bin", - "sha256": "9db5943f63cd2d6154e730c9fed0f644a1bbf7c7ed77add76e90b84c1aa4ef3b", + "sha256": "f3007750a249fff13b6d5325bdec87cf3e823d773e9b4ddd8661358e1c88bc4a", "shape": [ 640 ] @@ -34,7 +172,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_0_cross_block_n1_weight.f32.bin", - "sha256": "891fb6b04974c8b901b28c09ae7ea6e5e0cdc726a71f6d17b07f1a375d4426da", + "sha256": "9e321bd4b5815ad26ae4a2c222d73c2bd84b44c67aa3ba4a3e7425389c6eb783", "shape": [ 640 ] @@ -43,36 +181,16 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_0_cross_block_n2_weight.f32.bin", - "sha256": "1a719c7ed5cf7db904f9077ad94985d06a65e2d38a64340465579147ffbac8c5", + "sha256": "e44330e6d5b15cb95b080f739e6fe708f9915ebfc33cab76c01c6c4c2bb4e51e", "shape": [ 640 ] }, - "decoder.0.self_attn_block.attn._rope_cos": { - "bytes": 131072, - "dtype": "float32", - "path": "dense/decoder_0_self_attn_block_attn__rope_cos.f32.bin", - "sha256": "6ad88ae23144aafc9b0fb5dbe306afcfdccb11fcf4909a512eb46125ce9f0d5b", - "shape": [ - 512, - 64 - ] - }, - "decoder.0.self_attn_block.attn._rope_sin": { - "bytes": 131072, - "dtype": "float32", - "path": "dense/decoder_0_self_attn_block_attn__rope_sin.f32.bin", - "sha256": "b7e60ef23d3ccabcb925a970b51fbeaed34dbd48374a45476f3212d61fc7407f", - "shape": [ - 512, - 64 - ] - }, "decoder.0.self_attn_block.n1.weight": { "bytes": 2560, "dtype": "float32", "path": "dense/decoder_0_self_attn_block_n1_weight.f32.bin", - "sha256": "3ecfb7e994fc3be415d9ca72f228f0a6fe1bac9ed350e75ae883ac75d4c5a431", + "sha256": "aa1687c4e058f3c05d691ed6f33ca18be4ec4ca67ddfe2806b29bc4926a06d87", "shape": [ 640 ] @@ -81,7 +199,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_0_self_attn_block_n2_weight.f32.bin", - "sha256": "33d786b3efc9c3443b12cd66a09c63bd595e18ec0c9eb07fae38297f7005bf84", + "sha256": "aaf84ca53571564ef264cd69f05f68a5feae20d67c51111440aa38971a927f0a", "shape": [ 640 ] @@ -90,7 +208,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_1_cross_block_n1_weight.f32.bin", - "sha256": "cbd55183838a8ab6e77bb181eeb8cf43c54e6fdec064a948915193df754f7cf9", + "sha256": "3ea07312d131aecfcf9aeca759f7da272db7f8669faaea13adaa03af9e74cdf7", "shape": [ 640 ] @@ -99,36 +217,16 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_1_cross_block_n2_weight.f32.bin", - "sha256": "5e01f19710f000878795ab523b271d8b34893f6c377f610bdd0eba9f18574a70", + "sha256": "a2d7b097f261522851525b00d4df45ee76aba6fd6d1c467bc592e7c75f7d0e21", "shape": [ 640 ] }, - "decoder.1.self_attn_block.attn._rope_cos": { - "bytes": 131072, - "dtype": "float32", - "path": "dense/decoder_1_self_attn_block_attn__rope_cos.f32.bin", - "sha256": "6ad88ae23144aafc9b0fb5dbe306afcfdccb11fcf4909a512eb46125ce9f0d5b", - "shape": [ - 512, - 64 - ] - }, - "decoder.1.self_attn_block.attn._rope_sin": { - "bytes": 131072, - "dtype": "float32", - "path": "dense/decoder_1_self_attn_block_attn__rope_sin.f32.bin", - "sha256": "b7e60ef23d3ccabcb925a970b51fbeaed34dbd48374a45476f3212d61fc7407f", - "shape": [ - 512, - 64 - ] - }, "decoder.1.self_attn_block.n1.weight": { "bytes": 2560, "dtype": "float32", "path": "dense/decoder_1_self_attn_block_n1_weight.f32.bin", - "sha256": "3ce6ed00aee268de7d08e6e9acdecb2ce494e53740f49b397653063f65708af9", + "sha256": "6e04d7ae884588db5de7ef2072346f6e8b2066b26ed9f5847645221ed9539942", "shape": [ 640 ] @@ -137,7 +235,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_1_self_attn_block_n2_weight.f32.bin", - "sha256": "3aff504c8c158ad32e0d53fcde49f9c3d9d2c6d8c6ffac4793913ab8e9fc351f", + "sha256": "c0b1278f7154bf8b2234bdd368fbce9e7bd74601a1c793f56fa4f3586a7f7b73", "shape": [ 640 ] @@ -146,7 +244,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_2_cross_block_n1_weight.f32.bin", - "sha256": "074691158ffb33267b6d1515d51dfccffd776d308d77ca10cd42f5c9e11d16b3", + "sha256": "28376ace409fa2952ac2990043be9b9c983aea3195e64ca73a2c6ba4a7679303", "shape": [ 640 ] @@ -155,36 +253,16 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_2_cross_block_n2_weight.f32.bin", - "sha256": "252019fc3c4e0a4b6e8d3b4a6612fa119688c8dda754f204055cd8276a1136ac", + "sha256": "1feefaae8826e4c2ad02d385f9b805519b96a7db7fe49052f1f8a8c693309339", "shape": [ 640 ] }, - "decoder.2.self_attn_block.attn._rope_cos": { - "bytes": 131072, - "dtype": "float32", - "path": "dense/decoder_2_self_attn_block_attn__rope_cos.f32.bin", - "sha256": "6ad88ae23144aafc9b0fb5dbe306afcfdccb11fcf4909a512eb46125ce9f0d5b", - "shape": [ - 512, - 64 - ] - }, - "decoder.2.self_attn_block.attn._rope_sin": { - "bytes": 131072, - "dtype": "float32", - "path": "dense/decoder_2_self_attn_block_attn__rope_sin.f32.bin", - "sha256": "b7e60ef23d3ccabcb925a970b51fbeaed34dbd48374a45476f3212d61fc7407f", - "shape": [ - 512, - 64 - ] - }, "decoder.2.self_attn_block.n1.weight": { "bytes": 2560, "dtype": "float32", "path": "dense/decoder_2_self_attn_block_n1_weight.f32.bin", - "sha256": "142d7795a7359da525adde3aa5342706ad7fddf0f79e984b0d6f95a3fb7074ec", + "sha256": "3731b30effc4197d021d7ed55349454c585246d030d74d9299b07aafa7b367d6", "shape": [ 640 ] @@ -193,7 +271,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_2_self_attn_block_n2_weight.f32.bin", - "sha256": "b5c5cb7840e3107062925817a43bd242b3fe2fd4a7786cc1a9460d9312c1b6eb", + "sha256": "632df68307a27cfc2054c13a9b511180dce6e735c8c79dc6a420e984ffcc385c", "shape": [ 640 ] @@ -202,7 +280,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_3_cross_block_n1_weight.f32.bin", - "sha256": "15ae5917f2aa04cc28786948c54d7375493275ebabe9e5ffc2d6b53825b7776f", + "sha256": "9e8c667419c8df40c09c7e194573444198f3e0f8d057e61e301b293928695560", "shape": [ 640 ] @@ -211,36 +289,16 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_3_cross_block_n2_weight.f32.bin", - "sha256": "caccd589d5a01abd27c8661e131ee691f8b6559a4330aeee886cb0492a73aeb3", + "sha256": "770f911b6ec49b1da40240580ffac220c6308585bb36d1151a6623a5d46ef740", "shape": [ 640 ] }, - "decoder.3.self_attn_block.attn._rope_cos": { - "bytes": 131072, - "dtype": "float32", - "path": "dense/decoder_3_self_attn_block_attn__rope_cos.f32.bin", - "sha256": "6ad88ae23144aafc9b0fb5dbe306afcfdccb11fcf4909a512eb46125ce9f0d5b", - "shape": [ - 512, - 64 - ] - }, - "decoder.3.self_attn_block.attn._rope_sin": { - "bytes": 131072, - "dtype": "float32", - "path": "dense/decoder_3_self_attn_block_attn__rope_sin.f32.bin", - "sha256": "b7e60ef23d3ccabcb925a970b51fbeaed34dbd48374a45476f3212d61fc7407f", - "shape": [ - 512, - 64 - ] - }, "decoder.3.self_attn_block.n1.weight": { "bytes": 2560, "dtype": "float32", "path": "dense/decoder_3_self_attn_block_n1_weight.f32.bin", - "sha256": "0ee7056ae2fdd0937969db21841862681e470303fa423918e28d426c6ea032dc", + "sha256": "083fed8849ddd08ad81f0dd422aadfb0570d1f11079073bf2f85121fcdd57274", "shape": [ 640 ] @@ -249,7 +307,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_3_self_attn_block_n2_weight.f32.bin", - "sha256": "a560a1dede092c8a7dde8fa9b96baa535ef09c717dfbd8943a0d15b326d9f9d5", + "sha256": "115676e9f45a24b93168c64e085aedcadfa8fe199d1a2b06b9ca67ba3615385c", "shape": [ 640 ] @@ -258,7 +316,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_4_cross_block_n1_weight.f32.bin", - "sha256": "c043209537341e6dc5f41dcf6a351fb4265565500d454fe64c667ac7b06c7e33", + "sha256": "b15ddc920e96f925d4bb97e943a92a38605ffd1e1f5a74373654daef985e377d", "shape": [ 640 ] @@ -267,36 +325,16 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_4_cross_block_n2_weight.f32.bin", - "sha256": "598e5457b0d29193b07509b15b611a39769cdd37c70e35c9ef33339988c1541c", + "sha256": "23021c9331a4ec203014d4d33f2a846ad81702b6da07a3fdcaab2ef30a4d73f6", "shape": [ 640 ] }, - "decoder.4.self_attn_block.attn._rope_cos": { - "bytes": 131072, - "dtype": "float32", - "path": "dense/decoder_4_self_attn_block_attn__rope_cos.f32.bin", - "sha256": "6ad88ae23144aafc9b0fb5dbe306afcfdccb11fcf4909a512eb46125ce9f0d5b", - "shape": [ - 512, - 64 - ] - }, - "decoder.4.self_attn_block.attn._rope_sin": { - "bytes": 131072, - "dtype": "float32", - "path": "dense/decoder_4_self_attn_block_attn__rope_sin.f32.bin", - "sha256": "b7e60ef23d3ccabcb925a970b51fbeaed34dbd48374a45476f3212d61fc7407f", - "shape": [ - 512, - 64 - ] - }, "decoder.4.self_attn_block.n1.weight": { "bytes": 2560, "dtype": "float32", "path": "dense/decoder_4_self_attn_block_n1_weight.f32.bin", - "sha256": "77f69a1f0ab7f6664172e335f1bacbede678a34d59234098b531a41f08eda87a", + "sha256": "f3ae1bf89ed7cdb798ec9b786ff358f126b58fb7fb6fa2b93d217a243318aeee", "shape": [ 640 ] @@ -305,7 +343,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_4_self_attn_block_n2_weight.f32.bin", - "sha256": "2c4fcbc99f4fcf2182c7ed689ef906b7135326b75644ba9155239e6ca65c1591", + "sha256": "7161e760f5e51f0e019f3ddf6285c1d31819100682234328ad54c9f3fb26768c", "shape": [ 640 ] @@ -314,7 +352,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_5_cross_block_n1_weight.f32.bin", - "sha256": "744b9f0653545a86ed4b7f963023c78c74637332d473b374e61fa19d72795ca7", + "sha256": "b49407ae4ad043d9c524839c8e197cfaed22ac0f9755458fc8dfb5f9501f62e5", "shape": [ 640 ] @@ -323,36 +361,16 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_5_cross_block_n2_weight.f32.bin", - "sha256": "41b98dd7de3c29b4b66996542d2b1f835d8729bcd09ae96689de78daa16c2041", + "sha256": "d7c9bf8b3e50171e0aa8882bc82629636d6afaa7ce2b36f3612a9a79e40a5840", "shape": [ 640 ] }, - "decoder.5.self_attn_block.attn._rope_cos": { - "bytes": 131072, - "dtype": "float32", - "path": "dense/decoder_5_self_attn_block_attn__rope_cos.f32.bin", - "sha256": "6ad88ae23144aafc9b0fb5dbe306afcfdccb11fcf4909a512eb46125ce9f0d5b", - "shape": [ - 512, - 64 - ] - }, - "decoder.5.self_attn_block.attn._rope_sin": { - "bytes": 131072, - "dtype": "float32", - "path": "dense/decoder_5_self_attn_block_attn__rope_sin.f32.bin", - "sha256": "b7e60ef23d3ccabcb925a970b51fbeaed34dbd48374a45476f3212d61fc7407f", - "shape": [ - 512, - 64 - ] - }, "decoder.5.self_attn_block.n1.weight": { "bytes": 2560, "dtype": "float32", "path": "dense/decoder_5_self_attn_block_n1_weight.f32.bin", - "sha256": "1fa85cc37348e322bb9b80bd0c8775dabc0e8ca898919c86bc3092effd31b7d1", + "sha256": "5ab4801dfa1f732a06dd0d14acfa620dbcec11568fdf8c5e333b0deb154f1a51", "shape": [ 640 ] @@ -361,18 +379,18 @@ "bytes": 2560, "dtype": "float32", "path": "dense/decoder_5_self_attn_block_n2_weight.f32.bin", - "sha256": "2277d03a4376433872684796edfa38c6636a096944d5d8c9031b2f13bdcec68f", + "sha256": "c5666fab5237df5532e10c7c08ecd276dce4be357b11819655deea19d3d6b0e9", "shape": [ 640 ] }, "enc_embed.weight": { - "bytes": 21066240, + "bytes": 21009920, "dtype": "float32", "path": "dense/enc_embed_weight.f32.bin", - "sha256": "d0b2d9d06dc96048cff8f30867bc4c520bcb7586df46a0325c95b6a93a84aeeb", + "sha256": "78c2a80005b8926af3752edc2ab4c56399688951a282a6b85bf9edbf917fe6df", "shape": [ - 8229, + 8207, 640 ] }, @@ -380,7 +398,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/enc_norm_bias.f32.bin", - "sha256": "0f7a17d8d5a7e35c03338862b11b135d1a0816358f766706d2f83179d4bafc40", + "sha256": "73c7b6e76072acad2244afc73657d29377fd189a8af9bc41daa14aabb346606a", "shape": [ 640 ] @@ -389,8 +407,18 @@ "bytes": 2560, "dtype": "float32", "path": "dense/enc_norm_weight.f32.bin", - "sha256": "323e132c6135d519e191f4e98eaef83861db8531b4971f7dbc32686258e791c0", + "sha256": "fbce78fa3910cca15c0bec29f929009612f7f5b94d1d083771ed0b114bb2a337", + "shape": [ + 640 + ] + }, + "enc_pos_embed.weight": { + "bytes": 10485760, + "dtype": "float32", + "path": "dense/enc_pos_embed_weight.f32.bin", + "sha256": "41e06124cce8055432e8e6a7a9a9a2a6e39ac672071f23dea5872bd19c51e4d9", "shape": [ + 4096, 640 ] }, @@ -398,7 +426,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/encoder_0_n1_weight.f32.bin", - "sha256": "a2fca0cec706dcc674c02b5ecb68458f347cc18cbe0b5783ba08764863ca1211", + "sha256": "146bdd3c5419ea957cba0919904c3fa3a18345399e1190e38b1697c5bc56a18e", "shape": [ 640 ] @@ -407,7 +435,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/encoder_0_n2_weight.f32.bin", - "sha256": "e5592bab55e8eae12dbc21470a64a4f145450f19bd28292ec789863278e122e8", + "sha256": "2817160dc2b42d5f8de29fb566ed4165dff109f084f8a5af1766e544a7fea509", "shape": [ 640 ] @@ -416,7 +444,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/encoder_1_n1_weight.f32.bin", - "sha256": "9efa97efc788129bea077cbe83a7d35ce84e7d90a5cdbfd87f490fbf9bd26b3d", + "sha256": "4b3b5cbb90b337e7c217bfe73872429a99ef7aaeda0743a01e7c78b496abce08", "shape": [ 640 ] @@ -425,7 +453,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/encoder_1_n2_weight.f32.bin", - "sha256": "80da1c04bd2f7b3f1784986cfdd88a86f4a820b2e0c6ebd1b6b1ac4b7bb59645", + "sha256": "2030393e0c8cc4554a10187e03f03e541a380227d3b64c3f6455aa23d8295be6", "shape": [ 640 ] @@ -434,7 +462,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/encoder_2_n1_weight.f32.bin", - "sha256": "73b9240c3a6ceb6a628d5b63cb7cee6f5f4f0e1506d3e59ce8422692f9afe87b", + "sha256": "203d16e2f34a9fb6059e24d8bde0b3d2e85e8edbeaecb2eac7c647b9c81f1dde", "shape": [ 640 ] @@ -443,7 +471,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/encoder_2_n2_weight.f32.bin", - "sha256": "d4af0825ded821252546f8d1c587f59d9108b6ad5b3fec91f49de34dbf827133", + "sha256": "a223438f7de8e65465b9c95605748e0152bc1b92d77b72d3af2a41d9ff108927", "shape": [ 640 ] @@ -452,7 +480,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/encoder_3_n1_weight.f32.bin", - "sha256": "f7c7eafb79d56604c3b69489b6b4a0147df80e7a2b615f86be7b16b985c6a5de", + "sha256": "6f97f7dc429e26a0e2950787e5ec7c9fa3c3ab9b8ddd0fc1279c19908fdb9868", "shape": [ 640 ] @@ -461,7 +489,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/encoder_3_n2_weight.f32.bin", - "sha256": "5f69753e55446c6c2229018625ad180851a84470fbdb5c89e34f3c4424b17906", + "sha256": "9754f40fc928fdca4359684c41888d1b3d6af817936af59b161f3824b32534ff", "shape": [ 640 ] @@ -470,7 +498,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/encoder_4_n1_weight.f32.bin", - "sha256": "fee47b193f6ed6749017d6c8c2a74cc469e9011e30ca33e2b0e73359eda018dc", + "sha256": "2195f562646510d2e377c5d219dc1341d32001ed30b4d54cf754462cbcd175a1", "shape": [ 640 ] @@ -479,7 +507,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/encoder_4_n2_weight.f32.bin", - "sha256": "14fd5b086cde7b81dc01556e455e1ea895d13ab062471b558dbea32b2d842b13", + "sha256": "75fda5bbfe2285970162c18ebf565ebe3e4032b2751b4bac289409a0ed8cb12b", "shape": [ 640 ] @@ -488,7 +516,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/encoder_5_n1_weight.f32.bin", - "sha256": "8ccefbf5d0804e7ed9f0a693b26826dc330a5d0985d521b32c8b0ad8df02c149", + "sha256": "eb288cd1ccb8e5b7d5da5e6fa88afd881471b0bbbd355e14adbc3b885385e71f", "shape": [ 640 ] @@ -497,7 +525,7 @@ "bytes": 2560, "dtype": "float32", "path": "dense/encoder_5_n2_weight.f32.bin", - "sha256": "3445fe77c401b32595a7fd403f3cf3445041b9333e71307d1efc5f902736a040", + "sha256": "75218ab909794e1396d0a651023851988cfea12c5085c9230b883188d3a66ae1", "shape": [ 640 ] @@ -514,6 +542,7 @@ "decoder": "dec_embed.weight", "encoder": "enc_embed.weight" }, + "encoder_position_embeddings": true, "final_norms": { "decoder": { "bias": "dec_norm.bias", @@ -1402,15 +1431,20 @@ "n_heads": 10, "n_layers": 6, "norm": "layer", + "position_embeddings": { + "encoder": "enc_pos_embed.weight" + }, "rms_norm_eps": 1e-06, "supports": { + "agent_policy_heads": false, "batch_size": 1, "cross_attention": true, "decode": true, "encode": true, - "kv_cache": false + "kv_cache": false, + "retrieval_embeddings": false }, - "vocab_size": 8229 + "vocab_size": 8207 }, "layers": [ { @@ -1428,8 +1462,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -1449,7 +1483,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_0_attn_w_q.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -1458,19 +1492,19 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_0_attn_w_q.packed_weight.u8.bin", - "sha256": "d7ab06bc015f2be6319e3507d9bc4fc481ee92c5cc2c7c27c42f2fddfdd33497", + "sha256": "951c976f47b39ba620a2703f97b02ed8e753ccd8bb95a9c61ed0911139dd9009", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_0_attn_w_q.scale_values.f32.bin", - "sha256": "dff7f19bccf1d55789a281957b398f254a65589e6cb304eb7281f66da102a1ec", + "sha256": "58f656d894a6673181860f8ec88093f0a6254b00ce39b1cb1e108f1615e638ab", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -1499,8 +1533,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -1520,7 +1554,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_0_attn_w_k.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -1529,19 +1563,19 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_0_attn_w_k.packed_weight.u8.bin", - "sha256": "d52f992b0910b497849db037dcd3b211399dde003b3d5dc1c4243030aba97bcf", + "sha256": "0d358351e42a919e6f41efc8d3d8220d202c7a2592a36b18b1e4039c0312c49d", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_0_attn_w_k.scale_values.f32.bin", - "sha256": "cb8a7e3e25b769081f540e81ace05f88ab7e7bdfe6369c062c4287b4dec83362", + "sha256": "363a2535ff463d2406751ad619b676aaf8f5043f972b10829d70e5c5370541e4", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -1570,8 +1604,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -1591,7 +1625,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_0_attn_w_v.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -1600,19 +1634,19 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_0_attn_w_v.packed_weight.u8.bin", - "sha256": "108581897257e33bb4fbc1e55704ca7764944271553d0ddfcc722a18a112521d", + "sha256": "5f2fd0f6297addda94dfd003cc2902fbce3b926e9d3ccb9fbf56f118ba987bc8", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_0_attn_w_v.scale_values.f32.bin", - "sha256": "c7271620555a6f171073cc1282d421ce99c44ac9320608a8eb146546ddc0fa4d", + "sha256": "834cb863484c883b449cc141b0d11a1441c8d5d4c6c00b76092e54b1b9726ffd", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -1641,8 +1675,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -1662,7 +1696,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_0_attn_w_o.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -1671,19 +1705,19 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_0_attn_w_o.packed_weight.u8.bin", - "sha256": "150c446d048f21dc70c7bf8257c066c366b16c66fbdb6e2e1a1696a7f825f07d", + "sha256": "83c19e24982850a0703bc51352e8d2dcf2d9c58cac17c3fb58815327b0117251", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_0_attn_w_o.scale_values.f32.bin", - "sha256": "c4ca4bd42c680d34759243aa28d4287d7b9ea25b33cd612cffcf186773e64fe7", + "sha256": "92e6c93ca7bf5dfca57fdc636156023c476dba44daa150855c770b191b2812d0", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -1712,8 +1746,8 @@ 640, 4096, 640, - 2, - 1, + 0, + 4096, 1, 80, 1, @@ -1733,7 +1767,7 @@ "bytes": 16384, "dtype": "float32", "path": "encoder_0_mlp_w_in.bias.f32.bin", - "sha256": "0c76a21f7135f7f72f7c900a5774522e72fe8ab934d5ab5fccf1dfc79eca530a", + "sha256": "3a2cab48442eaf53044fbe153c8e3688fdd3ec3c035f8edeeaf67d3bcddaf4ff", "shape": [ 4096 ] @@ -1742,7 +1776,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_0_mlp_w_in.layout_header.i32.bin", - "sha256": "b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f", + "sha256": "257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee", "shape": [ 13 ] @@ -1751,19 +1785,19 @@ "bytes": 655360, "dtype": "uint8", "path": "encoder_0_mlp_w_in.packed_weight.u8.bin", - "sha256": "004d7e5054f2c9e259a2c13919c8df7f5b111c7ee22acca01a704acdd021471c", + "sha256": "8084c90cad779fcfbf3a68dd3d751dab75a495d6798f8d125b67ee076582c72a", "shape": [ 4096, 160 ] }, "scale_values": { - "bytes": 16384, + "bytes": 4, "dtype": "float32", "path": "encoder_0_mlp_w_in.scale_values.f32.bin", - "sha256": "4214d23605eea19d324210ad68ada5225528050abb903d19acc8a0e3268db8f1", + "sha256": "fc25f4d74c3d8a0be61dd9b7b006c93e806bc6dc048c05e98596e8542c1327c8", "shape": [ - 4096 + 1 ] }, "segment_offsets": { @@ -1792,8 +1826,8 @@ 2048, 640, 2048, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -1813,7 +1847,7 @@ "bytes": 2560, "dtype": "float32", "path": "encoder_0_mlp_w_out.bias.f32.bin", - "sha256": "3645d2a14f59327bfdb2fdb9a25d1fd73f210eb0d09d4ff9c1282216684f8411", + "sha256": "6d95b0054d8d8c155e33665b1fb3c0dd454478ad2a95eba4316160883bdefd47", "shape": [ 640 ] @@ -1822,7 +1856,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_0_mlp_w_out.layout_header.i32.bin", - "sha256": "d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311", + "sha256": "d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64", "shape": [ 13 ] @@ -1831,19 +1865,19 @@ "bytes": 327680, "dtype": "uint8", "path": "encoder_0_mlp_w_out.packed_weight.u8.bin", - "sha256": "d1834b3a1cfd59a330317fc20b6e5175e8efbdfb49d0cafe2187bda3da18151b", + "sha256": "2b475a637893e79948117383cd9138d44690a04653e49985b355e6e63693a783", "shape": [ 640, 512 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_0_mlp_w_out.scale_values.f32.bin", - "sha256": "55ae56768383392cdb0ce3dc1cb7e328065bac7b4d564636675908f7c7e2b5dc", + "sha256": "827241212e161c00a58bf08aeb8e001a475599cfb6786c2945b15dc39afe3dc7", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -1872,8 +1906,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -1893,7 +1927,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_1_attn_w_q.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -1902,19 +1936,19 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_1_attn_w_q.packed_weight.u8.bin", - "sha256": "243e87c08f505a34c72a257c31da63f389f0dc9e7709c1f3993b621936c1c5c6", + "sha256": "abe92f5a662e92da5725883968212a2e90a77f05e8499dd0eb5c3134279535cb", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_1_attn_w_q.scale_values.f32.bin", - "sha256": "6c3176454b5a9bc79ffa3a5b1426854dde1075fc8e95df718dbbf1e74c6a1a7d", + "sha256": "f92420a0087a6ad79021a64f1300eeb7d53c4146df1e5f92c339fdd606d4808b", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -1943,8 +1977,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -1964,7 +1998,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_1_attn_w_k.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -1973,19 +2007,19 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_1_attn_w_k.packed_weight.u8.bin", - "sha256": "ab05a077baeb46cdcc1d4aababdf59b5bea3aeffa68d20649de0e9fba1c37655", + "sha256": "27b7e94565efaf4b3c1518f3862c56328a9e2ecb594cdd76f52e8ecd87cbaeb2", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_1_attn_w_k.scale_values.f32.bin", - "sha256": "5cbbafe639997041e3d9f1af4841ad61ce3fb4a01051527147ffb82ca3d7be5d", + "sha256": "8e90310d7f602900c61d1ec0029aa69460d20598de178d6755dd8b6c42b109ba", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -2014,8 +2048,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -2035,7 +2069,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_1_attn_w_v.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -2044,19 +2078,19 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_1_attn_w_v.packed_weight.u8.bin", - "sha256": "6ba47a4c2c9493d604c2deccdf301f26327fd24aa4f8dea97ad227e1f6079297", + "sha256": "fe4fc47da4a97ad0fd49c5dcbb7175aec7a0d2f7fa4f9f82c2703ca88cd13b76", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_1_attn_w_v.scale_values.f32.bin", - "sha256": "7c225f027928a3506f88c02591bdf37ef8024f3facede11ed9b6cca961e01252", + "sha256": "b2efaab082de4926716917ed6472d67ead22eaf2c71ebdcae672069a4acdf9fe", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -2085,8 +2119,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -2106,7 +2140,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_1_attn_w_o.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -2115,19 +2149,19 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_1_attn_w_o.packed_weight.u8.bin", - "sha256": "8983ff941314f11b1763fcf4151acf8b5f253e1edaa1af513393064e51170db2", + "sha256": "e1d4ba087cb7fd9337ad647b9ef35af6ef83ef1a9e2611f177e7e76cec268d67", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_1_attn_w_o.scale_values.f32.bin", - "sha256": "33dbe8951b3b693cdb8142d6eb69c78b4e8759f288cc4a5318104ac02c80b843", + "sha256": "94401ac4905ab9a6a51cd297f505caa81434ed03ba406ef6a8cc3e1759b2dbcd", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -2156,8 +2190,8 @@ 640, 4096, 640, - 2, - 1, + 0, + 4096, 1, 80, 1, @@ -2177,7 +2211,7 @@ "bytes": 16384, "dtype": "float32", "path": "encoder_1_mlp_w_in.bias.f32.bin", - "sha256": "c0f7ec6b18dc60d7e34e54202e2dfa23161d0d1f9f236dc3793175b36787c33f", + "sha256": "025bae5bd7c6d3874c23d1348d4d32d7a5c399e719416f1b22112784599348f0", "shape": [ 4096 ] @@ -2186,7 +2220,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_1_mlp_w_in.layout_header.i32.bin", - "sha256": "b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f", + "sha256": "257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee", "shape": [ 13 ] @@ -2195,19 +2229,19 @@ "bytes": 655360, "dtype": "uint8", "path": "encoder_1_mlp_w_in.packed_weight.u8.bin", - "sha256": "2bb3428b472adfc90eb54828a2ead8b0ad6fdf2cc7b66675380493c22b20a62f", + "sha256": "97ff605bae210a9b872523f788aa25bf06ae8da80eb62537ac6ba898ab0cd4aa", "shape": [ 4096, 160 ] }, "scale_values": { - "bytes": 16384, + "bytes": 4, "dtype": "float32", "path": "encoder_1_mlp_w_in.scale_values.f32.bin", - "sha256": "f9da662769353c2563a0ede9f3d0c1f5a2c555ba0e0fa7fc44e3e618bd84c67c", + "sha256": "b14e688ad3655e5d1c26fc671f68d4911632515459181f058a45f5cc218a7973", "shape": [ - 4096 + 1 ] }, "segment_offsets": { @@ -2236,8 +2270,8 @@ 2048, 640, 2048, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -2257,7 +2291,7 @@ "bytes": 2560, "dtype": "float32", "path": "encoder_1_mlp_w_out.bias.f32.bin", - "sha256": "03b3887ae51c6b0037db1fd1f0de55da60433531a813d71fbde60aad3999a919", + "sha256": "44d5985a564ba0032aee0a81b081ba706266d8e085a12c7f44d688918c8f4811", "shape": [ 640 ] @@ -2266,7 +2300,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_1_mlp_w_out.layout_header.i32.bin", - "sha256": "d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311", + "sha256": "d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64", "shape": [ 13 ] @@ -2275,19 +2309,19 @@ "bytes": 327680, "dtype": "uint8", "path": "encoder_1_mlp_w_out.packed_weight.u8.bin", - "sha256": "5f22a3ff9267da588582fb278a582b05fe01b82db9926673cdac0ed2365c01c5", + "sha256": "7742ee5975e591618aabc5105a207b0f78065d02ee41cc6b45ac88df12bb4c1c", "shape": [ 640, 512 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_1_mlp_w_out.scale_values.f32.bin", - "sha256": "87b9271c50947f716a47673bc3d02148b87b5b907984913150bafd5fe213fdbc", + "sha256": "d4519cac1203163e20411c81058fcc9e15b2715b873377d9867a23f75a878b8a", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -2316,8 +2350,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -2337,7 +2371,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_2_attn_w_q.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -2346,19 +2380,19 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_2_attn_w_q.packed_weight.u8.bin", - "sha256": "6eb5f07dfaf3775aff9c4d2b6401f2a03dc1d62d7860673cfbbc4503a67ffdf8", + "sha256": "4046b1503f400adae06277ce337563059601462ea3ed824adc1143d2bbae8d25", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_2_attn_w_q.scale_values.f32.bin", - "sha256": "35f7c5b339f31018f1c2f6bc9d3d4fc7f583f3bf363748d5c2d0fb2b65358293", + "sha256": "b6a2a79210118706fe89b4ddb96a41eb06075852ab1c209cdcab1652caa3907c", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -2387,8 +2421,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -2408,7 +2442,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_2_attn_w_k.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -2417,19 +2451,19 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_2_attn_w_k.packed_weight.u8.bin", - "sha256": "b3969a8412ef274fdd8d1cdc0e717e65f093fea4b81ea1e4b86946396353282a", + "sha256": "32ed7fb622aff2cf751fbd3986344f581380fc2d004517e2b3b7ae111fd31bca", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_2_attn_w_k.scale_values.f32.bin", - "sha256": "23558f8ad5065804514f605ae8632576452de53ce75d1ec1b8dc407891c59f84", + "sha256": "8607a763ae93991b49232ae2fd052fc67c7709ef43d9074d8bd91c940a2f4217", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -2458,8 +2492,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -2479,7 +2513,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_2_attn_w_v.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -2488,19 +2522,19 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_2_attn_w_v.packed_weight.u8.bin", - "sha256": "df51d4bc08980ab65070ea27f26c7214cf85772646fe3c012d5abb2a38c18c1c", + "sha256": "64940ce687d9f5cac4bc5c0ebeedaecb3e8551bfaf05135a27c04b4158b9b9f2", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_2_attn_w_v.scale_values.f32.bin", - "sha256": "9ccbe7a70a3661ec2f4759630383a3d9a55580a8d06df0e9cfecd64fecfc8558", + "sha256": "17eb0fc4ae802ce844e776193fc48d96664c74682bd8ed65f0659401c25ccee2", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -2529,8 +2563,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -2550,7 +2584,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_2_attn_w_o.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -2559,19 +2593,19 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_2_attn_w_o.packed_weight.u8.bin", - "sha256": "47d3496f29a2bd312b933e603109579534f189ac81bb9b85df90ca5489ba1b42", + "sha256": "4cd3154e5a261d3671f9255147f5c7c123b89e391fa8d95d0e0d8f0aee5b6824", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_2_attn_w_o.scale_values.f32.bin", - "sha256": "f4af4886a665b8eef127c37bed55363902266d84244dccf22aba98b57944a36c", + "sha256": "bd285179d72698f1f3ec0a18f279f4656df36d31c859f2b106ec8b01caa99dad", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -2600,8 +2634,8 @@ 640, 4096, 640, - 2, - 1, + 0, + 4096, 1, 80, 1, @@ -2621,7 +2655,7 @@ "bytes": 16384, "dtype": "float32", "path": "encoder_2_mlp_w_in.bias.f32.bin", - "sha256": "5ae3330307450ac03ac34415b7644e09a0e2cb7ad403d1b5f12ab901de109998", + "sha256": "756a058396dc773b98e7fb45c72299bb1402b3a7f4ff319a435fdae1a5a14a0d", "shape": [ 4096 ] @@ -2630,7 +2664,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_2_mlp_w_in.layout_header.i32.bin", - "sha256": "b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f", + "sha256": "257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee", "shape": [ 13 ] @@ -2639,19 +2673,19 @@ "bytes": 655360, "dtype": "uint8", "path": "encoder_2_mlp_w_in.packed_weight.u8.bin", - "sha256": "b786e18f9b0969d9582a9d7ab2c068409064ac30d1ec2233973ff0d7f5348772", + "sha256": "5c27668c24ade7f4989551e3a23c729512fa3399126e8131a9a7c3b7beba93f2", "shape": [ 4096, 160 ] }, "scale_values": { - "bytes": 16384, + "bytes": 4, "dtype": "float32", "path": "encoder_2_mlp_w_in.scale_values.f32.bin", - "sha256": "7a8be72029c197396595545fb4c87c3a9537fc1806948f07ab10435af3f6b728", + "sha256": "ea11ebc8e04d3fa09dad49efbb2465b461308a8353d1fddf1008c25cf47b1f49", "shape": [ - 4096 + 1 ] }, "segment_offsets": { @@ -2680,8 +2714,8 @@ 2048, 640, 2048, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -2701,7 +2735,7 @@ "bytes": 2560, "dtype": "float32", "path": "encoder_2_mlp_w_out.bias.f32.bin", - "sha256": "d8dc575af7db2cc39fdf5088a8b3ddb2ffe120ce316e80589f7d67b39aa626ad", + "sha256": "1a85a10eac9d0a55eec02edf2e3b706e87066e836808c100715b883e65689cc5", "shape": [ 640 ] @@ -2710,7 +2744,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_2_mlp_w_out.layout_header.i32.bin", - "sha256": "d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311", + "sha256": "d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64", "shape": [ 13 ] @@ -2719,19 +2753,19 @@ "bytes": 327680, "dtype": "uint8", "path": "encoder_2_mlp_w_out.packed_weight.u8.bin", - "sha256": "6575ab2984c61b415323a968cf2ccf84721f33259e0d940a8a6d79a082daecfe", + "sha256": "dd26321691449af82d643801b9262dff7365260cc32b665c25dee5889cd4df69", "shape": [ 640, 512 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_2_mlp_w_out.scale_values.f32.bin", - "sha256": "7db5cc7f85da5f79e2937f9bc4fc646bca21ed4baf75f566ae9cfe7b8105f202", + "sha256": "ca2d4e4c3da8b0e7a0ab688a4883b2040bebf1e22d545576a795c847e5ea2b28", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -2760,8 +2794,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -2781,7 +2815,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_3_attn_w_q.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -2790,19 +2824,19 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_3_attn_w_q.packed_weight.u8.bin", - "sha256": "43c4f0d6d23b5af6fe7c2c3e1b109c2055490098b3fc31683a550a43f059e298", + "sha256": "baa0d119c263884f0022dff7e7e4020996ea2c91c9912f568f2ede5559432027", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_3_attn_w_q.scale_values.f32.bin", - "sha256": "f63de5f104f49da4f9ad4b052a01e94ab70ac250f4ebfc81dfb804932d434cec", + "sha256": "adad57af78e9167da8b4e5855e46083456100ffd1ed101e0f84074e9496c7d27", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -2831,8 +2865,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -2852,7 +2886,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_3_attn_w_k.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -2861,19 +2895,19 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_3_attn_w_k.packed_weight.u8.bin", - "sha256": "60c7759210f429d911ecc35e4b8713aaae9dfd8633f7346bae24f736500afe35", + "sha256": "5a9a3e87cb0ccf9381821b2c13cd09a88996d04fcd808ae3b6313622c9986444", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_3_attn_w_k.scale_values.f32.bin", - "sha256": "896f661939f2fe43a62b13be603f2596dc3df6dd6cd9c0cad1fb2f13105184de", + "sha256": "c94e97d5feb0a8acb690700c648981cd8ddadef54399a0a263cb112141cea08d", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -2902,8 +2936,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -2923,7 +2957,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_3_attn_w_v.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -2932,19 +2966,19 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_3_attn_w_v.packed_weight.u8.bin", - "sha256": "4a6340999dbfd52b72ac1c8ab26ea8981e2d66638afde19e3498caff88eb74e8", + "sha256": "2bd7d1359728efce205ef25d36c8d47b7ded204343a3074ca03ad64bb485ae42", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_3_attn_w_v.scale_values.f32.bin", - "sha256": "b02dd07f237f832e50c41bd2e400e30bf13f7dccea1ab1befef78c76d342da95", + "sha256": "f7b3d178706d789bfbc5ed3419c8abdfce30d733cd967d5a7ce3f92560ecb7aa", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -2973,8 +3007,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -2994,7 +3028,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_3_attn_w_o.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -3003,19 +3037,19 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_3_attn_w_o.packed_weight.u8.bin", - "sha256": "de6d38106a582dfc0845e37d832281ca3ec94c62c1a935b35277ad2a793879ca", + "sha256": "6291c1abeaaea0b97649438a296d76ceb106575b71884102d3542b00ef05e8c6", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_3_attn_w_o.scale_values.f32.bin", - "sha256": "1fc6de6742fae87884a5e630e7c409fb39c9d4420875236665543be890a0740e", + "sha256": "bd39061fcce791e35176cff9de492ef93343a6c39e27730e241ddedfb549a768", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -3044,8 +3078,8 @@ 640, 4096, 640, - 2, - 1, + 0, + 4096, 1, 80, 1, @@ -3065,7 +3099,7 @@ "bytes": 16384, "dtype": "float32", "path": "encoder_3_mlp_w_in.bias.f32.bin", - "sha256": "92a57bf5d82d7f0babb971567adbc2dfef3ca28e891a80ee8ac7813419886e91", + "sha256": "fd93590315d0550dadb82709589d499011558085fe7f42aa87a41a87c2742e9f", "shape": [ 4096 ] @@ -3074,7 +3108,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_3_mlp_w_in.layout_header.i32.bin", - "sha256": "b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f", + "sha256": "257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee", "shape": [ 13 ] @@ -3083,19 +3117,19 @@ "bytes": 655360, "dtype": "uint8", "path": "encoder_3_mlp_w_in.packed_weight.u8.bin", - "sha256": "11aae0a6d3a6390a198d014591584419c976d321d86324e2289c322c061878dd", + "sha256": "8b117e51f471d478c8c5da5e498e0635c1ce74b32e75e4d923b6485ea87353da", "shape": [ 4096, 160 ] }, "scale_values": { - "bytes": 16384, + "bytes": 4, "dtype": "float32", "path": "encoder_3_mlp_w_in.scale_values.f32.bin", - "sha256": "68a6035063d24067df5d569aa4702b2ec33e402ac4396206eba32bbebacefcdf", + "sha256": "49e75f99e2d5f25276cbb411044e6acc42c8b520b449a0e88d0f36927fdb3b9b", "shape": [ - 4096 + 1 ] }, "segment_offsets": { @@ -3124,8 +3158,8 @@ 2048, 640, 2048, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -3145,7 +3179,7 @@ "bytes": 2560, "dtype": "float32", "path": "encoder_3_mlp_w_out.bias.f32.bin", - "sha256": "28cb43daae4e8a25875c6cda35e6386f889703430a87333fae4bd8be9dea69b4", + "sha256": "0f4777ca7ed1def47f66c0c13245e859f585b3401bff9b2fc0692869bcf6c3b8", "shape": [ 640 ] @@ -3154,7 +3188,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_3_mlp_w_out.layout_header.i32.bin", - "sha256": "d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311", + "sha256": "d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64", "shape": [ 13 ] @@ -3163,19 +3197,19 @@ "bytes": 327680, "dtype": "uint8", "path": "encoder_3_mlp_w_out.packed_weight.u8.bin", - "sha256": "e9b02f483fb6df052ea1fcb6ff5d088de525d94cf94fe964839eaaf7926c400e", + "sha256": "3ddab3f329beb5d19a28e69aef00ac69b708a6696f78e84254033d362b4cff02", "shape": [ 640, 512 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_3_mlp_w_out.scale_values.f32.bin", - "sha256": "37e993462b64df0e8a791fc642c905c6cd95740fcbe052de7b27df97e5808bb7", + "sha256": "fc14d3937542e30e559658d7b9bb2377fd78c81771e3f3e7cc20c690648ea7b4", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -3204,8 +3238,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -3225,7 +3259,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_4_attn_w_q.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -3234,19 +3268,19 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_4_attn_w_q.packed_weight.u8.bin", - "sha256": "d13a5cc5326e6b273e9af183087beca2cb322d8116c7424480aee6bb815b79f4", + "sha256": "728a805cfca6f97949f88c31871ef1be00603a46d9bf20fbbeaf9a63ecd92167", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_4_attn_w_q.scale_values.f32.bin", - "sha256": "2eb000a73abd37c474f2fa50f53e25d2d44c91929890d30b919c9ec8539a688c", + "sha256": "3b9e454e60a6a13e5102da4c03d527762bcf2b9bf12d486e799d61c3658c8dcd", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -3275,8 +3309,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -3296,7 +3330,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_4_attn_w_k.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -3305,19 +3339,19 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_4_attn_w_k.packed_weight.u8.bin", - "sha256": "c8d53dfc417dbd95009affeda84ee76f88467621e5a13e4057ff3345ff818c87", + "sha256": "10a703b02e24bbfaf3495bc1425befd4a89e9c6f09744e2a1c0706355cbcbeec", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_4_attn_w_k.scale_values.f32.bin", - "sha256": "a9089ee1b7185ccabf994b5f70eab40a93fb3ddc973499c59cd11aa34519029e", + "sha256": "531f130bb155c8228c57f8775050b5bc55fe608c07b428bc621c7a2397638773", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -3346,8 +3380,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -3367,7 +3401,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_4_attn_w_v.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -3376,19 +3410,19 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_4_attn_w_v.packed_weight.u8.bin", - "sha256": "02584e448294863bcbe19188adf9a6674b1428b823a0c8711bb88de01091c1ce", + "sha256": "e5d4f475baae4060d3cc5a3a82f3a52ad92447d23710c3bb3577d99a02ce890d", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_4_attn_w_v.scale_values.f32.bin", - "sha256": "460bbf25434d9c7ad6edfed3c3c4f1f5ad70c7062666f2348fbd85b16932a5ff", + "sha256": "8dc5c14c4a1ce0a7eda48fedb3496c154e2fd035b372b8c1fbb67ebfcbc3ad95", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -3417,8 +3451,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -3438,7 +3472,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_4_attn_w_o.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -3447,19 +3481,19 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_4_attn_w_o.packed_weight.u8.bin", - "sha256": "1ff8d4a4f1b91665ca3a74d58fb90619d67a383655a392ab2d1402ab4584af26", + "sha256": "a94d196e77a98f4ed95df7a9102b2991e536dc5f3071302b1a497fce6d5de673", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_4_attn_w_o.scale_values.f32.bin", - "sha256": "7900c5f4c08328434107eeb6a977d3e52e24d2e6e03ddd12ff960db27586c30b", + "sha256": "65dafd5676fdc4978472be0e5ffecd6e5ec5549fb6d5664b79e8d02e4cd0878d", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -3488,8 +3522,8 @@ 640, 4096, 640, - 2, - 1, + 0, + 4096, 1, 80, 1, @@ -3509,7 +3543,7 @@ "bytes": 16384, "dtype": "float32", "path": "encoder_4_mlp_w_in.bias.f32.bin", - "sha256": "99053239c0447eb027095c62e66ac96c7ff6ff914c491bafb83b114bc3733c19", + "sha256": "1895bd3a783cadcce33598fd40adbec1468989bfb911673a0fb315883e21647e", "shape": [ 4096 ] @@ -3518,7 +3552,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_4_mlp_w_in.layout_header.i32.bin", - "sha256": "b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f", + "sha256": "257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee", "shape": [ 13 ] @@ -3527,19 +3561,19 @@ "bytes": 655360, "dtype": "uint8", "path": "encoder_4_mlp_w_in.packed_weight.u8.bin", - "sha256": "e7149c7d3ff509391cdba5af5d102429a7d235e1d41d582ea3565dabc7fee453", + "sha256": "9d3742046e3c417116c43c76a09c313d31979170bd39d42a5dde6f0a7e9ad08c", "shape": [ 4096, 160 ] }, "scale_values": { - "bytes": 16384, + "bytes": 4, "dtype": "float32", "path": "encoder_4_mlp_w_in.scale_values.f32.bin", - "sha256": "493293bce6191f6df816e466933ff0c061273c1cec8d0fdd103131507cb21591", + "sha256": "88b516eb6de001eed4819d59a8e8af51f48eabf45e0e08400cf7351198e404b8", "shape": [ - 4096 + 1 ] }, "segment_offsets": { @@ -3568,8 +3602,8 @@ 2048, 640, 2048, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -3589,7 +3623,7 @@ "bytes": 2560, "dtype": "float32", "path": "encoder_4_mlp_w_out.bias.f32.bin", - "sha256": "37d72c03868b46c203a0550dc208cfc4fc89cfc963272e602a9f9114749453a2", + "sha256": "a37f53e3778a72816f2020f1e2e74ce0387bf8f7f1894bcb5e21337b17a975a5", "shape": [ 640 ] @@ -3598,7 +3632,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_4_mlp_w_out.layout_header.i32.bin", - "sha256": "d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311", + "sha256": "d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64", "shape": [ 13 ] @@ -3607,19 +3641,19 @@ "bytes": 327680, "dtype": "uint8", "path": "encoder_4_mlp_w_out.packed_weight.u8.bin", - "sha256": "97c0df1606d2c2170c3fc4a0fa68777a6be93cc63d11641a113ddd144a69a803", + "sha256": "cb2919b644968c18f3d8d07f4a7c2dff37300f3a19ca9252d608515e27356843", "shape": [ 640, 512 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_4_mlp_w_out.scale_values.f32.bin", - "sha256": "9183e05de7aa601048f5715c1e04220ef4509b9db1a48afff7ed161c1f2fc910", + "sha256": "acf932162b73f02f4dac3a61e9fbb063804e282e457542dcb81087ac0288e496", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -3648,8 +3682,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -3669,7 +3703,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_5_attn_w_q.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -3678,19 +3712,19 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_5_attn_w_q.packed_weight.u8.bin", - "sha256": "b99d0e715a452c6efce69fcbdb8eceade7864e7d19c189fc55a4f0ef614e593b", + "sha256": "7dd4d44c1ffabf832cb1a2de16b9fe41eda6fdab014995e14d8e985656429fef", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_5_attn_w_q.scale_values.f32.bin", - "sha256": "4f9b137787662c0645bf2d15231874a41d42101fb6c753ff543f1b4a06c598d0", + "sha256": "7624e04915864961ee93653aa33a552ae72de0f333aac4bb5070ee12d3164a02", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -3719,8 +3753,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -3740,7 +3774,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_5_attn_w_k.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -3749,19 +3783,19 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_5_attn_w_k.packed_weight.u8.bin", - "sha256": "033c651731ecdcf3c309d6473c4f1597fa590b092540f0cefdca861befe49eed", + "sha256": "6050252cdefae7097fef44b72a46832ef84555bf3129e31fb1706699b54fb993", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_5_attn_w_k.scale_values.f32.bin", - "sha256": "796fd982b5307ac8adc45a87b35fedf54cfa422ccc8e3e41b60f8009e45e3697", + "sha256": "821f63202f456185ca334f8df5549720d54d696d62ed9ae84dfe0ba200913545", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -3790,8 +3824,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -3811,7 +3845,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_5_attn_w_v.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -3820,19 +3854,19 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_5_attn_w_v.packed_weight.u8.bin", - "sha256": "d87031bdf3e41ea52362d83567809bff5110295124ee8e91f5f6e5a1e35645ed", + "sha256": "e53e30cf99dfb375124f09e4aafd8f94d002f350320d64ed184535c6494d67f7", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_5_attn_w_v.scale_values.f32.bin", - "sha256": "03788514329cad1f28970b717a4d43ef4a85e0278ed0dd885fe9d756ecfffb88", + "sha256": "f76061e291a207776605c5ad3c7d62fe4d33568ecc9033af6c0b627e411b3c11", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -3861,8 +3895,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -3882,7 +3916,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_5_attn_w_o.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -3891,19 +3925,19 @@ "bytes": 102400, "dtype": "uint8", "path": "encoder_5_attn_w_o.packed_weight.u8.bin", - "sha256": "a443fcae9400696e87049635cedfec342aee78caa3c2c4a773c23bc7554c9324", + "sha256": "0c9021bc8c3337e9e07cdeac52581df7895492820dd4c39aa2a8fa0a170e21a0", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_5_attn_w_o.scale_values.f32.bin", - "sha256": "1dcb875baa0c7acf4f19cec6638a5f604f16fef674780d3a5fd83fabda38a5b1", + "sha256": "79dcab88153ccd85a92bf06a820212da7514276d13c9d246b383731a60ad4278", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -3932,8 +3966,8 @@ 640, 4096, 640, - 2, - 1, + 0, + 4096, 1, 80, 1, @@ -3953,7 +3987,7 @@ "bytes": 16384, "dtype": "float32", "path": "encoder_5_mlp_w_in.bias.f32.bin", - "sha256": "191a36a424ec4dee9cbafac1f3fd69e4123c65e4bed4688de86a7c9b1a0406ef", + "sha256": "84867af91e82c506906ddb71b0a230680dd925d90773bb297b7fd5b0b7713542", "shape": [ 4096 ] @@ -3962,7 +3996,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_5_mlp_w_in.layout_header.i32.bin", - "sha256": "b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f", + "sha256": "257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee", "shape": [ 13 ] @@ -3971,19 +4005,19 @@ "bytes": 655360, "dtype": "uint8", "path": "encoder_5_mlp_w_in.packed_weight.u8.bin", - "sha256": "0b00064f3d22bdd64802c393149373738a78e7c5a24ac297fcee3b165acda3e8", + "sha256": "93f7b29f255947dd72d7a5ad15b60f2c68c4b3e148b922f4794bcf96bf7aef87", "shape": [ 4096, 160 ] }, "scale_values": { - "bytes": 16384, + "bytes": 4, "dtype": "float32", "path": "encoder_5_mlp_w_in.scale_values.f32.bin", - "sha256": "7452e6a08f8d28e1a2f4f84ea908a32bf76fb480751d5ece73faa33490950cd3", + "sha256": "07471f0e22ba2cd8c2c7b735c203d91c874fc834b4209788a236fc9529247943", "shape": [ - 4096 + 1 ] }, "segment_offsets": { @@ -4012,8 +4046,8 @@ 2048, 640, 2048, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -4033,7 +4067,7 @@ "bytes": 2560, "dtype": "float32", "path": "encoder_5_mlp_w_out.bias.f32.bin", - "sha256": "cb7da7b400d0281d2afa3b758997e2af9ef546bcaeedb7d7adbdbf012699d243", + "sha256": "d1ccf0c6e752d23d27842dde01b4bc430190dab45e3bfa8dd8417dfe4c13cb15", "shape": [ 640 ] @@ -4042,7 +4076,7 @@ "bytes": 52, "dtype": "int32", "path": "encoder_5_mlp_w_out.layout_header.i32.bin", - "sha256": "d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311", + "sha256": "d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64", "shape": [ 13 ] @@ -4051,19 +4085,19 @@ "bytes": 327680, "dtype": "uint8", "path": "encoder_5_mlp_w_out.packed_weight.u8.bin", - "sha256": "62ba8a94c88e14d9cfdafd791553656c8391223f1adfdeff3d7c6d73aa461d57", + "sha256": "5c8cf16a336ac7618477e7a52f8eb8b12d5bbd7004f961745f08abfb3f36039d", "shape": [ 640, 512 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "encoder_5_mlp_w_out.scale_values.f32.bin", - "sha256": "bdd75db75a35624ce71b7c3a0f77e2d2e7123f619afa3f2e3f5247f72bb9e9a2", + "sha256": "4587070b10b62cb7687541b3e9946824e292b8f024c39b9d388202d61a5244b4", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -4092,8 +4126,8 @@ 640, 4096, 640, - 2, - 1, + 0, + 4096, 1, 80, 1, @@ -4113,7 +4147,7 @@ "bytes": 16384, "dtype": "float32", "path": "decoder_0_self_attn_block_mlp_w_in.bias.f32.bin", - "sha256": "03f4c36fe4f7d830223a0f442b9b15a6b82a10dd37f139d1bcf6b67b097b8f5b", + "sha256": "e31392b1c36010e0789ec0b99e127aeef5058181d02807917ff9dd091777b9fd", "shape": [ 4096 ] @@ -4122,7 +4156,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_0_self_attn_block_mlp_w_in.layout_header.i32.bin", - "sha256": "b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f", + "sha256": "257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee", "shape": [ 13 ] @@ -4131,19 +4165,19 @@ "bytes": 655360, "dtype": "uint8", "path": "decoder_0_self_attn_block_mlp_w_in.packed_weight.u8.bin", - "sha256": "a93390ed156e0b0fe0886c537b4c223efa58119a2d3ef74a509feffb8d3a5faf", + "sha256": "9cb2abe959183ae123b07b3ab1db7b98eb21a72e6775282e1793ec1efd6a9f51", "shape": [ 4096, 160 ] }, "scale_values": { - "bytes": 16384, + "bytes": 4, "dtype": "float32", "path": "decoder_0_self_attn_block_mlp_w_in.scale_values.f32.bin", - "sha256": "42a65fe4d99200f8d73192af4c23ece3b905554d184fb1ff2f245916aa1d00a7", + "sha256": "203c7722acd5a6a17458bcace023040352b430777f2bf1668ec64ef00774bec6", "shape": [ - 4096 + 1 ] }, "segment_offsets": { @@ -4172,8 +4206,8 @@ 2048, 640, 2048, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -4193,7 +4227,7 @@ "bytes": 2560, "dtype": "float32", "path": "decoder_0_self_attn_block_mlp_w_out.bias.f32.bin", - "sha256": "65c03a26b3b5cc37f42318ca20e55cdc4fdb3df11b031aa1056c5fb7311717f1", + "sha256": "d483dd0a73a79a2a5a78cdc9629f7658f6e6eecdd50647fbf1df6a7784a48d4c", "shape": [ 640 ] @@ -4202,7 +4236,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_0_self_attn_block_mlp_w_out.layout_header.i32.bin", - "sha256": "d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311", + "sha256": "d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64", "shape": [ 13 ] @@ -4211,19 +4245,19 @@ "bytes": 327680, "dtype": "uint8", "path": "decoder_0_self_attn_block_mlp_w_out.packed_weight.u8.bin", - "sha256": "e3ed6900ac4cbfc0c66404135ed3357764c8bb91b14481969406d10651d6a380", + "sha256": "66ebf71cf9aa0930f98edead53d5c6557294117e52c6060d3e515385fb8b7c21", "shape": [ 640, 512 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_0_self_attn_block_mlp_w_out.scale_values.f32.bin", - "sha256": "2e1b173e866f97309124e9e65ebfbc84a34e5855125b20ebca2ff54f16b1b793", + "sha256": "2e3753caa7aaccec574fe60f6e7da33de305c0698012ad5f666cb78f7b9a8207", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -4252,8 +4286,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -4273,7 +4307,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_0_self_attn_block_attn_w_q.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -4282,19 +4316,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_0_self_attn_block_attn_w_q.packed_weight.u8.bin", - "sha256": "9bffd32c4471bcdfc023a17d068eadf47632e0da196f2de8afb3c0748852ba89", + "sha256": "b69a0802082960964d365f01736cc207853276e8ee31f16a62d67a9e9f6fe4e0", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_0_self_attn_block_attn_w_q.scale_values.f32.bin", - "sha256": "ace432da1e7b4f9731947428b48cb68caa0a3d9092a9da11dcdb4387fef97048", + "sha256": "cce1c626617073725f601763dca680ec47d2133ea70f7d8e6d2c4834a3534860", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -4323,8 +4357,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -4344,7 +4378,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_0_self_attn_block_attn_w_k.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -4353,19 +4387,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_0_self_attn_block_attn_w_k.packed_weight.u8.bin", - "sha256": "a315b12d0b86f25cc04527a71f8743d9bd1d3cf0bd4908142dd960c0b086b956", + "sha256": "a08b0d5a4abc10a63261efd14e67113fc454547474fc7473a3391a2682d92f58", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_0_self_attn_block_attn_w_k.scale_values.f32.bin", - "sha256": "28cf54f16e3af1f8b4c98f645e3075e9b88f3a87b118056bb1da4c086895bf07", + "sha256": "0e98fb82ceccf1cce50a58a31c2bc5aa778528de7112166fd3a3d9e0d8d160c4", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -4394,8 +4428,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -4415,7 +4449,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_0_self_attn_block_attn_w_v.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -4424,19 +4458,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_0_self_attn_block_attn_w_v.packed_weight.u8.bin", - "sha256": "e8e19b7b1b4afb0ba99f550b05516e6f49b5b717d1f3494c0e2b2e8aa95782ff", + "sha256": "4e724fdeaa3bf358ce60a23b5819f16e3d6953d27345b59051bcca52b6d535e2", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_0_self_attn_block_attn_w_v.scale_values.f32.bin", - "sha256": "f7db1205ef1a06954b3ec54f2a6f25c354d2ec62f647087dd59159bd66b5abba", + "sha256": "0164f5b76a21689a3217a3a14b333715ba53ff3515d6a47d993062ccf1eec43a", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -4465,8 +4499,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -4486,7 +4520,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_0_self_attn_block_attn_w_o.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -4495,19 +4529,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_0_self_attn_block_attn_w_o.packed_weight.u8.bin", - "sha256": "b68167c060a0068345304b71046c1b220738cdb1fca03ff28daef70e12414b0a", + "sha256": "41d3f58c4e1c71a5e4238ecb90580beb3ecb66d82074d462f6bba66410488ed4", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_0_self_attn_block_attn_w_o.scale_values.f32.bin", - "sha256": "3ca8fa5888fb89bbac7e20dbe4a6fc50f040b38977ce0ca892da7464b2e5a8e1", + "sha256": "9335b23e739a7ea4fb3e2a1406ff9a264afc8cb3a6aba655f76ffb98a965e472", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -4536,8 +4570,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -4557,7 +4591,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_0_cross_block_cross_w_q.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -4566,19 +4600,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_0_cross_block_cross_w_q.packed_weight.u8.bin", - "sha256": "cdb4e6bfba40293068056ce54f3e4c97b0c3b1a0aed88969106d1e9d3a0aff7e", + "sha256": "af7d96d094f15aec2e3085ed7886bc977551a73ec02f8303de8aae92c1a9dc5b", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_0_cross_block_cross_w_q.scale_values.f32.bin", - "sha256": "7b2f4085a97118a209bf0cd98997c037aaed5437047cac9405c2cddabf5565d3", + "sha256": "8dd70c2cf3f9bd573a92e6e26febf05f647c9aa2a96be406653c820ad0236fd7", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -4607,8 +4641,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -4628,7 +4662,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_0_cross_block_cross_w_k.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -4637,19 +4671,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_0_cross_block_cross_w_k.packed_weight.u8.bin", - "sha256": "dab1fe7b8a9c0d16962d04385eb4bd8278ebc6b710048e308f4e952815704a89", + "sha256": "08479bdf9b9e401f6cb67193a75376c4d033262548fdb311cb43304639416056", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_0_cross_block_cross_w_k.scale_values.f32.bin", - "sha256": "ccda5b9b61ca846d301dbf9745c708b2167137998117d3ab418e8afb2444d49c", + "sha256": "5f1804fd15e3d2f211b606b28e53cf7f6c9dba0b41aca6331c21267374a2d2af", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -4678,8 +4712,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -4699,7 +4733,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_0_cross_block_cross_w_v.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -4708,19 +4742,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_0_cross_block_cross_w_v.packed_weight.u8.bin", - "sha256": "bce666c81785261a37d521f07d4d33311234b80a61f376301b81c66fc45c37fa", + "sha256": "e22c38d92ffc3b80e9e671365641515aea6d6752bc5daad7093fadf0cc824d6b", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_0_cross_block_cross_w_v.scale_values.f32.bin", - "sha256": "a5caee871504a64e3511d4abbfad95d73af3cc09261c05b6c0f536bac8b54161", + "sha256": "66caf7ed5c1928df1a13e925b9dc0668f373d962df677fe30849d7d651490180", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -4749,8 +4783,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -4770,7 +4804,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_0_cross_block_cross_w_o.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -4779,19 +4813,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_0_cross_block_cross_w_o.packed_weight.u8.bin", - "sha256": "a27b0efed3dc1b8317570f0b1c8c69dae70290817b2e5a6e6f2ce3be3793e0fe", + "sha256": "626e1354171e0957b38f6a2477c00951a23c6817ed63da0407e5eaed32d7a8c0", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_0_cross_block_cross_w_o.scale_values.f32.bin", - "sha256": "0b675f7d7585183acc3ae150ff7795d89028ad8f54dbd834b84f42d02b3d6a4f", + "sha256": "5a9d7dba971eab55495a66c347f16b6f87381a569377479629f0afb1e024b64c", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -4820,8 +4854,8 @@ 640, 4096, 640, - 2, - 1, + 0, + 4096, 1, 80, 1, @@ -4841,7 +4875,7 @@ "bytes": 16384, "dtype": "float32", "path": "decoder_0_cross_block_mlp_w_in.bias.f32.bin", - "sha256": "0d1c7b21f7a5b3247e98ad66ad7e06b4405cd982256e530764ca6e81b14fd441", + "sha256": "05ca09aa97d5c292ea175fdba1462466841965246c1f484fe65a8796fb730d6a", "shape": [ 4096 ] @@ -4850,7 +4884,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_0_cross_block_mlp_w_in.layout_header.i32.bin", - "sha256": "b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f", + "sha256": "257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee", "shape": [ 13 ] @@ -4859,19 +4893,19 @@ "bytes": 655360, "dtype": "uint8", "path": "decoder_0_cross_block_mlp_w_in.packed_weight.u8.bin", - "sha256": "1b0ff6a2225621176cd52511c077eaa16aca405450460acf1ea1e0733fb676b3", + "sha256": "01a9eafef410331309602cfd32771cf501cd4c49ee2288717fdc8f8cf3103056", "shape": [ 4096, 160 ] }, "scale_values": { - "bytes": 16384, + "bytes": 4, "dtype": "float32", "path": "decoder_0_cross_block_mlp_w_in.scale_values.f32.bin", - "sha256": "11410d9dd859c6356330fd0ff8c0f5d0ad6cd29d2498e14a3e5b2f11e5d78acd", + "sha256": "334cbe3fc324d58e30e72661d54c03ed1085c27b3d642851df99d165861e2e23", "shape": [ - 4096 + 1 ] }, "segment_offsets": { @@ -4900,8 +4934,8 @@ 2048, 640, 2048, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -4921,7 +4955,7 @@ "bytes": 2560, "dtype": "float32", "path": "decoder_0_cross_block_mlp_w_out.bias.f32.bin", - "sha256": "ad99b45a62019c799b3fb1bb85547e9c2f260f88ce0a791e7cbe6a66b22f4cb7", + "sha256": "cd523a559d16f295950e4eefba07a2f728433c7ead25c64bfd23ab91107239d3", "shape": [ 640 ] @@ -4930,7 +4964,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_0_cross_block_mlp_w_out.layout_header.i32.bin", - "sha256": "d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311", + "sha256": "d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64", "shape": [ 13 ] @@ -4939,19 +4973,19 @@ "bytes": 327680, "dtype": "uint8", "path": "decoder_0_cross_block_mlp_w_out.packed_weight.u8.bin", - "sha256": "f8b98787aff27d2c5c2ef02ee5a8e2d51ae48477440c14aeb3f80f518bea0086", + "sha256": "b9506f4167f7524afe5d3b1acc61e8ceab2d3137ec6f4b545d24f9ba31c8c7bf", "shape": [ 640, 512 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_0_cross_block_mlp_w_out.scale_values.f32.bin", - "sha256": "d1cf7d1512bb52ed1cd21db60765567bed2cb48f248fb81b68b82a0bf01991a7", + "sha256": "711af3f0d6d03e14c13f3536cd4c46f20a8b727fbd25b2b2e7f1b97f60194c1d", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -4980,8 +5014,8 @@ 640, 4096, 640, - 2, - 1, + 0, + 4096, 1, 80, 1, @@ -5001,7 +5035,7 @@ "bytes": 16384, "dtype": "float32", "path": "decoder_1_self_attn_block_mlp_w_in.bias.f32.bin", - "sha256": "db359faa9d174bff94c2274019c8401c9b9cdd5fec5c3c7da9e7dbe7627723e4", + "sha256": "cf73fdfbe8b4919a8011de646e3cc5a1d8438fc08cc1d70403453f39d8bf5a9b", "shape": [ 4096 ] @@ -5010,7 +5044,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_1_self_attn_block_mlp_w_in.layout_header.i32.bin", - "sha256": "b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f", + "sha256": "257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee", "shape": [ 13 ] @@ -5019,19 +5053,19 @@ "bytes": 655360, "dtype": "uint8", "path": "decoder_1_self_attn_block_mlp_w_in.packed_weight.u8.bin", - "sha256": "da5f2bb8654af32349bffb9907ee0db606fa63df16a5802c29700cc33b9de975", + "sha256": "c035ce58f51ad9bdb3869a4b4fc5d49a9fdb3ae922c8748d04d5fcba076eaa0d", "shape": [ 4096, 160 ] }, "scale_values": { - "bytes": 16384, + "bytes": 4, "dtype": "float32", "path": "decoder_1_self_attn_block_mlp_w_in.scale_values.f32.bin", - "sha256": "8cec28ced33955f68fddbbd870c2a0b0fd969eb6b478b3a4cdba0cbf56a6fd22", + "sha256": "0848c8fa964abf68b054126ff610f8525c1030c0f0c8c061d865dfacd66c938b", "shape": [ - 4096 + 1 ] }, "segment_offsets": { @@ -5060,8 +5094,8 @@ 2048, 640, 2048, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -5081,7 +5115,7 @@ "bytes": 2560, "dtype": "float32", "path": "decoder_1_self_attn_block_mlp_w_out.bias.f32.bin", - "sha256": "013cfd5cdffcfff5bc159d970f94d01811f6f3d118fdea9ac821333f2af399b1", + "sha256": "5a1f09f3f10cc9731a269ec34ac6e5f721ae3e6c08e84cb33cc46050de33d962", "shape": [ 640 ] @@ -5090,7 +5124,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_1_self_attn_block_mlp_w_out.layout_header.i32.bin", - "sha256": "d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311", + "sha256": "d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64", "shape": [ 13 ] @@ -5099,19 +5133,19 @@ "bytes": 327680, "dtype": "uint8", "path": "decoder_1_self_attn_block_mlp_w_out.packed_weight.u8.bin", - "sha256": "b4ce6d83159561062230049e832bcca18287dd68f40d60397aa23e6045562bb2", + "sha256": "72b1bf0497c3af46aba032c7fc0225c6bab53539728f100131faf88e474d2424", "shape": [ 640, 512 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_1_self_attn_block_mlp_w_out.scale_values.f32.bin", - "sha256": "f8a8117d6d4b72628c9ff1d88b3e39800e567f1b816abd017d5531f0a270b26e", + "sha256": "5e915f656a0ab9ceeee2f2570b8be4ab2e190c0a7324d2fafe35fefa0d560d1a", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -5140,8 +5174,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -5161,7 +5195,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_1_self_attn_block_attn_w_q.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -5170,19 +5204,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_1_self_attn_block_attn_w_q.packed_weight.u8.bin", - "sha256": "d8a8b78ec75e0c333663940e9f8a74b44f7252d399895df9b27da2b4037d157b", + "sha256": "f62eead467ee63a5bb17213bd7744956aff491ec56204820143ac249b8a2dd36", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_1_self_attn_block_attn_w_q.scale_values.f32.bin", - "sha256": "332eb215c1ba8817f68d134462324f799236b88c7a050bb63ca6bd0d4c0d7753", + "sha256": "49d0d891621d97a6caa308fc53d029f8d89c6437a02014014fcf8198275bf19f", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -5211,8 +5245,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -5232,7 +5266,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_1_self_attn_block_attn_w_k.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -5241,19 +5275,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_1_self_attn_block_attn_w_k.packed_weight.u8.bin", - "sha256": "1ef7df6ce7c7cf79e720be6fddd8fb86dacdb6067ce088e981e5cd11c053d588", + "sha256": "6a36f2f65841904629925fbcfa84e126aae8f6e9c8abcd6f72a8ecd7f22ccbd7", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_1_self_attn_block_attn_w_k.scale_values.f32.bin", - "sha256": "2622bf47efeaa15ebdbb9f9eaa930af498683747212acaee09496955364fe787", + "sha256": "846e22bc9fcb3f7dc3993852f8d0fd8befab13ce081324a3abc1fdc56fea413d", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -5282,8 +5316,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -5303,7 +5337,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_1_self_attn_block_attn_w_v.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -5312,19 +5346,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_1_self_attn_block_attn_w_v.packed_weight.u8.bin", - "sha256": "1e55dd6de5285a9a895c2fdce7c57f32b37d0882fc31a2ec66c021bb4707886a", + "sha256": "306f969e226ee36dc20a66056ac851a449b7810160bee0166aec85710cfd51fc", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_1_self_attn_block_attn_w_v.scale_values.f32.bin", - "sha256": "e26e8e075bc0ae64848a79d680a9603d5a67b1319ad22e86613e95c382e37072", + "sha256": "3b2c300fcc22571bc36c6819fb412f49fce02d486d528946416d4e9f7f1b50b3", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -5353,8 +5387,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -5374,7 +5408,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_1_self_attn_block_attn_w_o.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -5383,19 +5417,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_1_self_attn_block_attn_w_o.packed_weight.u8.bin", - "sha256": "04ddf127b2c76986e4d0b3b9c36e1dc8bbf404b314b836958794ab3ba5e198a4", + "sha256": "17b81e31d14fd2377646cc5351be3ff7299c4025b1a65ee0bc0378d6d69ef4ba", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_1_self_attn_block_attn_w_o.scale_values.f32.bin", - "sha256": "7e63be7ea82af79ae38e684120c0ce922ee52f6b2cadbfb11fde9545f5c91a64", + "sha256": "63565a86aae052794d7e726aeb21584a9e39c52a2646ad0454ca7ae4cb1e575c", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -5424,8 +5458,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -5445,7 +5479,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_1_cross_block_cross_w_q.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -5454,19 +5488,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_1_cross_block_cross_w_q.packed_weight.u8.bin", - "sha256": "08be78ad3df0180ff637243fbc2ed3ca5e46c1b983ac09530e90f78e68b25379", + "sha256": "fbc0c47e3e99833cfd35d714791c5a20482d1db64a1dd2524f85cbd90a09d5ee", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_1_cross_block_cross_w_q.scale_values.f32.bin", - "sha256": "68798aa8d4fb447fd0540177b3c2b2d5056c3fb17b6262da551a3f821090e174", + "sha256": "22a56325517500e9aa144b6c45c43142c71f2f3785a0ca9f368ba92b33b6a10a", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -5495,8 +5529,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -5516,7 +5550,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_1_cross_block_cross_w_k.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -5525,19 +5559,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_1_cross_block_cross_w_k.packed_weight.u8.bin", - "sha256": "32252c6527d271f9dbbd442837e8e20d81077dfedc331500d2a6a58e3a2fe846", + "sha256": "92da8351ea49f3e5e5cac3fa2f3ec616b2ab1f2c2e0590f77c241eeb1edb3d4c", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_1_cross_block_cross_w_k.scale_values.f32.bin", - "sha256": "dd2d3910474cb1007ca2b9982543b5cbb71d8b001752a8838c35fd817d81e01b", + "sha256": "48d46cb7803af682dd8b3e6358e5a8829f3031e6051774bd606815dcd32022d7", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -5566,8 +5600,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -5587,7 +5621,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_1_cross_block_cross_w_v.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -5596,19 +5630,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_1_cross_block_cross_w_v.packed_weight.u8.bin", - "sha256": "c719a28098be92cc1ff0118fbe3b9bcb49d0f374d06ad4619198bb9f198b6519", + "sha256": "a3d150e880dc3d1e210143ac8f14431ccbb73e26e2182f2695eaa133b01a05de", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_1_cross_block_cross_w_v.scale_values.f32.bin", - "sha256": "54941c4e0b7edc9d9658ba42cfa5ce0652836fd57a274141bad95df2aafd52df", + "sha256": "4f426dc2b506ed8e8b0dfc6436e74d16ab7e2650a494946f7b92c66cb14b8753", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -5637,8 +5671,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -5658,7 +5692,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_1_cross_block_cross_w_o.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -5667,19 +5701,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_1_cross_block_cross_w_o.packed_weight.u8.bin", - "sha256": "10cffac7ec80a010b58e7ac2c1e528d083b61411bb7adcbc3ed46ac5bbaeeb1a", + "sha256": "d40ee2db7dbc602afd3cff0b7046e7571092feb5bd2acab9d751fe39b8f0393a", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_1_cross_block_cross_w_o.scale_values.f32.bin", - "sha256": "56e9ca708e8eab4f2439a734b9a8f20ce70ad57d3a113628e5607d0da9c4daed", + "sha256": "19b42d8f06375451e83c749579aabb9e152ed409def93381d8378f2b80ed4bda", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -5708,8 +5742,8 @@ 640, 4096, 640, - 2, - 1, + 0, + 4096, 1, 80, 1, @@ -5729,7 +5763,7 @@ "bytes": 16384, "dtype": "float32", "path": "decoder_1_cross_block_mlp_w_in.bias.f32.bin", - "sha256": "c12df42bd62e067ab734a5fb22311d1b8e0eadc2a3a8a0d3eacad5d4ba8edbaf", + "sha256": "353917073379bcde4b14d13263453d8e1ea0f9efc761a0f5a25c45ca30cdb7e4", "shape": [ 4096 ] @@ -5738,7 +5772,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_1_cross_block_mlp_w_in.layout_header.i32.bin", - "sha256": "b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f", + "sha256": "257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee", "shape": [ 13 ] @@ -5747,19 +5781,19 @@ "bytes": 655360, "dtype": "uint8", "path": "decoder_1_cross_block_mlp_w_in.packed_weight.u8.bin", - "sha256": "147f2cb807148dd9b9903e5aab63602ad272f7c7287d366858e25bb42dffc7a9", + "sha256": "7e6ce561de8adedea09bd594dbf820ff345a4b839d7176158594223c2f23c059", "shape": [ 4096, 160 ] }, "scale_values": { - "bytes": 16384, + "bytes": 4, "dtype": "float32", "path": "decoder_1_cross_block_mlp_w_in.scale_values.f32.bin", - "sha256": "0da7709e16e4c7ca38ffb1d9c3c815e2ddae7b5191c07c107c80646085238205", + "sha256": "5f5bc5b85387c70f0ff0a8a6236137247179cc750539ade22badb819f046a146", "shape": [ - 4096 + 1 ] }, "segment_offsets": { @@ -5788,8 +5822,8 @@ 2048, 640, 2048, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -5809,7 +5843,7 @@ "bytes": 2560, "dtype": "float32", "path": "decoder_1_cross_block_mlp_w_out.bias.f32.bin", - "sha256": "177029674ff23caa5d0f64d5d59ab8c30997300c226e9a1d0769d4198b3bcf9e", + "sha256": "5483e84f88674f52dc3f127ace0d01c79d4000fadbc51ebf1567deb2a5c3a617", "shape": [ 640 ] @@ -5818,7 +5852,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_1_cross_block_mlp_w_out.layout_header.i32.bin", - "sha256": "d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311", + "sha256": "d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64", "shape": [ 13 ] @@ -5827,19 +5861,19 @@ "bytes": 327680, "dtype": "uint8", "path": "decoder_1_cross_block_mlp_w_out.packed_weight.u8.bin", - "sha256": "9ec392d9ebad88b0211e4325a5526cadb95b11687d74c57e375de0f8a05072b2", + "sha256": "388cfedf59b1d4a8a3b3caa5db87ab91b4914351dd5bb0a88488dfcbb24bec4d", "shape": [ 640, 512 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_1_cross_block_mlp_w_out.scale_values.f32.bin", - "sha256": "cfbfb56d430de308a8d3ed35905aa51ea32f1cd3aa97942652b43a6add1c3ffd", + "sha256": "fac4e93a918e7832ac8e7d7bf7295ef64aa7694f874856f7a931bdee21d2f2c0", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -5868,8 +5902,8 @@ 640, 4096, 640, - 2, - 1, + 0, + 4096, 1, 80, 1, @@ -5889,7 +5923,7 @@ "bytes": 16384, "dtype": "float32", "path": "decoder_2_self_attn_block_mlp_w_in.bias.f32.bin", - "sha256": "927295ef6316c7afd4c4d8b8ed649f5b1411fd993e764fe08c896e631c4c9566", + "sha256": "6d2d6bbf68f226d911b8685478969e47862d6c77135f4e59b26a523ad5fc4ba8", "shape": [ 4096 ] @@ -5898,7 +5932,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_2_self_attn_block_mlp_w_in.layout_header.i32.bin", - "sha256": "b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f", + "sha256": "257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee", "shape": [ 13 ] @@ -5907,19 +5941,19 @@ "bytes": 655360, "dtype": "uint8", "path": "decoder_2_self_attn_block_mlp_w_in.packed_weight.u8.bin", - "sha256": "814fe93187b306522f2e2f44366604c6136ae8e88770e0baf172a0d9f47f8d6a", + "sha256": "7ad63162b55e63274c9df645f9cb8f876ebf3f69f3e79b3d89c9e5043f95969f", "shape": [ 4096, 160 ] }, "scale_values": { - "bytes": 16384, + "bytes": 4, "dtype": "float32", "path": "decoder_2_self_attn_block_mlp_w_in.scale_values.f32.bin", - "sha256": "57659daf026b8a58f21b043009c202151184cf022d11d005d1049f2a953b1719", + "sha256": "c4996743a1807ca846a22787da890efc8acdd1cb2fff49a0bda050d21f60bba2", "shape": [ - 4096 + 1 ] }, "segment_offsets": { @@ -5948,8 +5982,8 @@ 2048, 640, 2048, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -5969,7 +6003,7 @@ "bytes": 2560, "dtype": "float32", "path": "decoder_2_self_attn_block_mlp_w_out.bias.f32.bin", - "sha256": "7120d39a97140da8f52785ce16a5edf7d8584912e24a104d4f70b3b7a0b48ac2", + "sha256": "6630012f9386a03840589168e20887549e8047f3024c6559cd31468e9742490f", "shape": [ 640 ] @@ -5978,7 +6012,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_2_self_attn_block_mlp_w_out.layout_header.i32.bin", - "sha256": "d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311", + "sha256": "d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64", "shape": [ 13 ] @@ -5987,19 +6021,19 @@ "bytes": 327680, "dtype": "uint8", "path": "decoder_2_self_attn_block_mlp_w_out.packed_weight.u8.bin", - "sha256": "455d1361f4c8a97e9c2a7fa480b72762655e69fe447b77dbd6defe4637089c7a", + "sha256": "e84e1b4da3cbda5ffb8d639a5df25579890f33ec1b9e3533afbe5a8e64b6a9e2", "shape": [ 640, 512 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_2_self_attn_block_mlp_w_out.scale_values.f32.bin", - "sha256": "3278f0004d71004a3cf57ec8ecd600c7216678e032f239e03f712eff375070fe", + "sha256": "80bd2688eb5c2aa9e027729d0ad8228ce2900fd43452341b728ba098c5cecbc3", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -6028,8 +6062,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -6049,7 +6083,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_2_self_attn_block_attn_w_q.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -6058,19 +6092,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_2_self_attn_block_attn_w_q.packed_weight.u8.bin", - "sha256": "ee221a90adfb6b2827509d51b0ce244828bef9e3a9a262f1dace51ebdaeed413", + "sha256": "1d13a29954664d845f2cd98812e1fabee6a9e170375ba2bc45d23c52c54d6451", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_2_self_attn_block_attn_w_q.scale_values.f32.bin", - "sha256": "b8cf30ab162d8091bf588b85a36a288e2a4ae3b5d045ac7dfbed1a3db6b2161f", + "sha256": "47251edd0a08418643195800fecf0e458182321181477a15ab3010913b118b47", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -6099,8 +6133,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -6120,7 +6154,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_2_self_attn_block_attn_w_k.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -6129,19 +6163,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_2_self_attn_block_attn_w_k.packed_weight.u8.bin", - "sha256": "9c5a7b17bef87ae00765b3af4e06e5bc4baa47572a11ff28b4934974f2545872", + "sha256": "8b705241d97aca82476624e41fe3c140ae7d9235f5f3a5b5bb5e12d3b870924c", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_2_self_attn_block_attn_w_k.scale_values.f32.bin", - "sha256": "2eb0318a2e6b38b19caf9921aa01fcf72468fde21a11092c82e3b2e01e6bd1de", + "sha256": "05bba73e8e543abc881c7eaa776bc92dba6a2ae60242763a4c3dca027fc9bde0", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -6170,8 +6204,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -6191,7 +6225,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_2_self_attn_block_attn_w_v.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -6200,19 +6234,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_2_self_attn_block_attn_w_v.packed_weight.u8.bin", - "sha256": "dce50f6236c1def1d66af65586f306a99d60f81370f6dde81b665f352f15ad30", + "sha256": "063dedadd12036857efe5cf02e6c5f8a72f95955a10f2d505b53f2bf970e2009", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_2_self_attn_block_attn_w_v.scale_values.f32.bin", - "sha256": "d54124058055e97d7d177cee143b3d9af8c7ae40eb47052a706db0f21b1613a4", + "sha256": "03d502752c8a6f1756549584a3b7322b0e399d227df984a716fbe9c00489dfde", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -6241,8 +6275,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -6262,7 +6296,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_2_self_attn_block_attn_w_o.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -6271,19 +6305,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_2_self_attn_block_attn_w_o.packed_weight.u8.bin", - "sha256": "24304fd6258f3395e3d0a6de4b278540c71f7c33ed976cfa11f756d19195785b", + "sha256": "ca48a2627346da038dcddd11d166de40fb13bef35721e2f145dbbd02f6a812e1", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_2_self_attn_block_attn_w_o.scale_values.f32.bin", - "sha256": "32bc8118f0830b955cb008e5d7e216753b01852f8d26f64dfcd65e11c03192c5", + "sha256": "5f32c56c00f6599aa359c568271168fe2f9b703d3ae525fd6f5c90e9e8fd1101", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -6312,8 +6346,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -6333,7 +6367,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_2_cross_block_cross_w_q.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -6342,19 +6376,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_2_cross_block_cross_w_q.packed_weight.u8.bin", - "sha256": "b751950d3a076dc83467a2ec55298c5c9cbfd95dafa26ccbd43d28dec2573c70", + "sha256": "609d07290090c8ef4302591373e4908b287aaa745a422eea94ae9533d36e4233", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_2_cross_block_cross_w_q.scale_values.f32.bin", - "sha256": "37ed7b5a0e185bc2c19807c5853e907788af50c18a739852d1a6a0d35df1f430", + "sha256": "4d319778f3e29447ddf90f96449fca67c89b32a91d0c812fc37f6a90ccf19765", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -6383,8 +6417,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -6404,7 +6438,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_2_cross_block_cross_w_k.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -6413,19 +6447,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_2_cross_block_cross_w_k.packed_weight.u8.bin", - "sha256": "40bb2ca08a1c0b8dfb988b7e61a5b57aeedc55c20e9d0c35caab4aead2966449", + "sha256": "41e7cb11fe40d3dd71fd9261df9ba5919bfe1e13e81b34feab2ec682a2138d60", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_2_cross_block_cross_w_k.scale_values.f32.bin", - "sha256": "f07e412aef0bbb6ceafc7c6c99708ccfbc1524e6ce038191e2a4699a415ee870", + "sha256": "75a0324241350114abdff35b66cf04401eae67cceb15c6d94f3ebba0e357b07f", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -6454,8 +6488,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -6475,7 +6509,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_2_cross_block_cross_w_v.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -6484,19 +6518,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_2_cross_block_cross_w_v.packed_weight.u8.bin", - "sha256": "e084d111d06a9a0d76aa499e744722550d05eae2f1772f271811db88098eebac", + "sha256": "aa561b95c482d3e84dde5b670b1dccfe3f90f9f54cf5129447cf126ec6d0f0bd", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_2_cross_block_cross_w_v.scale_values.f32.bin", - "sha256": "155a3ede99090e94a080e9e4264f7a66af48394caac960c0b4ab7f29c1a87f25", + "sha256": "00710a7d695de7913cb4ec8b60882839a999e13a0ff2f7100d17112df55783f8", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -6525,8 +6559,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -6546,7 +6580,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_2_cross_block_cross_w_o.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -6555,19 +6589,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_2_cross_block_cross_w_o.packed_weight.u8.bin", - "sha256": "9f83084ce3d183412dc6709472bc0957af6133a40d678a1be8628213eafb0bf3", + "sha256": "6f4aac9b6307efe0813bb7133ff5d32baaea2aa869e1ce4585bc3253e465cbe9", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_2_cross_block_cross_w_o.scale_values.f32.bin", - "sha256": "a5b0e7833c17a2ff33c6f5eb2ed13740aff81b4507ac20975dfd68494df733bc", + "sha256": "054938dfb43c4787837f7db97a0a0a40e078b5ef09aeb61720d07085e262a8b9", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -6596,8 +6630,8 @@ 640, 4096, 640, - 2, - 1, + 0, + 4096, 1, 80, 1, @@ -6617,7 +6651,7 @@ "bytes": 16384, "dtype": "float32", "path": "decoder_2_cross_block_mlp_w_in.bias.f32.bin", - "sha256": "b544ea371ac2c1203d9d2a9c4e5de96cd267bf48e12ab9bc642489d2bfcd35b9", + "sha256": "c215a193ec6d3dacf0e99800d066f1a703f83a25e37cde9eb29cd3c5e98f1089", "shape": [ 4096 ] @@ -6626,7 +6660,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_2_cross_block_mlp_w_in.layout_header.i32.bin", - "sha256": "b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f", + "sha256": "257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee", "shape": [ 13 ] @@ -6635,19 +6669,19 @@ "bytes": 655360, "dtype": "uint8", "path": "decoder_2_cross_block_mlp_w_in.packed_weight.u8.bin", - "sha256": "f7dfd5b21df56ff51cfd9a989001a8bb84f20a744a16a52444ebc0360fc823e1", + "sha256": "c61cc24ec3441640300dd8819e57df7aee2859e12cf4921e8c927ca73336fd62", "shape": [ 4096, 160 ] }, "scale_values": { - "bytes": 16384, + "bytes": 4, "dtype": "float32", "path": "decoder_2_cross_block_mlp_w_in.scale_values.f32.bin", - "sha256": "024294b499c04b0f98736ba1cf71a1eaec1569908cc1b7e7e7f29a2e2288e70a", + "sha256": "9d8f7893980dca5cb4ea179cca82881fa0a975afc060c7bab202d84b7c26c0a0", "shape": [ - 4096 + 1 ] }, "segment_offsets": { @@ -6676,8 +6710,8 @@ 2048, 640, 2048, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -6697,7 +6731,7 @@ "bytes": 2560, "dtype": "float32", "path": "decoder_2_cross_block_mlp_w_out.bias.f32.bin", - "sha256": "7fe1fb1a00d470795ea8ca416523f2b87da5de8f8370035df1f12a9235e93ff9", + "sha256": "dddac929ae3b499247e4babaacaf9085b3b438edc00ecf20b769b87ba906b57d", "shape": [ 640 ] @@ -6706,7 +6740,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_2_cross_block_mlp_w_out.layout_header.i32.bin", - "sha256": "d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311", + "sha256": "d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64", "shape": [ 13 ] @@ -6715,19 +6749,19 @@ "bytes": 327680, "dtype": "uint8", "path": "decoder_2_cross_block_mlp_w_out.packed_weight.u8.bin", - "sha256": "84d5e83faf90d19110eeeb505a3036848cb5df357f5cb1bfdf69c4f0b6724bb6", + "sha256": "1a5a777485495e3453ac1efe529125b6e41c41e8c6c91b573891bae2ba664c5c", "shape": [ 640, 512 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_2_cross_block_mlp_w_out.scale_values.f32.bin", - "sha256": "6104b6247af8eeb849065c5f9a5c5cd437f68906eed1f755500db50589d9526f", + "sha256": "27a4aeebab0d1a35828177169e6f0f6b560ec3e41994baa94cc361357a52f8c0", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -6756,8 +6790,8 @@ 640, 4096, 640, - 2, - 1, + 0, + 4096, 1, 80, 1, @@ -6777,7 +6811,7 @@ "bytes": 16384, "dtype": "float32", "path": "decoder_3_self_attn_block_mlp_w_in.bias.f32.bin", - "sha256": "e7fa2b9db048551c93fa33e511d2a04b57b1b699e3c567d7c2013b9acf0fe5c2", + "sha256": "c6f37b9c581395a6b65481f3f77556e773d35842ede2ada8a98604a0b670f648", "shape": [ 4096 ] @@ -6786,7 +6820,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_3_self_attn_block_mlp_w_in.layout_header.i32.bin", - "sha256": "b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f", + "sha256": "257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee", "shape": [ 13 ] @@ -6795,19 +6829,19 @@ "bytes": 655360, "dtype": "uint8", "path": "decoder_3_self_attn_block_mlp_w_in.packed_weight.u8.bin", - "sha256": "ed0f958756cbd0c9eeb7c7ffab33a2de6bddf84d8d9482d7ca640dde9e1d6dbd", + "sha256": "52bff5aede2592e837d1cb076af815d440b21210b384f4cfaab5998155008af1", "shape": [ 4096, 160 ] }, "scale_values": { - "bytes": 16384, + "bytes": 4, "dtype": "float32", "path": "decoder_3_self_attn_block_mlp_w_in.scale_values.f32.bin", - "sha256": "f46afa8863a3d2d1734daa2ffefb013a0e16e3d996c118ac27f4d40713a4bfc3", + "sha256": "93bd0593493ea584d8263a622757475f44d54afc26c7e3c8ec3f2be2c6d65e56", "shape": [ - 4096 + 1 ] }, "segment_offsets": { @@ -6836,8 +6870,8 @@ 2048, 640, 2048, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -6857,7 +6891,7 @@ "bytes": 2560, "dtype": "float32", "path": "decoder_3_self_attn_block_mlp_w_out.bias.f32.bin", - "sha256": "9ef4e426cc678bdc2145f566ca1b752cb5126a1cee5ba1596670727c07102551", + "sha256": "f68950966a1c83f11814cb0f919e4bcef8566c7756be781c635f4042b80cdaa1", "shape": [ 640 ] @@ -6866,7 +6900,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_3_self_attn_block_mlp_w_out.layout_header.i32.bin", - "sha256": "d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311", + "sha256": "d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64", "shape": [ 13 ] @@ -6875,19 +6909,19 @@ "bytes": 327680, "dtype": "uint8", "path": "decoder_3_self_attn_block_mlp_w_out.packed_weight.u8.bin", - "sha256": "9add00e6c4822b6e42e9fe755d1e64de6581345ef650c5c3997ffcd5f28972db", + "sha256": "b833a34b79e1a6e90a9d5738edc0fd96058669853377212d0b6854f7a115e421", "shape": [ 640, 512 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_3_self_attn_block_mlp_w_out.scale_values.f32.bin", - "sha256": "bd1ba26139a6268ff548cf38f4254585c7cf9705fe8e98e3e466060f130251ae", + "sha256": "b660f513eabe0896e1eae74471316b75cf882f2b2ebc96b5d96dc48b117f9b68", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -6916,8 +6950,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -6937,7 +6971,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_3_self_attn_block_attn_w_q.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -6946,19 +6980,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_3_self_attn_block_attn_w_q.packed_weight.u8.bin", - "sha256": "5492c34a0278505bdc4e822ac0189fcca8b8d729015236b78ae9fd1ddd8784af", + "sha256": "8e60525417ba8a8826caa9835f1c73c530c8fa0e6c371461165809f230528161", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_3_self_attn_block_attn_w_q.scale_values.f32.bin", - "sha256": "80a3ad5ecce3023ac262c8972e0ae7c26da488b4efbc97d9d37a1e2f69e1ee30", + "sha256": "391c8ae81bf21ea2bcb1244cf9e9ad32d873c5c06b83a7fa75da229fde0fc411", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -6987,8 +7021,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -7008,7 +7042,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_3_self_attn_block_attn_w_k.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -7017,19 +7051,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_3_self_attn_block_attn_w_k.packed_weight.u8.bin", - "sha256": "8d0ab575d0b279fa4474d7b9f00647929f35685ab76cd3643c6433a46e8ed4de", + "sha256": "bace7d74ed3d9800393c16f73dc1d5edfc7e335e80b25862492756f04efeded2", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_3_self_attn_block_attn_w_k.scale_values.f32.bin", - "sha256": "71249b7aaf64de63e50bf8f046bd46570d7e95512373946b35ae69230d0f7ff6", + "sha256": "e4adf7959163fd8a9fbd35076cf99bf292ebd9fbf10db3aab0363f335a43ad80", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -7058,8 +7092,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -7079,7 +7113,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_3_self_attn_block_attn_w_v.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -7088,19 +7122,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_3_self_attn_block_attn_w_v.packed_weight.u8.bin", - "sha256": "1372ee94bdd78746b74f299fadfdb2542584b82e774f2897213c2f80c3d97b0a", + "sha256": "9282bfc70ccf622291e17fe2b9d1cee2812e73a66fa8f3aba79369541bff4841", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_3_self_attn_block_attn_w_v.scale_values.f32.bin", - "sha256": "39b616adaf778fb8765fa0d429aef8dcaca66563ec1a9bd7b101db0a3ec08ec6", + "sha256": "0564851be9a55276d9a60a6784b8674feaf663ac7fb071f027caa0f244c97071", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -7129,8 +7163,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -7150,7 +7184,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_3_self_attn_block_attn_w_o.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -7159,19 +7193,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_3_self_attn_block_attn_w_o.packed_weight.u8.bin", - "sha256": "baa3747fd7115ae1207676b6f0b7a24c143394c391efcde887fd7d04535c04e6", + "sha256": "b03dadf7d238896ba81b0778ad41d57be94c7dafa18a0eed2bcf083d333344ce", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_3_self_attn_block_attn_w_o.scale_values.f32.bin", - "sha256": "3bbcce09479da4f651ffaeaa820380ac3d06546fbf304dc3da300953c27c1d06", + "sha256": "f4187a6eefd5fdd64919509ea071d950e1747c9546ab9fa69d1caa234c175c81", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -7200,8 +7234,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -7221,7 +7255,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_3_cross_block_cross_w_q.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -7230,19 +7264,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_3_cross_block_cross_w_q.packed_weight.u8.bin", - "sha256": "c0c754c1c26de9b5f045269a549c4e78715f400d08a7d5ac2fc3a56f4d7ccb2e", + "sha256": "aee3c8de55436c54869b5e2275c9aece2a09a18464b1af113bb0ff8be47f750c", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_3_cross_block_cross_w_q.scale_values.f32.bin", - "sha256": "ed490ffbfaebd2130ba5a0bc7158305fec49152aabf872e11b438cd898ee23e9", + "sha256": "72fb79ed33a2c5752c4eb020474046f673be865b858e0d99c68914d10ac74535", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -7271,8 +7305,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -7292,7 +7326,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_3_cross_block_cross_w_k.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -7301,19 +7335,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_3_cross_block_cross_w_k.packed_weight.u8.bin", - "sha256": "4615506b9de6bf246a308393f0b47bc554a89d0e8a86859f06fb2e9cb5455557", + "sha256": "8105f4ef6ee1fd9bd42f78e0bd9c1f982a2cd3ad899e41826cf0e5bf5ad05007", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_3_cross_block_cross_w_k.scale_values.f32.bin", - "sha256": "98e293a04fcc5eb815240f8620bb42ab961696d25df43a0a1456549121fd1dda", + "sha256": "d75a9affb73da4e16bc9a90f247fd084576544b1e658dfdd636fc21eb34c0d2e", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -7342,8 +7376,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -7363,7 +7397,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_3_cross_block_cross_w_v.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -7372,19 +7406,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_3_cross_block_cross_w_v.packed_weight.u8.bin", - "sha256": "b66c7d11f1d89055a23b186d56e13c83f897838ce3d316fcab2857ac5f14de93", + "sha256": "61023e45baaf3879bf48cea3186a42852bec4ed5f042183803772d7463b70f00", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_3_cross_block_cross_w_v.scale_values.f32.bin", - "sha256": "61d4936b988663a9b7ff66eaffb0adbb160653377f09b42f03840186374cb111", + "sha256": "49dc0865e16ceee877c011c75f72eadbac2c734c3645fb2ebd9309e61bf6cdaf", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -7413,8 +7447,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -7434,7 +7468,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_3_cross_block_cross_w_o.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -7443,19 +7477,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_3_cross_block_cross_w_o.packed_weight.u8.bin", - "sha256": "33e89992827e578d2db3ef7bae29f9ebec8db7b4d5cbca90ac1567824f08d59b", + "sha256": "65549080d4995a379029003c546796c5ae914910b0ad1dc250691fd22a4f8417", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_3_cross_block_cross_w_o.scale_values.f32.bin", - "sha256": "f4e26d26400a65d13fd45f45e212c75884fcfceb7d370dd2fb958c66384b6825", + "sha256": "03938795c6cd8f22b6a622f93e244251d3b96dc3ab422a45604eb9c21c7f0d1e", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -7484,8 +7518,8 @@ 640, 4096, 640, - 2, - 1, + 0, + 4096, 1, 80, 1, @@ -7505,7 +7539,7 @@ "bytes": 16384, "dtype": "float32", "path": "decoder_3_cross_block_mlp_w_in.bias.f32.bin", - "sha256": "2a00b32a39221435a08beb98b5df5a7fef1a9ca45087f09c5dbca2d1ed6fd67f", + "sha256": "0d2cf34775e4122f3f773a7000d1e36329f250e8cba0c12154c1287f2ed640c0", "shape": [ 4096 ] @@ -7514,7 +7548,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_3_cross_block_mlp_w_in.layout_header.i32.bin", - "sha256": "b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f", + "sha256": "257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee", "shape": [ 13 ] @@ -7523,19 +7557,19 @@ "bytes": 655360, "dtype": "uint8", "path": "decoder_3_cross_block_mlp_w_in.packed_weight.u8.bin", - "sha256": "9d50b29b673d876e72d051ec8dac1a997b48b6d279c3c0686a15d6d1ca17cc20", + "sha256": "fdbf9731e6997780c963cc037cd8ea297db91d72b9cd75b33e8ea651aee7dc61", "shape": [ 4096, 160 ] }, "scale_values": { - "bytes": 16384, + "bytes": 4, "dtype": "float32", "path": "decoder_3_cross_block_mlp_w_in.scale_values.f32.bin", - "sha256": "b2aaf1731428de4dea2b2c94d92be1605a5914147820df01b613bfb938ae2641", + "sha256": "5253e4d1f1d0333ecec00ba3ad5da6c09855b22c2c47d64d3a032c36027b8c13", "shape": [ - 4096 + 1 ] }, "segment_offsets": { @@ -7564,8 +7598,8 @@ 2048, 640, 2048, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -7585,7 +7619,7 @@ "bytes": 2560, "dtype": "float32", "path": "decoder_3_cross_block_mlp_w_out.bias.f32.bin", - "sha256": "404606177696da2165733d6f8af43fec6228499443d8c463d17d4888578e8af9", + "sha256": "acc4d0806de36f892e17b7bc0ddccfe679788b28fd05347071aab28246142515", "shape": [ 640 ] @@ -7594,7 +7628,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_3_cross_block_mlp_w_out.layout_header.i32.bin", - "sha256": "d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311", + "sha256": "d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64", "shape": [ 13 ] @@ -7603,19 +7637,19 @@ "bytes": 327680, "dtype": "uint8", "path": "decoder_3_cross_block_mlp_w_out.packed_weight.u8.bin", - "sha256": "9edee44179fb49efef2f42b3ec5016df1afed8835787720d1191cd4da4ebdcf8", + "sha256": "93bb7dc6c659ed2b3787d09cb0a3b196e5d0fd2965bc269a1bee8dc280d6e6fc", "shape": [ 640, 512 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_3_cross_block_mlp_w_out.scale_values.f32.bin", - "sha256": "d16e05105856f137094f69b422ed1c30b9f8eb90bc8a9ff205e9493b0bbe73dc", + "sha256": "3b1d604246796ef8e2677732742d85621d7586140406b32fedaca157cc6350c2", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -7644,8 +7678,8 @@ 640, 4096, 640, - 2, - 1, + 0, + 4096, 1, 80, 1, @@ -7665,7 +7699,7 @@ "bytes": 16384, "dtype": "float32", "path": "decoder_4_self_attn_block_mlp_w_in.bias.f32.bin", - "sha256": "8b0d86432bf25ca0274aea9be29ee3dc8867e07e7cc6fd60373ca8829f0e929b", + "sha256": "5548b21f0b218bc045dd0c1ec40ece79f43064b71830d6b91a8e075f07fb9339", "shape": [ 4096 ] @@ -7674,7 +7708,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_4_self_attn_block_mlp_w_in.layout_header.i32.bin", - "sha256": "b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f", + "sha256": "257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee", "shape": [ 13 ] @@ -7683,19 +7717,19 @@ "bytes": 655360, "dtype": "uint8", "path": "decoder_4_self_attn_block_mlp_w_in.packed_weight.u8.bin", - "sha256": "39887530c7398e4ba170dba80b6425c9aed66e6acd35b5364c872f1821263579", + "sha256": "4020ba9b97b8a890b0dee73ef2f31ca49dbb4ad2d80e8498c71e2753c1663876", "shape": [ 4096, 160 ] }, "scale_values": { - "bytes": 16384, + "bytes": 4, "dtype": "float32", "path": "decoder_4_self_attn_block_mlp_w_in.scale_values.f32.bin", - "sha256": "c5e055cd129678d616322fb600fc710f0453ea70c6befb41f6f666dcd898da94", + "sha256": "41f956e7d96fa10803a64f37e87d3c384ce48e2efcd7785468eac768fd0085ae", "shape": [ - 4096 + 1 ] }, "segment_offsets": { @@ -7724,8 +7758,8 @@ 2048, 640, 2048, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -7745,7 +7779,7 @@ "bytes": 2560, "dtype": "float32", "path": "decoder_4_self_attn_block_mlp_w_out.bias.f32.bin", - "sha256": "ee2de22f8151f93d09c7d09fc3b523ae0b62a9602b5f06332e3f1b24c56115ba", + "sha256": "060cbb3793b9dc02486280df05b2b834e626637b4dfe7838d4b4f159b84f01c0", "shape": [ 640 ] @@ -7754,7 +7788,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_4_self_attn_block_mlp_w_out.layout_header.i32.bin", - "sha256": "d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311", + "sha256": "d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64", "shape": [ 13 ] @@ -7763,19 +7797,19 @@ "bytes": 327680, "dtype": "uint8", "path": "decoder_4_self_attn_block_mlp_w_out.packed_weight.u8.bin", - "sha256": "701990d2141da402c51f03194222e1d7260ab6011e694ff0e61fb4eb93ebd6b6", + "sha256": "38cdbedb4b51266fbb4422fc7a9fa03ce073ef2234d51f2f46396bf2ff99520a", "shape": [ 640, 512 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_4_self_attn_block_mlp_w_out.scale_values.f32.bin", - "sha256": "8a52afa4fe59d22780b74a03679c037bb852d1136808c38c6f65f1211b4a4911", + "sha256": "1f5504e7f4c1c0adf3cb757f77667111ddec260d2f98562ef5f07124f3bfc39a", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -7804,8 +7838,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -7825,7 +7859,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_4_self_attn_block_attn_w_q.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -7834,19 +7868,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_4_self_attn_block_attn_w_q.packed_weight.u8.bin", - "sha256": "6fddf10d6206a2fda4146574c6e35aafde38ce57ac9d944e8776e45b38640d02", + "sha256": "705018b26a50bfd8f8db2543ba218eee04659da2bd2f670029751cd846a4da00", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_4_self_attn_block_attn_w_q.scale_values.f32.bin", - "sha256": "365d59cde5cde0d76ae1056f9b6f9a7062ea4298ad7846db9ecd6e30fd63a19b", + "sha256": "ae7f62151c5884804a9eaddd9fa36f5b4c457d092aba8d78d8154b8eb1ad188d", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -7875,8 +7909,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -7896,7 +7930,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_4_self_attn_block_attn_w_k.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -7905,19 +7939,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_4_self_attn_block_attn_w_k.packed_weight.u8.bin", - "sha256": "2c5749cb807ddcc419546bc4eaf90e08426c81bafc0d08f988bb5a0864058884", + "sha256": "91ba999d8060f5a3081c848f64e8b14a7dec437ed842962ede41d18dd1c210aa", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_4_self_attn_block_attn_w_k.scale_values.f32.bin", - "sha256": "54dd0e2297946d77d8c8b5f3dcd7f3c116d90a5b7ed4fe5404e7de7bb749922d", + "sha256": "4f2f42b8ce0a5ff7a5211a44e6f071a777df886ba6cfa87b941a3c3ea57048de", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -7946,8 +7980,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -7967,7 +8001,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_4_self_attn_block_attn_w_v.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -7976,19 +8010,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_4_self_attn_block_attn_w_v.packed_weight.u8.bin", - "sha256": "5f0b5bee4f6752aa8804110605497b301456328c3fd8f92f800e5aceb2b58ac8", + "sha256": "b1682806f928cfe008f5ad7cf8a62ff8f31312ee864685836db9469f6e536fe5", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_4_self_attn_block_attn_w_v.scale_values.f32.bin", - "sha256": "34685d4ff05fb0c35a230447f75d913faeae21a103c8bc3731d1f628dc27ceb1", + "sha256": "471259b8b6c1958cdcaf03f3d889ed4269ac077a514397511f7a6826a5dba552", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -8017,8 +8051,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -8038,7 +8072,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_4_self_attn_block_attn_w_o.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -8047,19 +8081,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_4_self_attn_block_attn_w_o.packed_weight.u8.bin", - "sha256": "de4d3f36dddec5d85edbd1eea9336de4b84d347253de4e759c539e25e9007040", + "sha256": "a4c4f008decffa7ee25bc837ee608ff3020d840dab661d75ddf158e59ea0c1d8", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_4_self_attn_block_attn_w_o.scale_values.f32.bin", - "sha256": "dc479e96cc27e74edb0cfb05c035f6c6f135e64e52b61a26b3515a5aa7cd196a", + "sha256": "703dc8c734ebcc942733bb5d6e2dde21b48df4829a2c2bf654947ed4dd2e7cd4", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -8088,8 +8122,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -8109,7 +8143,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_4_cross_block_cross_w_q.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -8118,19 +8152,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_4_cross_block_cross_w_q.packed_weight.u8.bin", - "sha256": "ce1a77e60422d32c2f46934a766d426bf038344f2e7ea0c5b0dd7c5c7617aeff", + "sha256": "4616bfc7b4ee6594a074bf87afe0b3de1aee8ec0467067e68a90cdb55e4b0893", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_4_cross_block_cross_w_q.scale_values.f32.bin", - "sha256": "bf0662981cf96dd423851b49062f15376ae4902938808056f0d0fbfa35c0e0ad", + "sha256": "3a2e3d1ba069ade3259a5f99d9b0bf9224de6ece09c62beea206b23d7b9b1fb7", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -8159,8 +8193,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -8180,7 +8214,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_4_cross_block_cross_w_k.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -8189,19 +8223,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_4_cross_block_cross_w_k.packed_weight.u8.bin", - "sha256": "4c3875278ad62825f74504bb5c9cfbdb3c707607219de5000eb33d8d4bd93523", + "sha256": "31524643e06ef3020f262caef697c874b75e408d9c2f11b749d8a9b1b7e9b843", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_4_cross_block_cross_w_k.scale_values.f32.bin", - "sha256": "33667cf828fc4b0223668f61a4d19df07fc65412645b23d9608986fae8f8299d", + "sha256": "3f488d0b11a99264984291678bcb679df9190a00385e4b73e46790555073e217", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -8230,8 +8264,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -8251,7 +8285,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_4_cross_block_cross_w_v.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -8260,19 +8294,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_4_cross_block_cross_w_v.packed_weight.u8.bin", - "sha256": "691ee8830941075f454a8bc70497aab974a86e2faa7ec004d05be1b460d26faa", + "sha256": "bf7de31509287e5e5fd652f3e15f78ab4fdaa35dc31007011ef6d13d4a78ec3a", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_4_cross_block_cross_w_v.scale_values.f32.bin", - "sha256": "756df02cb043bf56b2b6a6c2b49f91415b744a8d9dc48398081f26d671bff9ff", + "sha256": "529c7e330c43ee50eead8d189012170c1ec46fb4e33389e614e40ff8f6c36d85", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -8301,8 +8335,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -8322,7 +8356,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_4_cross_block_cross_w_o.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -8331,19 +8365,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_4_cross_block_cross_w_o.packed_weight.u8.bin", - "sha256": "d779dce49505f8f4796061d9c48b8952f8a2744ef886baaa84762cd1e22e110d", + "sha256": "0a03bbbb018fbbb45c3d7587aa68c507ebf5befaf82759c55cf15878a1b17065", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_4_cross_block_cross_w_o.scale_values.f32.bin", - "sha256": "f45aba4aa8b028ac833a520a51e9152f61408b8d644cc8be7263db6920f07784", + "sha256": "1da26be124ad087738062d6177cc05257be78c2d2a956abd0bb3b161e7d8b0db", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -8372,8 +8406,8 @@ 640, 4096, 640, - 2, - 1, + 0, + 4096, 1, 80, 1, @@ -8393,7 +8427,7 @@ "bytes": 16384, "dtype": "float32", "path": "decoder_4_cross_block_mlp_w_in.bias.f32.bin", - "sha256": "99c2ddd2ef7cfe781327186d74be769db274772bd22ec56ef8dd2e4d93f2ce20", + "sha256": "1a42e9a422a18d500744229a74c9f4e5d29cbe5f5c29e827ab99eadeb9a4316c", "shape": [ 4096 ] @@ -8402,7 +8436,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_4_cross_block_mlp_w_in.layout_header.i32.bin", - "sha256": "b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f", + "sha256": "257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee", "shape": [ 13 ] @@ -8411,19 +8445,19 @@ "bytes": 655360, "dtype": "uint8", "path": "decoder_4_cross_block_mlp_w_in.packed_weight.u8.bin", - "sha256": "64bdf33d4af3bb01b77e21ce7b6878be698ade724636a6fa6ebc7af697eb9bc4", + "sha256": "e5dd270c2a9e69b837cfb0bab4b43c57989bf83ce6c15f7b9cca27a32fedacb7", "shape": [ 4096, 160 ] }, "scale_values": { - "bytes": 16384, + "bytes": 4, "dtype": "float32", "path": "decoder_4_cross_block_mlp_w_in.scale_values.f32.bin", - "sha256": "c9ea4cc4f63e9e30e08037ec2717237a21ee76d7382aa25d823713ed9afbe238", + "sha256": "cbd99c99c9af6c3112db595ea710801a67c3b231c89ed68ccd1e211660bf58de", "shape": [ - 4096 + 1 ] }, "segment_offsets": { @@ -8452,8 +8486,8 @@ 2048, 640, 2048, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -8473,7 +8507,7 @@ "bytes": 2560, "dtype": "float32", "path": "decoder_4_cross_block_mlp_w_out.bias.f32.bin", - "sha256": "7698c41fa41db9e931e0866ba25316c02da7112774a03e79089e70b405fd1856", + "sha256": "9e5fd75ca05f0cff37991d42a5a50a5de092708bdeb663d2a9d074fb6e2603a2", "shape": [ 640 ] @@ -8482,7 +8516,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_4_cross_block_mlp_w_out.layout_header.i32.bin", - "sha256": "d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311", + "sha256": "d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64", "shape": [ 13 ] @@ -8491,19 +8525,19 @@ "bytes": 327680, "dtype": "uint8", "path": "decoder_4_cross_block_mlp_w_out.packed_weight.u8.bin", - "sha256": "2a9e4d3d7740d4bc4d0bf9c8268544f28dae5c5cfa56120c3566c26c7391afd5", + "sha256": "7ce2e9e96e8008fe75b033c97729382205c3985799b6cd344012cc9273796ff6", "shape": [ 640, 512 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_4_cross_block_mlp_w_out.scale_values.f32.bin", - "sha256": "a07ee9fa0e3d703f194c12d30d48c1ed2966c42260413329a52a5bd06d31f82a", + "sha256": "328ff35703d7b9a3c5c531efc74c40d7e5f0bc5d6590f58974752967e569406e", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -8532,8 +8566,8 @@ 640, 4096, 640, - 2, - 1, + 0, + 4096, 1, 80, 1, @@ -8553,7 +8587,7 @@ "bytes": 16384, "dtype": "float32", "path": "decoder_5_self_attn_block_mlp_w_in.bias.f32.bin", - "sha256": "cc2627ea7e1f20f1f0bd4dd22c40a0676b93389dced88ec93f076c04d2977e75", + "sha256": "9c011e158b3eedac0e294b2ded17297c587a790c50b6dc0c5bfdd795fce6e431", "shape": [ 4096 ] @@ -8562,7 +8596,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_5_self_attn_block_mlp_w_in.layout_header.i32.bin", - "sha256": "b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f", + "sha256": "257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee", "shape": [ 13 ] @@ -8571,19 +8605,19 @@ "bytes": 655360, "dtype": "uint8", "path": "decoder_5_self_attn_block_mlp_w_in.packed_weight.u8.bin", - "sha256": "9f332a3be87df814615bd0c5076861d892480726ae149562978734a69cd89eb5", + "sha256": "324d5b0baa2bd143549f6b876e4847bfb14df87e6f4c5f2ed8c38f80f7a1bd60", "shape": [ 4096, 160 ] }, "scale_values": { - "bytes": 16384, + "bytes": 4, "dtype": "float32", "path": "decoder_5_self_attn_block_mlp_w_in.scale_values.f32.bin", - "sha256": "269e730c81acfe542eefe0157297240e1f909ca448d555e6aebf0ec2d22e6d55", + "sha256": "ff71e0cb9e0cbd714cfe53000e4c6693e243b3a528dbea9bbde5a9791fb76cd1", "shape": [ - 4096 + 1 ] }, "segment_offsets": { @@ -8612,8 +8646,8 @@ 2048, 640, 2048, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -8633,7 +8667,7 @@ "bytes": 2560, "dtype": "float32", "path": "decoder_5_self_attn_block_mlp_w_out.bias.f32.bin", - "sha256": "9ce93bf1e56f8944815bc3feeacd388fae0f0d65a826beacd5f4dbe652ae0a17", + "sha256": "934ef203f64706d6f3980935dca28accf5fff8c05d3595244f878091ea0ef1a7", "shape": [ 640 ] @@ -8642,7 +8676,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_5_self_attn_block_mlp_w_out.layout_header.i32.bin", - "sha256": "d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311", + "sha256": "d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64", "shape": [ 13 ] @@ -8651,19 +8685,19 @@ "bytes": 327680, "dtype": "uint8", "path": "decoder_5_self_attn_block_mlp_w_out.packed_weight.u8.bin", - "sha256": "c1ee787f01158b228e633fab235a13aed3ab1ef306930d66f5374f1f3639495f", + "sha256": "d11e2e2807b998655988a6994f40b12f1147bfcb09e1d212a6ceddf86a8b9d70", "shape": [ 640, 512 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_5_self_attn_block_mlp_w_out.scale_values.f32.bin", - "sha256": "87656f15f2449f30ce1a19ea2b83134086f71bed5d05923029fae7baff63275c", + "sha256": "e57b7781511191ee1c6211206145643aecfeed5fd10e2be8ba5d4a79fda582e9", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -8692,8 +8726,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -8713,7 +8747,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_5_self_attn_block_attn_w_q.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -8722,19 +8756,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_5_self_attn_block_attn_w_q.packed_weight.u8.bin", - "sha256": "0823d35b6cfc35c11009c68fe3583c980e3a51b6d473194d11e2f378b508ba33", + "sha256": "820c8b917dedfa7b94fd8168a696940b32885dc20a6fb0423506e773efc2284a", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_5_self_attn_block_attn_w_q.scale_values.f32.bin", - "sha256": "811c5513fb65eb2a4aa83753c9c60b7201c7e47eae248153fbfce96540ec12f8", + "sha256": "de28049a482ce86e09aae54b4037fb595650cd33e7947abb29e9528019872250", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -8763,8 +8797,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -8784,7 +8818,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_5_self_attn_block_attn_w_k.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -8793,19 +8827,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_5_self_attn_block_attn_w_k.packed_weight.u8.bin", - "sha256": "c3ef72c857d0463d779455d464cceca3556a5308c6b5cefa85b4e5d2b7036ba4", + "sha256": "43946fb26e7fa4fe90888545317f91ce7dd7dc80339271914038eb7a8a6534e9", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_5_self_attn_block_attn_w_k.scale_values.f32.bin", - "sha256": "1696afaa802b7df890080fab4b2148db46aac451061ca56d67971f7eb15ed9ed", + "sha256": "a8a5b74730bc699c1734b0f115c2665213f0b9b22f30a3345001554da141996e", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -8834,8 +8868,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -8855,7 +8889,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_5_self_attn_block_attn_w_v.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -8864,19 +8898,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_5_self_attn_block_attn_w_v.packed_weight.u8.bin", - "sha256": "71df327a240d414357000156bc4ce569ccdf02203a8f6c2997c3e994a424fbd3", + "sha256": "e9cd3f10c5ca5524ad7916a8bac067ef9898cf9f53a9b6a6ae15c190a0d71a4e", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_5_self_attn_block_attn_w_v.scale_values.f32.bin", - "sha256": "7fd4d47d4be6dc31c2add3f32ba8b2d2dd25cd2ba65a472dfc88404dab1e60d8", + "sha256": "dc59d8f713e7157ea3221dba1f622b898c0245dd4d0d34327d920006e3ba09f1", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -8905,8 +8939,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -8926,7 +8960,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_5_self_attn_block_attn_w_o.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -8935,19 +8969,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_5_self_attn_block_attn_w_o.packed_weight.u8.bin", - "sha256": "67b98a2983d6281d356e2bdee9c55c93ab827279c23438508d8af4f37b78929e", + "sha256": "c76e70f5dd66747c201dd205fbbe05881d7f49346e32c6156fc708d13c8c3340", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_5_self_attn_block_attn_w_o.scale_values.f32.bin", - "sha256": "41f4fe30c5f18229023424b02acfbc5aeca6a33406c3d4102ffe57f437b392cd", + "sha256": "959180edcc34bc6313cc1b8af6ec69ff1b5ec9e43a6ad6f0e0af7cd39f2a9cb9", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -8976,8 +9010,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -8997,7 +9031,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_5_cross_block_cross_w_q.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -9006,19 +9040,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_5_cross_block_cross_w_q.packed_weight.u8.bin", - "sha256": "c5dcd16f7f9ab08348414c39abab26115e8ff33e36fb7348a2c62b5c413de00b", + "sha256": "7b975bb3aa36faa59373a89a11ce871ea2286260d6285d40814516b9e1993580", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_5_cross_block_cross_w_q.scale_values.f32.bin", - "sha256": "22cbf5b9acb47633ab9cb6ad7de2b7165f0c15ee371d274a23b0d2f0203afa34", + "sha256": "7f0e41304cbfd55072ad386c5da6970259e29bd09325c00ea3da3bc9704ee52c", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -9047,8 +9081,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -9068,7 +9102,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_5_cross_block_cross_w_k.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -9077,19 +9111,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_5_cross_block_cross_w_k.packed_weight.u8.bin", - "sha256": "ff57e7d933af1dbeb6ff7608257112e011ef1bb58c1e4550834b4374f300ad80", + "sha256": "8342ee2946efbf8358c5ac1084462bf9bc205d8ba3a861a8e9fc0b0ca27727a4", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_5_cross_block_cross_w_k.scale_values.f32.bin", - "sha256": "eeb881a1d106ad608534ca10ca458ae0abf9e2cac941bfdafe380686025013d6", + "sha256": "57a1556ffa48c12c84a3673f0909b63d09dcc23e63ad61b108718ce87697a20a", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -9118,8 +9152,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -9139,7 +9173,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_5_cross_block_cross_w_v.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -9148,19 +9182,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_5_cross_block_cross_w_v.packed_weight.u8.bin", - "sha256": "e9784b965d55e41ea7f9a3214632e6408dfcbe021404905bdf787e579660e2a4", + "sha256": "9f9eb5e98403ef2ba3df649c0670bf1e3bd7e456b7ec9fe6ff6ae63a546d100d", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_5_cross_block_cross_w_v.scale_values.f32.bin", - "sha256": "071b5dab363a13142def242b7cb5bd90039646344b14258cdb807ad2cfd50624", + "sha256": "5a2b1b58e2a938ffac91f830ffe24d862d2d1a3f641796a9cccc73871cd89498", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -9189,8 +9223,8 @@ 640, 640, 640, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -9210,7 +9244,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_5_cross_block_cross_w_o.layout_header.i32.bin", - "sha256": "9156b654d9210718214387c2d1cd21b1b546da5f8f81f734bf2519021c4a6ed4", + "sha256": "849939dc8cf07dc8f4b572bf8e2ab75f666f997582a34ef824f17169f84b6914", "shape": [ 13 ] @@ -9219,19 +9253,19 @@ "bytes": 102400, "dtype": "uint8", "path": "decoder_5_cross_block_cross_w_o.packed_weight.u8.bin", - "sha256": "e267d346a55332f235a935d667179f493c829e90d09a7b2e667452667832d14c", + "sha256": "dd328e224e0ced6111c0f60827a3d64cbabd59082f1f45483271d0f73a287aca", "shape": [ 640, 160 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_5_cross_block_cross_w_o.scale_values.f32.bin", - "sha256": "f319c054716b93dce66b0908086acf3c1a07ba5ebc55d15a45a7d54c92050513", + "sha256": "50c843aedcc684ba0a5d6541d3d7a431502dcea46994c8374269112970727833", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -9260,8 +9294,8 @@ 640, 4096, 640, - 2, - 1, + 0, + 4096, 1, 80, 1, @@ -9281,7 +9315,7 @@ "bytes": 16384, "dtype": "float32", "path": "decoder_5_cross_block_mlp_w_in.bias.f32.bin", - "sha256": "7adbf3be58996a63513302c855e26b50ca5e09f71be5e024856660126d8d18e1", + "sha256": "ebfe00189def83024b2f04f083dc0ca6effe5dcdd379970582cdce4b7461786e", "shape": [ 4096 ] @@ -9290,7 +9324,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_5_cross_block_mlp_w_in.layout_header.i32.bin", - "sha256": "b3fb30db028c0e0ededdf2405137b889d77da2cbce717652e77bb13fe4de7b0f", + "sha256": "257ba1249ac6ab2f370f675bdb2b3b2d961f2ab08ee011510a04fc7eca2b15ee", "shape": [ 13 ] @@ -9299,19 +9333,19 @@ "bytes": 655360, "dtype": "uint8", "path": "decoder_5_cross_block_mlp_w_in.packed_weight.u8.bin", - "sha256": "4f0b7415b003709bdaadbdad025c40e417708947587b419b4608c51bc954d81d", + "sha256": "25d3fdd07478a9fbd57e57775db0038bfa039b15fe323bb8373e5d3d76bf8ec7", "shape": [ 4096, 160 ] }, "scale_values": { - "bytes": 16384, + "bytes": 4, "dtype": "float32", "path": "decoder_5_cross_block_mlp_w_in.scale_values.f32.bin", - "sha256": "b6adeb822555f5aa9a5c40afdc2c2189444f687d97124f9d32b4f4f498796b52", + "sha256": "cd530857b08c9fe35b573115654d2b23ab3c2a93b39f9238ca420b40f42ae569", "shape": [ - 4096 + 1 ] }, "segment_offsets": { @@ -9340,8 +9374,8 @@ 2048, 640, 2048, - 2, - 1, + 0, + 640, 1, 80, 1, @@ -9361,7 +9395,7 @@ "bytes": 2560, "dtype": "float32", "path": "decoder_5_cross_block_mlp_w_out.bias.f32.bin", - "sha256": "a01b04fdfe3e63d331eea3a1fdd245621e69e3dee97d9eb4d0df7a4a747c7a1a", + "sha256": "9d635dbdf18da4b8934862a8e5105e8056b0dea0d0883c365964d94b1270a236", "shape": [ 640 ] @@ -9370,7 +9404,7 @@ "bytes": 52, "dtype": "int32", "path": "decoder_5_cross_block_mlp_w_out.layout_header.i32.bin", - "sha256": "d10f8dfecaca42257835bba6832b19c805498af240be2c1e4e6340a2776e7311", + "sha256": "d10c345b4c76db0edf40b416615c6b81649d8a54bc55de921b84f3d75b7c7d64", "shape": [ 13 ] @@ -9379,19 +9413,19 @@ "bytes": 327680, "dtype": "uint8", "path": "decoder_5_cross_block_mlp_w_out.packed_weight.u8.bin", - "sha256": "fb30694fbf89d6dfa78ccc0bd167365c8264a8aa6988dd4c5cddc872c73e243f", + "sha256": "177d7c4bad958d79e536ba68d66d66d0971834ed869f1e5ca49040db4610d56a", "shape": [ 640, 512 ] }, "scale_values": { - "bytes": 2560, + "bytes": 4, "dtype": "float32", "path": "decoder_5_cross_block_mlp_w_out.scale_values.f32.bin", - "sha256": "7027d96b72a45c6e83a44a76fc6743262877e6783c965d7b8ba82aaee34fd446", + "sha256": "78c2bae093d73a281404ef5e8e0c1c441f2a4a97e560ef68a4af4c73aee4cc04", "shape": [ - 640 + 1 ] }, "segment_offsets": { @@ -9416,19 +9450,19 @@ 1, 16, 32, - 8229, + 8207, 640, - 8240, + 8208, 640, - 2, - 1, + 0, + 8207, 1, 80, 1, 0 ], "name": "lm_head", - "out_features": 8229, + "out_features": 8207, "tensors": { "act_scale": { "bytes": 4, @@ -9441,35 +9475,35 @@ "bytes": 52, "dtype": "int32", "path": "lm_head.layout_header.i32.bin", - "sha256": "6dbbe0f59e755d0a0ffc98bab96786a9a069a30db90c05011423767b48beca7a", + "sha256": "1fdaf7af8cb18524a77d5a37d5265646c10d5d352a2eb3fc83b596fa4fb3a2c5", "shape": [ 13 ] }, "packed_weight": { - "bytes": 1318400, + "bytes": 1313280, "dtype": "uint8", "path": "lm_head.packed_weight.u8.bin", - "sha256": "2dda08a6b9c24d9bb30cd0e09147bd5720f6cdd8633b022afaa8a9b1c2946bb4", + "sha256": "411e858d2476c7d4e8bce21dfdc58a7e4936a9fca18d822cd4f5cf2e2e8386f0", "shape": [ - 8240, + 8208, 160 ] }, "scale_values": { - "bytes": 32916, + "bytes": 4, "dtype": "float32", "path": "lm_head.scale_values.f32.bin", - "sha256": "26b1d8c807dad42bfd8cc1c0b084cb3292b232e0882285c72043c118a9368bca", + "sha256": "f82895d1075ca96401b23568c539ac8944e0264adf62d8567dce2611e02587df", "shape": [ - 8229 + 1 ] }, "segment_offsets": { "bytes": 8, "dtype": "int32", "path": "lm_head.segment_offsets.i32.bin", - "sha256": "6a39e27878282be9d58d21a86fb95117d07c03a87a9919d24a86cbabe1597463", + "sha256": "77df73d01a55e70e6fe3ae9d1e3e1608045918c29f804021326ebd3337636ed0", "shape": [ 2 ] @@ -9480,24 +9514,28 @@ "max_seq_len": 1024, "model": { "activation": "silu", + "agent_policy_heads": false, "attention_bias": false, - "attn_dropout": 0.0, + "attn_dropout": 0.05, "attn_impl": "eager", "d_ff": 2048, "d_model": 640, "dtype": "bfloat16", - "encoder_position_embeddings": false, + "encoder_position_embeddings": true, "head_dim": null, "kv_cache_paged": true, "masking": "build_causal_mask", "max_position_embeddings": 4096, + "mlp_dropout": 0.03, "n_heads": 10, "n_kv_heads": null, "n_layers": 6, "norm": "layer", "pad_token_id": 0, "positional": "apply_rotary", + "resid_dropout": 0.03, "residual": "prenorm", + "retrieval_head_dim": null, "rms_norm_eps": 1e-06, "rope_attention_scaling": null, "rope_scaling_factor": null, @@ -9509,7 +9547,7 @@ "sliding_window": null, "softmax": "safe_softmax", "version": 1, - "vocab_size": 8229 + "vocab_size": 8207 }, "runtime": { "fallback": "wasm", @@ -9535,7 +9573,8 @@ "kind": "agentkernel-bpe", "pad_token_id": 0, "path": "tokenizer/tokenizer.json", + "source_kind": "agentkernel_bytelevel_bpe_v1", "unk_token_id": 3, - "vocab_size": 8229 + "vocab_size": 8207 } } \ No newline at end of file diff --git a/modelcard.json b/modelcard.json index 27184014e534ec7da6ede68855e587b19fa1ae40..5a6a3c8d796254ab4f19407a0acee139ab4da8fc 100644 --- a/modelcard.json +++ b/modelcard.json @@ -1,4 +1,5 @@ { + "dense_tensor_count": 43, "format": "browser-bitnet", "layer_count": 109, "manifest": "manifest.json", @@ -10,5 +11,16 @@ "webgpu_js": "runtime/bitnet_webgpu.js", "wgsl": "runtime/bitnet_linear.wgsl" }, - "sha256": "cfa2962f89ec51a601bf87f0534aa0597aa84cec1f4891e6dd0743e40f005188" + "sha256": "263c6eeb35f349a7ced003571cb694c73a4c7be6d9da5ae4997b3d73aa09f660", + "tokenizer": { + "bos_token_id": 1, + "config_path": "tokenizer/tokenizer_config.json", + "eos_token_id": 2, + "kind": "agentkernel-bpe", + "pad_token_id": 0, + "path": "tokenizer/tokenizer.json", + "source_kind": "agentkernel_bytelevel_bpe_v1", + "unk_token_id": 3, + "vocab_size": 8207 + } } \ No newline at end of file diff --git a/runtime/bitnet_webgpu.js b/runtime/bitnet_webgpu.js index 12a83581a62318f3f2cb4b87274939316b36f94f..23a17fb3ed8603094e40e61ca0ba8e363d4acc3e 100644 --- a/runtime/bitnet_webgpu.js +++ b/runtime/bitnet_webgpu.js @@ -203,6 +203,7 @@ export class BitNetLinearWebGPU { size: PARAM_BUFFER_BYTES, usage: GPUBufferUsage.UNIFORM | GPUBufferUsage.COPY_DST, }); + this.runCache = new Map(); } static async fromManifestLayer(device, manifest, layer, manifestUrl, options = {}) { @@ -264,9 +265,34 @@ export class BitNetLinearWebGPU { } const outputLength = rows * this.layout.logicalOut; - const inputBuffer = createStorageBuffer(this.device, x); - const outputBuffer = createOutputBuffer(this.device, outputLength * Float32Array.BYTES_PER_ELEMENT); - const readbackBuffer = createReadbackBuffer(this.device, outputLength * Float32Array.BYTES_PER_ELEMENT); + const inputBytes = x.byteLength; + const outputBytes = outputLength * Float32Array.BYTES_PER_ELEMENT; + const cacheKey = `${rows}:${this.layout.logicalIn}:${this.layout.logicalOut}`; + let cache = this.runCache.get(cacheKey); + if (!cache) { + const inputBuffer = this.device.createBuffer({ + size: align4(inputBytes), + usage: GPUBufferUsage.STORAGE | GPUBufferUsage.COPY_DST, + }); + const outputBuffer = createOutputBuffer(this.device, outputBytes); + const readbackBuffer = createReadbackBuffer(this.device, outputBytes); + const bindGroup = this.device.createBindGroup({ + layout: this.pipeline.getBindGroupLayout(0), + entries: [ + { binding: 0, resource: { buffer: inputBuffer } }, + { binding: 1, resource: { buffer: this.packedWeightBuffer } }, + { binding: 2, resource: { buffer: this.scaleBuffer } }, + { binding: 3, resource: { buffer: this.segmentOffsetBuffer } }, + { binding: 4, resource: { buffer: this.biasBuffer } }, + { binding: 5, resource: { buffer: this.inputScaleBuffer } }, + { binding: 6, resource: { buffer: outputBuffer } }, + { binding: 7, resource: { buffer: this.paramsBuffer } }, + ], + }); + cache = { inputBuffer, outputBuffer, readbackBuffer, bindGroup }; + this.runCache.set(cacheKey, cache); + } + this.device.queue.writeBuffer(cache.inputBuffer, 0, x.buffer, x.byteOffset, x.byteLength); const params = new Uint32Array([ rows, @@ -284,33 +310,19 @@ export class BitNetLinearWebGPU { ]); this.device.queue.writeBuffer(this.paramsBuffer, 0, params); - const bindGroup = this.device.createBindGroup({ - layout: this.pipeline.getBindGroupLayout(0), - entries: [ - { binding: 0, resource: { buffer: inputBuffer } }, - { binding: 1, resource: { buffer: this.packedWeightBuffer } }, - { binding: 2, resource: { buffer: this.scaleBuffer } }, - { binding: 3, resource: { buffer: this.segmentOffsetBuffer } }, - { binding: 4, resource: { buffer: this.biasBuffer } }, - { binding: 5, resource: { buffer: this.inputScaleBuffer } }, - { binding: 6, resource: { buffer: outputBuffer } }, - { binding: 7, resource: { buffer: this.paramsBuffer } }, - ], - }); - const encoder = this.device.createCommandEncoder(); const pass = encoder.beginComputePass(); pass.setPipeline(this.pipeline); - pass.setBindGroup(0, bindGroup); + pass.setBindGroup(0, cache.bindGroup); pass.dispatchWorkgroups(Math.ceil(this.layout.logicalOut / 8), Math.ceil(rows / 8), 1); pass.end(); - encoder.copyBufferToBuffer(outputBuffer, 0, readbackBuffer, 0, outputLength * Float32Array.BYTES_PER_ELEMENT); + encoder.copyBufferToBuffer(cache.outputBuffer, 0, cache.readbackBuffer, 0, outputBytes); this.device.queue.submit([encoder.finish()]); - await readbackBuffer.mapAsync(GPUMapMode.READ); - const mapped = readbackBuffer.getMappedRange(); + await cache.readbackBuffer.mapAsync(GPUMapMode.READ); + const mapped = cache.readbackBuffer.getMappedRange(); const result = new Float32Array(mapped.slice(0)); - readbackBuffer.unmap(); + cache.readbackBuffer.unmap(); return result; } } diff --git a/runtime/encdec_runtime.js b/runtime/encdec_runtime.js index 98f29ac31d6c4064eeae76040d669ca965077b74..db195d880bdd3fd17bb54f04403c697f5a41c2e2 100644 --- a/runtime/encdec_runtime.js +++ b/runtime/encdec_runtime.js @@ -84,6 +84,30 @@ function addInPlace(dst, src) { return dst; } +function l2Normalize(values) { + let norm = 0; + for (let i = 0; i < values.length; i += 1) norm += values[i] * values[i]; + norm = Math.sqrt(Math.max(norm, 1e-12)); + const out = new Float32Array(values.length); + for (let i = 0; i < values.length; i += 1) out[i] = values[i] / norm; + return out; +} + +function meanPoolRows(x, rows, cols, attentionMask = null) { + const out = new Float32Array(cols); + let denom = 0; + for (let r = 0; r < rows; r += 1) { + const weight = attentionMask ? Number(attentionMask[r] || 0) : 1; + if (weight <= 0) continue; + denom += weight; + const rowOffset = r * cols; + for (let c = 0; c < cols; c += 1) out[c] += x[rowOffset + c] * weight; + } + denom = Math.max(denom, 1); + for (let c = 0; c < cols; c += 1) out[c] /= denom; + return out; +} + function appendRows(existing, next) { if (!existing || existing.length === 0) return next.slice(); const out = new Float32Array(existing.length + next.length); @@ -92,6 +116,27 @@ function appendRows(existing, next) { return out; } +function appendCachedRows(cache, field, next) { + const source = next instanceof Float32Array ? next : new Float32Array(next); + const lengthField = `${field}Length`; + const capacityField = `${field}Capacity`; + const currentLength = Number(cache[lengthField] || 0); + const required = currentLength + source.length; + let storage = cache[field]; + if (!storage || storage.length < required) { + let capacity = Math.max(required, Number(cache[capacityField] || 0), source.length * 8); + while (capacity < required) capacity *= 2; + const grown = new Float32Array(capacity); + if (storage && currentLength > 0) grown.set(storage.subarray(0, currentLength), 0); + storage = grown; + cache[field] = storage; + cache[capacityField] = capacity; + } + storage.set(source, currentLength); + cache[lengthField] = required; + return storage.subarray(0, required); +} + function layerNorm(x, rows, cols, weight, bias, eps = 1e-5) { const out = new Float32Array(x.length); for (let r = 0; r < rows; r += 1) { @@ -275,7 +320,7 @@ function mergeHeads(heads, seqLen, nHeads, headDim) { return out; } -function attention(q, k, v, qLen, kvLen, nHeads, headDim, causal) { +function attention(q, k, v, qLen, kvLen, nHeads, headDim, causal, pastLen = 0) { const qh = splitHeads(q, qLen, nHeads, headDim); const kh = splitHeads(k, kvLen, nHeads, headDim); const vh = splitHeads(v, kvLen, nHeads, headDim); @@ -287,7 +332,7 @@ function attention(q, k, v, qLen, kvLen, nHeads, headDim, causal) { const scores = new Float32Array(kvLen); let maxScore = -Infinity; for (let j = 0; j < kvLen; j += 1) { - let score = causal && j > i ? -1e30 : 0; + let score = causal && j > pastLen + i ? -1e30 : 0; if (score > -1e20) { for (let d = 0; d < headDim; d += 1) { score += qh[h][i * headDim + d] * kh[h][j * headDim + d] * scale; @@ -497,13 +542,30 @@ export class BitNetEncoderDecoderWebGPU { if (this.decoderRotary) { applyRotaryMergedInPlace(q, kNew, 1, nHeads, headDim, this.decoderRotaryBase, position); } - layerCache.selfK = appendRows(layerCache.selfK, kNew); - layerCache.selfV = appendRows(layerCache.selfV, vNew); + layerCache.selfK = appendCachedRows(layerCache, "selfK", kNew); + layerCache.selfV = appendCachedRows(layerCache, "selfV", vNew); layerCache.selfLen = Number(layerCache.selfLen || 0) + 1; const merged = attention(q, layerCache.selfK, layerCache.selfV, 1, layerCache.selfLen, nHeads, headDim, false); return this.linear(`${prefix}.w_o`).run(merged, 1); } + async selfAttentionIncrementalSpan(prefix, x, seqLen, layerCache) { + const nHeads = this.graph.n_heads; + const headDim = this.graph.head_dim; + const q = await this.linear(`${prefix}.w_q`).run(x, seqLen); + const kNew = await this.linear(`${prefix}.w_k`).run(x, seqLen); + const vNew = await this.linear(`${prefix}.w_v`).run(x, seqLen); + const position = Number(layerCache.selfLen || 0); + if (this.decoderRotary) { + applyRotaryMergedInPlace(q, kNew, seqLen, nHeads, headDim, this.decoderRotaryBase, position); + } + layerCache.selfK = appendCachedRows(layerCache, "selfK", kNew); + layerCache.selfV = appendCachedRows(layerCache, "selfV", vNew); + layerCache.selfLen = Number(layerCache.selfLen || 0) + seqLen; + const merged = attention(q, layerCache.selfK, layerCache.selfV, seqLen, layerCache.selfLen, nHeads, headDim, true, position); + return this.linear(`${prefix}.w_o`).run(merged, seqLen); + } + async crossAttentionCached(prefix, x, memory, memoryLen, layerCache) { const nHeads = this.graph.n_heads; const headDim = this.graph.head_dim; @@ -516,6 +578,18 @@ export class BitNetEncoderDecoderWebGPU { return this.linear(`${prefix}.w_o`).run(merged, 1); } + async crossAttentionCachedSpan(prefix, x, seqLen, memory, memoryLen, layerCache) { + const nHeads = this.graph.n_heads; + const headDim = this.graph.head_dim; + const q = await this.linear(`${prefix}.w_q`).run(x, seqLen); + if (!layerCache.crossK || !layerCache.crossV) { + layerCache.crossK = await this.linear(`${prefix}.w_k`).run(memory, memoryLen); + layerCache.crossV = await this.linear(`${prefix}.w_v`).run(memory, memoryLen); + } + const merged = attention(q, layerCache.crossK, layerCache.crossV, seqLen, memoryLen, nHeads, headDim, false); + return this.linear(`${prefix}.w_o`).run(merged, seqLen); + } + async mlp(prefix, x, seqLen) { const wIn = this.linear(`${prefix}.w_in`); const wOut = this.linear(`${prefix}.w_out`); @@ -566,6 +640,23 @@ export class BitNetEncoderDecoderWebGPU { return addInPlace(x, await this.mlp(`decoder.${index}.cross_block.mlp`, n, 1)); } + async decoderLayerIncrementalSpan(index, x, seqLen, memory, memoryLen, layerCache) { + let n = this.norm(`decoder.${index}.self_attn_block.n1`, x, seqLen); + x = addInPlace( + x.slice(), + await this.selfAttentionIncrementalSpan(`decoder.${index}.self_attn_block.attn`, n, seqLen, layerCache), + ); + n = this.norm(`decoder.${index}.self_attn_block.n2`, x, seqLen); + x = addInPlace(x, await this.mlp(`decoder.${index}.self_attn_block.mlp`, n, seqLen)); + n = this.norm(`decoder.${index}.cross_block.n1`, x, seqLen); + x = addInPlace( + x.slice(), + await this.crossAttentionCachedSpan(`decoder.${index}.cross_block.cross`, n, seqLen, memory, memoryLen, layerCache), + ); + n = this.norm(`decoder.${index}.cross_block.n2`, x, seqLen); + return addInPlace(x, await this.mlp(`decoder.${index}.cross_block.mlp`, n, seqLen)); + } + async encode(encInputIds) { let x = embed(encInputIds, this.tensor("enc_embed.weight"), this.graph.d_model); if (this.graph.encoder_position_embeddings) { @@ -583,6 +674,32 @@ export class BitNetEncoderDecoderWebGPU { ); } + async retrievalEmbedding(encInputIds, options = {}) { + const retrieval = this.graph.retrieval || {}; + const headName = options.kind === "doc" ? retrieval.doc_head : retrieval.query_head; + if (!headName) { + throw new Error("model manifest does not expose retrieval heads"); + } + const inputIds = Array.from(encInputIds || [], Number); + const memory = await this.encode(inputIds); + const pooled = meanPoolRows( + memory, + inputIds.length, + this.graph.d_model, + options.attentionMask || inputIds.map((id) => (id === 0 ? 0 : 1)), + ); + const projected = await this.linear(headName).run(pooled, 1); + return l2Normalize(projected); + } + + async retrievalQueryEmbedding(encInputIds, options = {}) { + return this.retrievalEmbedding(encInputIds, { ...options, kind: "query" }); + } + + async retrievalDocEmbedding(encInputIds, options = {}) { + return this.retrievalEmbedding(encInputIds, { ...options, kind: "doc" }); + } + async decode(decInputIds, memory, memoryLen) { let x = embed(decInputIds, this.tensor("dec_embed.weight"), this.graph.d_model); for (let i = 0; i < this.graph.n_layers; i += 1) { @@ -688,6 +805,45 @@ export class BitNetEncoderDecoderGenerationSession { ); return this.runtime.linear("lm_head").run(hidden, 1); } + + cloneState() { + return this.layerCaches.map((cache) => { + const cloned = { ...cache }; + if (cache.selfK) { + cloned.selfK = cache.selfK.slice(); + cloned.selfKLength = cloned.selfK.length; + cloned.selfKCapacity = cloned.selfK.length; + } + if (cache.selfV) { + cloned.selfV = cache.selfV.slice(); + cloned.selfVLength = cloned.selfV.length; + cloned.selfVCapacity = cloned.selfV.length; + } + return cloned; + }); + } + + restoreState(layerCaches) { + this.layerCaches = layerCaches; + } + + async nextMany(tokenIds) { + const ids = Array.from(tokenIds || [], Number).filter((id) => Number.isFinite(id)); + if (!ids.length) return new Float32Array(0); + await this.prepare(); + let x = embed(ids, this.runtime.tensor("dec_embed.weight"), this.runtime.graph.d_model); + for (let i = 0; i < this.runtime.graph.n_layers; i += 1) { + x = await this.runtime.decoderLayerIncrementalSpan(i, x, ids.length, this.memory, this.memoryLen, this.layerCaches[i]); + } + const hidden = layerNorm( + x, + ids.length, + this.runtime.graph.d_model, + this.runtime.tensor("dec_norm.weight"), + this.runtime.dense["dec_norm.bias"]?.data, + ); + return this.runtime.linear("lm_head").run(hidden, ids.length); + } } export class BitNetEncoderDecoderWASM extends BitNetEncoderDecoderWebGPU { diff --git a/tokenizer/tokenizer.json b/tokenizer/tokenizer.json index 6497f1aaab7604a7d28815195a93246a08f5a652..914bce84245f429ad5ba10ef8ab496eb62714da7 100644 --- a/tokenizer/tokenizer.json +++ b/tokenizer/tokenizer.json @@ -173,204 +173,6 @@ "rstrip": false, "normalized": false, "special": true - }, - { - "id": 8207, - "content": "", - "single_word": false, - "lstrip": false, - "rstrip": false, - "normalized": false, - "special": true - }, - { - "id": 8208, - "content": "", - "single_word": false, - "lstrip": false, - "rstrip": false, - "normalized": false, - "special": true - }, - { - "id": 8209, - "content": "", - "single_word": false, - "lstrip": false, - "rstrip": false, - "normalized": false, - "special": true - }, - { - "id": 8210, - "content": "", - "single_word": false, - "lstrip": false, - "rstrip": false, - "normalized": false, - "special": true - }, - { - "id": 8211, - "content": "", - "single_word": false, - "lstrip": false, - "rstrip": false, - "normalized": false, - "special": true - }, - { - "id": 8212, - "content": "", - "single_word": false, - "lstrip": false, - "rstrip": false, - "normalized": false, - "special": true - }, - { - "id": 8213, - "content": "", - "single_word": false, - "lstrip": false, - "rstrip": false, - "normalized": false, - "special": true - }, - { - "id": 8214, - "content": "", - "single_word": false, - "lstrip": false, - "rstrip": false, - "normalized": false, - "special": true - }, - { - "id": 8215, - "content": "", - "single_word": false, - "lstrip": false, - "rstrip": false, - "normalized": false, - "special": true - }, - { - "id": 8216, - "content": "", - "single_word": false, - "lstrip": false, - "rstrip": false, - "normalized": false, - "special": true - }, - { - "id": 8217, - "content": "", - "single_word": false, - "lstrip": false, - "rstrip": false, - "normalized": false, - "special": true - }, - { - "id": 8218, - "content": "", - "single_word": false, - "lstrip": false, - "rstrip": false, - "normalized": false, - "special": true - }, - { - "id": 8219, - "content": "", - "single_word": false, - "lstrip": false, - "rstrip": false, - "normalized": false, - "special": true - }, - { - "id": 8220, - "content": "", - "single_word": false, - "lstrip": false, - "rstrip": false, - "normalized": false, - "special": true - }, - { - "id": 8221, - "content": "", - "single_word": false, - "lstrip": false, - "rstrip": false, - "normalized": false, - "special": true - }, - { - "id": 8222, - "content": "", - "single_word": false, - "lstrip": false, - "rstrip": false, - "normalized": false, - "special": true - }, - { - "id": 8223, - "content": "", - "single_word": false, - "lstrip": false, - "rstrip": false, - "normalized": false, - "special": true - }, - { - "id": 8224, - "content": "", - "single_word": false, - "lstrip": false, - "rstrip": false, - "normalized": false, - "special": true - }, - { - "id": 8225, - "content": "", - "single_word": false, - "lstrip": false, - "rstrip": false, - "normalized": false, - "special": true - }, - { - "id": 8226, - "content": "", - "single_word": false, - "lstrip": false, - "rstrip": false, - "normalized": false, - "special": true - }, - { - "id": 8227, - "content": "", - "single_word": false, - "lstrip": false, - "rstrip": false, - "normalized": false, - "special": true - }, - { - "id": 8228, - "content": "", - "single_word": false, - "lstrip": false, - "rstrip": false, - "normalized": false, - "special": true } ], "normalizer": null, diff --git a/tokenizer/tokenizer_config.json b/tokenizer/tokenizer_config.json index 0ceaca008823b35d151ed95ad972c40dd5fe16b6..5d1c3eef5339dea03894c5e932e6780760fa8929 100644 --- a/tokenizer/tokenizer_config.json +++ b/tokenizer/tokenizer_config.json @@ -4,38 +4,16 @@ "", "", "", - "", - "", - "", "", - "", "", - "", - "", - "", - "", - "", - "", "", - "", - "", - "", "", "", - "", "", "", - "", - "", - "", - "", - "", - "", "", "", "", - "", - "", "" ], "bos_token": "", @@ -47,5 +25,5 @@ "tokenizer_kind": "agentkernel_bytelevel_bpe_v1", "unk_token": "", "unk_token_id": 3, - "vocab_size": 8229 + "vocab_size": 8207 } \ No newline at end of file