{ "metadata": { "total_size": 6317342724 }, "weight_map": { "lm_head.weight": "model-00002-of-00002.safetensors", "transformer.ln_f.weight": "model-00002-of-00002.safetensors", "transformer.lowcoder.layers.blocks.0.attention.null_k": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.0.attention.null_v": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.0.attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.0.attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.0.attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.0.attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.0.attention_norm.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.0.feed_forward.w1.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.0.feed_forward.w2.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.0.feed_forward.w3.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.0.ffn_norm.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.1.attention.null_k": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.1.attention.null_v": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.1.attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.1.attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.1.attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.1.attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.1.attention_norm.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.1.feed_forward.w1.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.1.feed_forward.w2.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.1.feed_forward.w3.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.1.ffn_norm.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.10.attention.null_k": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.10.attention.null_v": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.10.attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.10.attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.10.attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.10.attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.10.attention_norm.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.10.feed_forward.w1.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.10.feed_forward.w2.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.10.feed_forward.w3.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.10.ffn_norm.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.2.attention.null_k": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.2.attention.null_v": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.2.attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.2.attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.2.attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.2.attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.2.attention_norm.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.2.feed_forward.w1.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.2.feed_forward.w2.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.2.feed_forward.w3.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.2.ffn_norm.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.3.attention.null_k": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.3.attention.null_v": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.3.attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.3.attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.3.attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.3.attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.3.attention_norm.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.3.feed_forward.w1.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.3.feed_forward.w2.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.3.feed_forward.w3.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.3.ffn_norm.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.4.attention.null_k": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.4.attention.null_v": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.4.attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.4.attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.4.attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.4.attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.4.attention_norm.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.4.feed_forward.w1.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.4.feed_forward.w2.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.4.feed_forward.w3.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.4.ffn_norm.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.5.attention.null_k": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.5.attention.null_v": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.5.attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.5.attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.5.attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.5.attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.5.attention_norm.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.5.feed_forward.w1.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.5.feed_forward.w2.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.5.feed_forward.w3.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.5.ffn_norm.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.6.attention.null_k": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.6.attention.null_v": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.6.attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.6.attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.6.attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.6.attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.6.attention_norm.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.6.feed_forward.w1.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.6.feed_forward.w2.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.6.feed_forward.w3.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.6.ffn_norm.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.7.attention.null_k": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.7.attention.null_v": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.7.attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.7.attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.7.attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.7.attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.7.attention_norm.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.7.feed_forward.w1.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.7.feed_forward.w2.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.7.feed_forward.w3.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.7.ffn_norm.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.8.attention.null_k": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.8.attention.null_v": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.8.attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.8.attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.8.attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.8.attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.8.attention_norm.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.8.feed_forward.w1.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.8.feed_forward.w2.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.8.feed_forward.w3.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.8.ffn_norm.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.9.attention.null_k": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.9.attention.null_v": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.9.attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.9.attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.9.attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.9.attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.9.attention_norm.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.9.feed_forward.w1.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.9.feed_forward.w2.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.9.feed_forward.w3.weight": "model-00001-of-00002.safetensors", "transformer.lowcoder.layers.blocks.9.ffn_norm.weight": "model-00001-of-00002.safetensors", "transformer.retriever.key_projection.bias": "model-00001-of-00002.safetensors", "transformer.retriever.key_projection.weight": "model-00001-of-00002.safetensors", "transformer.retriever.pre_key_norm.weight": "model-00001-of-00002.safetensors", "transformer.retriever.pre_query_norm.weight": "model-00001-of-00002.safetensors", "transformer.retriever.preret_bi_attention_norm.weight": "model-00001-of-00002.safetensors", "transformer.retriever.preret_bidir_attention.null_k": "model-00001-of-00002.safetensors", "transformer.retriever.preret_bidir_attention.null_v": "model-00001-of-00002.safetensors", "transformer.retriever.preret_bidir_attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.retriever.preret_bidir_attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.retriever.preret_bidir_attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.retriever.preret_bidir_attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.retriever.query_projection.bias": "model-00001-of-00002.safetensors", "transformer.retriever.query_projection.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.0.attention.null_k": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.0.attention.null_v": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.0.attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.0.attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.0.attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.0.attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.0.attention_norm.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.0.cca.cross_attention.null_k": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.0.cca.cross_attention.null_v": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.0.cca.cross_attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.0.cca.cross_attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.0.cca.cross_attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.0.cca.cross_attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.0.cca_norm.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.0.feed_forward.w1.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.0.feed_forward.w2.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.0.feed_forward.w3.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.0.ffn_norm.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.1.attention.null_k": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.1.attention.null_v": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.1.attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.1.attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.1.attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.1.attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.1.attention_norm.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.1.cca.cross_attention.null_k": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.1.cca.cross_attention.null_v": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.1.cca.cross_attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.1.cca.cross_attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.1.cca.cross_attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.1.cca.cross_attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.1.cca_norm.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.1.feed_forward.w1.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.1.feed_forward.w2.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.1.feed_forward.w3.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.1.ffn_norm.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.10.attention.null_k": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.10.attention.null_v": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.10.attention.wk.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.10.attention.wo.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.10.attention.wq.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.10.attention.wv.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.10.attention_norm.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.10.cca.cross_attention.null_k": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.10.cca.cross_attention.null_v": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.10.cca.cross_attention.wk.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.10.cca.cross_attention.wo.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.10.cca.cross_attention.wq.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.10.cca.cross_attention.wv.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.10.cca_norm.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.10.feed_forward.w1.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.10.feed_forward.w2.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.10.feed_forward.w3.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.10.ffn_norm.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.2.attention.null_k": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.2.attention.null_v": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.2.attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.2.attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.2.attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.2.attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.2.attention_norm.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.2.cca.cross_attention.null_k": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.2.cca.cross_attention.null_v": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.2.cca.cross_attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.2.cca.cross_attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.2.cca.cross_attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.2.cca.cross_attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.2.cca_norm.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.2.feed_forward.w1.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.2.feed_forward.w2.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.2.feed_forward.w3.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.2.ffn_norm.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.3.attention.null_k": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.3.attention.null_v": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.3.attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.3.attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.3.attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.3.attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.3.attention_norm.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.3.cca.cross_attention.null_k": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.3.cca.cross_attention.null_v": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.3.cca.cross_attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.3.cca.cross_attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.3.cca.cross_attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.3.cca.cross_attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.3.cca_norm.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.3.feed_forward.w1.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.3.feed_forward.w2.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.3.feed_forward.w3.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.3.ffn_norm.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.4.attention.null_k": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.4.attention.null_v": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.4.attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.4.attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.4.attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.4.attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.4.attention_norm.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.4.cca.cross_attention.null_k": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.4.cca.cross_attention.null_v": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.4.cca.cross_attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.4.cca.cross_attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.4.cca.cross_attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.4.cca.cross_attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.4.cca_norm.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.4.feed_forward.w1.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.4.feed_forward.w2.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.4.feed_forward.w3.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.4.ffn_norm.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.5.attention.null_k": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.5.attention.null_v": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.5.attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.5.attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.5.attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.5.attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.5.attention_norm.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.5.cca.cross_attention.null_k": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.5.cca.cross_attention.null_v": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.5.cca.cross_attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.5.cca.cross_attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.5.cca.cross_attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.5.cca.cross_attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.5.cca_norm.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.5.feed_forward.w1.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.5.feed_forward.w2.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.5.feed_forward.w3.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.5.ffn_norm.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.6.attention.null_k": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.6.attention.null_v": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.6.attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.6.attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.6.attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.6.attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.6.attention_norm.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.6.cca.cross_attention.null_k": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.6.cca.cross_attention.null_v": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.6.cca.cross_attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.6.cca.cross_attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.6.cca.cross_attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.6.cca.cross_attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.6.cca_norm.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.6.feed_forward.w1.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.6.feed_forward.w2.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.6.feed_forward.w3.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.6.ffn_norm.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.7.attention.null_k": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.7.attention.null_v": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.7.attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.7.attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.7.attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.7.attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.7.attention_norm.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.7.cca.cross_attention.null_k": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.7.cca.cross_attention.null_v": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.7.cca.cross_attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.7.cca.cross_attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.7.cca.cross_attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.7.cca.cross_attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.7.cca_norm.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.layers.blocks.7.feed_forward.w1.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.7.feed_forward.w2.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.7.feed_forward.w3.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.7.ffn_norm.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.8.attention.null_k": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.8.attention.null_v": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.8.attention.wk.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.8.attention.wo.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.8.attention.wq.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.8.attention.wv.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.8.attention_norm.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.8.cca.cross_attention.null_k": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.8.cca.cross_attention.null_v": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.8.cca.cross_attention.wk.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.8.cca.cross_attention.wo.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.8.cca.cross_attention.wq.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.8.cca.cross_attention.wv.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.8.cca_norm.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.8.feed_forward.w1.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.8.feed_forward.w2.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.8.feed_forward.w3.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.8.ffn_norm.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.9.attention.null_k": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.9.attention.null_v": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.9.attention.wk.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.9.attention.wo.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.9.attention.wq.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.9.attention.wv.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.9.attention_norm.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.9.cca.cross_attention.null_k": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.9.cca.cross_attention.null_v": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.9.cca.cross_attention.wk.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.9.cca.cross_attention.wo.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.9.cca.cross_attention.wq.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.9.cca.cross_attention.wv.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.9.cca_norm.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.9.feed_forward.w1.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.9.feed_forward.w2.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.9.feed_forward.w3.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.layers.blocks.9.ffn_norm.weight": "model-00002-of-00002.safetensors", "transformer.upcoder.neighbor_augmentor.postret_bi_attention_norm.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.neighbor_augmentor.postret_bidir_attention.null_k": "model-00001-of-00002.safetensors", "transformer.upcoder.neighbor_augmentor.postret_bidir_attention.null_v": "model-00001-of-00002.safetensors", "transformer.upcoder.neighbor_augmentor.postret_bidir_attention.wk.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.neighbor_augmentor.postret_bidir_attention.wo.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.neighbor_augmentor.postret_bidir_attention.wq.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.neighbor_augmentor.postret_bidir_attention.wv.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.neighbor_augmentor.query_nei_xattention.null_k": "model-00001-of-00002.safetensors", "transformer.upcoder.neighbor_augmentor.query_nei_xattention.null_v": "model-00001-of-00002.safetensors", "transformer.upcoder.neighbor_augmentor.query_nei_xattention.wk.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.neighbor_augmentor.query_nei_xattention.wo.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.neighbor_augmentor.query_nei_xattention.wq.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.neighbor_augmentor.query_nei_xattention.wv.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.neighbor_augmentor.query_nei_xattention_knorm.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.neighbor_augmentor.query_nei_xattention_qnorm.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.neighbor_cross_augmentor.cross_neig_causal_att.null_k": "model-00001-of-00002.safetensors", "transformer.upcoder.neighbor_cross_augmentor.cross_neig_causal_att.null_v": "model-00001-of-00002.safetensors", "transformer.upcoder.neighbor_cross_augmentor.cross_neig_causal_att.wk.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.neighbor_cross_augmentor.cross_neig_causal_att.wo.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.neighbor_cross_augmentor.cross_neig_causal_att.wq.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.neighbor_cross_augmentor.cross_neig_causal_att.wv.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.neighbor_cross_augmentor.weight.bias": "model-00001-of-00002.safetensors", "transformer.upcoder.neighbor_cross_augmentor.weight.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.neighbor_cross_augmentor.xnei_bias": "model-00001-of-00002.safetensors", "transformer.upcoder.neighbor_cross_augmentor.xnei_norm1.weight": "model-00001-of-00002.safetensors", "transformer.upcoder.neighbor_cross_augmentor.xnei_norm2.weight": "model-00001-of-00002.safetensors", "transformer.wte.weight": "model-00001-of-00002.safetensors" } }