hongyongjiang committed on
Commit 2799d27 · verified · 1 Parent(s): ac9542c

Upload folder using huggingface_hub
qwen3-vl-4b/acts.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:2a931f2b9373fc5d63f2d8386a808f56245ddd5e772428177a6c6a16fcdc2523
+ size 55975
qwen3-vl-4b/mmproj-fp16.npz ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:56824b179176c4112ab1fb4a1005f7156b78aced2d0b6aa99b0b102e1eb28537
+ size 642657486
qwen3-vl-4b/mmproj.txt ADDED
@@ -0,0 +1,537 @@
1
+ Loading GGUF file: mmproj-F16.gguf
2
+ Found 316 tensors
3
+ Converting v.blk.0.attn_out.bias to FP16
4
+ v.blk.0.attn_out.bias -> model.layers.0.self_attn.o_proj.bias shape: (1024,)
5
+ v.blk.0.attn_out.weight -> model.layers.0.self_attn.o_proj.weight shape: (1024, 1024)
6
+ Converting v.blk.0.attn_qkv.bias to FP16
7
+ v.blk.0.attn_qkv.bias -> model.layers.0.self_attn.qkv_proj.bias shape: (3072,)
8
+ v.blk.0.attn_qkv.weight -> model.layers.0.self_attn.qkv_proj.weight shape: (3072, 1024)
9
+ Converting v.blk.0.ffn_up.bias to FP16
10
+ v.blk.0.ffn_up.bias -> model.layers.0.mlp.up_proj.bias shape: (4096,)
11
+ v.blk.0.ffn_up.weight -> model.layers.0.mlp.up_proj.weight shape: (4096, 1024)
12
+ Converting v.blk.0.ffn_down.bias to FP16
13
+ v.blk.0.ffn_down.bias -> model.layers.0.mlp.down_proj.bias shape: (1024,)
14
+ v.blk.0.ffn_down.weight -> model.layers.0.mlp.down_proj.weight shape: (1024, 4096)
15
+ Converting v.blk.0.ln1.bias to FP16
16
+ v.blk.0.ln1.bias -> model.layers.0.ln1.bias shape: (1024,)
17
+ Converting v.blk.0.ln1.weight to FP16
18
+ v.blk.0.ln1.weight -> model.layers.0.ln1.weight shape: (1024,)
19
+ Converting v.blk.0.ln2.bias to FP16
20
+ v.blk.0.ln2.bias -> model.layers.0.ln2.bias shape: (1024,)
21
+ Converting v.blk.0.ln2.weight to FP16
22
+ v.blk.0.ln2.weight -> model.layers.0.ln2.weight shape: (1024,)
23
+ Converting v.blk.1.attn_out.bias to FP16
24
+ v.blk.1.attn_out.bias -> model.layers.1.self_attn.o_proj.bias shape: (1024,)
25
+ v.blk.1.attn_out.weight -> model.layers.1.self_attn.o_proj.weight shape: (1024, 1024)
26
+ Converting v.blk.1.attn_qkv.bias to FP16
27
+ v.blk.1.attn_qkv.bias -> model.layers.1.self_attn.qkv_proj.bias shape: (3072,)
28
+ v.blk.1.attn_qkv.weight -> model.layers.1.self_attn.qkv_proj.weight shape: (3072, 1024)
29
+ Converting v.blk.1.ffn_up.bias to FP16
30
+ v.blk.1.ffn_up.bias -> model.layers.1.mlp.up_proj.bias shape: (4096,)
31
+ v.blk.1.ffn_up.weight -> model.layers.1.mlp.up_proj.weight shape: (4096, 1024)
32
+ Converting v.blk.1.ffn_down.bias to FP16
33
+ v.blk.1.ffn_down.bias -> model.layers.1.mlp.down_proj.bias shape: (1024,)
34
+ v.blk.1.ffn_down.weight -> model.layers.1.mlp.down_proj.weight shape: (1024, 4096)
35
+ Converting v.blk.1.ln1.bias to FP16
36
+ v.blk.1.ln1.bias -> model.layers.1.ln1.bias shape: (1024,)
37
+ Converting v.blk.1.ln1.weight to FP16
38
+ v.blk.1.ln1.weight -> model.layers.1.ln1.weight shape: (1024,)
39
+ Converting v.blk.1.ln2.bias to FP16
40
+ v.blk.1.ln2.bias -> model.layers.1.ln2.bias shape: (1024,)
41
+ Converting v.blk.1.ln2.weight to FP16
42
+ v.blk.1.ln2.weight -> model.layers.1.ln2.weight shape: (1024,)
43
+ Converting v.blk.10.attn_out.bias to FP16
44
+ v.blk.10.attn_out.bias -> model.layers.10.self_attn.o_proj.bias shape: (1024,)
45
+ v.blk.10.attn_out.weight -> model.layers.10.self_attn.o_proj.weight shape: (1024, 1024)
46
+ Converting v.blk.10.attn_qkv.bias to FP16
47
+ v.blk.10.attn_qkv.bias -> model.layers.10.self_attn.qkv_proj.bias shape: (3072,)
48
+ v.blk.10.attn_qkv.weight -> model.layers.10.self_attn.qkv_proj.weight shape: (3072, 1024)
49
+ Converting v.blk.10.ffn_up.bias to FP16
50
+ v.blk.10.ffn_up.bias -> model.layers.10.mlp.up_proj.bias shape: (4096,)
51
+ v.blk.10.ffn_up.weight -> model.layers.10.mlp.up_proj.weight shape: (4096, 1024)
52
+ Converting v.blk.10.ffn_down.bias to FP16
53
+ v.blk.10.ffn_down.bias -> model.layers.10.mlp.down_proj.bias shape: (1024,)
54
+ v.blk.10.ffn_down.weight -> model.layers.10.mlp.down_proj.weight shape: (1024, 4096)
55
+ Converting v.blk.10.ln1.bias to FP16
56
+ v.blk.10.ln1.bias -> model.layers.10.ln1.bias shape: (1024,)
57
+ Converting v.blk.10.ln1.weight to FP16
58
+ v.blk.10.ln1.weight -> model.layers.10.ln1.weight shape: (1024,)
59
+ Converting v.blk.10.ln2.bias to FP16
60
+ v.blk.10.ln2.bias -> model.layers.10.ln2.bias shape: (1024,)
61
+ Converting v.blk.10.ln2.weight to FP16
62
+ v.blk.10.ln2.weight -> model.layers.10.ln2.weight shape: (1024,)
63
+ Converting v.blk.11.attn_out.bias to FP16
64
+ v.blk.11.attn_out.bias -> model.layers.11.self_attn.o_proj.bias shape: (1024,)
65
+ v.blk.11.attn_out.weight -> model.layers.11.self_attn.o_proj.weight shape: (1024, 1024)
66
+ Converting v.blk.11.attn_qkv.bias to FP16
67
+ v.blk.11.attn_qkv.bias -> model.layers.11.self_attn.qkv_proj.bias shape: (3072,)
68
+ v.blk.11.attn_qkv.weight -> model.layers.11.self_attn.qkv_proj.weight shape: (3072, 1024)
69
+ Converting v.blk.11.ffn_up.bias to FP16
70
+ v.blk.11.ffn_up.bias -> model.layers.11.mlp.up_proj.bias shape: (4096,)
71
+ v.blk.11.ffn_up.weight -> model.layers.11.mlp.up_proj.weight shape: (4096, 1024)
72
+ Converting v.blk.11.ffn_down.bias to FP16
73
+ v.blk.11.ffn_down.bias -> model.layers.11.mlp.down_proj.bias shape: (1024,)
74
+ v.blk.11.ffn_down.weight -> model.layers.11.mlp.down_proj.weight shape: (1024, 4096)
75
+ Converting v.blk.11.ln1.bias to FP16
76
+ v.blk.11.ln1.bias -> model.layers.11.ln1.bias shape: (1024,)
77
+ Converting v.blk.11.ln1.weight to FP16
78
+ v.blk.11.ln1.weight -> model.layers.11.ln1.weight shape: (1024,)
79
+ Converting v.blk.11.ln2.bias to FP16
80
+ v.blk.11.ln2.bias -> model.layers.11.ln2.bias shape: (1024,)
81
+ Converting v.blk.11.ln2.weight to FP16
82
+ v.blk.11.ln2.weight -> model.layers.11.ln2.weight shape: (1024,)
83
+ Converting v.blk.12.attn_out.bias to FP16
84
+ v.blk.12.attn_out.bias -> model.layers.12.self_attn.o_proj.bias shape: (1024,)
85
+ v.blk.12.attn_out.weight -> model.layers.12.self_attn.o_proj.weight shape: (1024, 1024)
86
+ Converting v.blk.12.attn_qkv.bias to FP16
87
+ v.blk.12.attn_qkv.bias -> model.layers.12.self_attn.qkv_proj.bias shape: (3072,)
88
+ v.blk.12.attn_qkv.weight -> model.layers.12.self_attn.qkv_proj.weight shape: (3072, 1024)
89
+ Converting v.blk.12.ffn_up.bias to FP16
90
+ v.blk.12.ffn_up.bias -> model.layers.12.mlp.up_proj.bias shape: (4096,)
91
+ v.blk.12.ffn_up.weight -> model.layers.12.mlp.up_proj.weight shape: (4096, 1024)
92
+ Converting v.blk.12.ffn_down.bias to FP16
93
+ v.blk.12.ffn_down.bias -> model.layers.12.mlp.down_proj.bias shape: (1024,)
94
+ v.blk.12.ffn_down.weight -> model.layers.12.mlp.down_proj.weight shape: (1024, 4096)
95
+ Converting v.blk.12.ln1.bias to FP16
96
+ v.blk.12.ln1.bias -> model.layers.12.ln1.bias shape: (1024,)
97
+ Converting v.blk.12.ln1.weight to FP16
98
+ v.blk.12.ln1.weight -> model.layers.12.ln1.weight shape: (1024,)
99
+ Converting v.blk.12.ln2.bias to FP16
100
+ v.blk.12.ln2.bias -> model.layers.12.ln2.bias shape: (1024,)
101
+ Converting v.blk.12.ln2.weight to FP16
102
+ v.blk.12.ln2.weight -> model.layers.12.ln2.weight shape: (1024,)
103
+ Converting v.blk.13.attn_out.bias to FP16
104
+ v.blk.13.attn_out.bias -> model.layers.13.self_attn.o_proj.bias shape: (1024,)
105
+ v.blk.13.attn_out.weight -> model.layers.13.self_attn.o_proj.weight shape: (1024, 1024)
106
+ Converting v.blk.13.attn_qkv.bias to FP16
107
+ v.blk.13.attn_qkv.bias -> model.layers.13.self_attn.qkv_proj.bias shape: (3072,)
108
+ v.blk.13.attn_qkv.weight -> model.layers.13.self_attn.qkv_proj.weight shape: (3072, 1024)
109
+ Converting v.blk.13.ffn_up.bias to FP16
110
+ v.blk.13.ffn_up.bias -> model.layers.13.mlp.up_proj.bias shape: (4096,)
111
+ v.blk.13.ffn_up.weight -> model.layers.13.mlp.up_proj.weight shape: (4096, 1024)
112
+ Converting v.blk.13.ffn_down.bias to FP16
113
+ v.blk.13.ffn_down.bias -> model.layers.13.mlp.down_proj.bias shape: (1024,)
114
+ v.blk.13.ffn_down.weight -> model.layers.13.mlp.down_proj.weight shape: (1024, 4096)
115
+ Converting v.blk.13.ln1.bias to FP16
116
+ v.blk.13.ln1.bias -> model.layers.13.ln1.bias shape: (1024,)
117
+ Converting v.blk.13.ln1.weight to FP16
118
+ v.blk.13.ln1.weight -> model.layers.13.ln1.weight shape: (1024,)
119
+ Converting v.blk.13.ln2.bias to FP16
120
+ v.blk.13.ln2.bias -> model.layers.13.ln2.bias shape: (1024,)
121
+ Converting v.blk.13.ln2.weight to FP16
122
+ v.blk.13.ln2.weight -> model.layers.13.ln2.weight shape: (1024,)
123
+ Converting v.blk.14.attn_out.bias to FP16
124
+ v.blk.14.attn_out.bias -> model.layers.14.self_attn.o_proj.bias shape: (1024,)
125
+ v.blk.14.attn_out.weight -> model.layers.14.self_attn.o_proj.weight shape: (1024, 1024)
126
+ Converting v.blk.14.attn_qkv.bias to FP16
127
+ v.blk.14.attn_qkv.bias -> model.layers.14.self_attn.qkv_proj.bias shape: (3072,)
128
+ v.blk.14.attn_qkv.weight -> model.layers.14.self_attn.qkv_proj.weight shape: (3072, 1024)
129
+ Converting v.blk.14.ffn_up.bias to FP16
130
+ v.blk.14.ffn_up.bias -> model.layers.14.mlp.up_proj.bias shape: (4096,)
131
+ v.blk.14.ffn_up.weight -> model.layers.14.mlp.up_proj.weight shape: (4096, 1024)
132
+ Converting v.blk.14.ffn_down.bias to FP16
133
+ v.blk.14.ffn_down.bias -> model.layers.14.mlp.down_proj.bias shape: (1024,)
134
+ v.blk.14.ffn_down.weight -> model.layers.14.mlp.down_proj.weight shape: (1024, 4096)
135
+ Converting v.blk.14.ln1.bias to FP16
136
+ v.blk.14.ln1.bias -> model.layers.14.ln1.bias shape: (1024,)
137
+ Converting v.blk.14.ln1.weight to FP16
138
+ v.blk.14.ln1.weight -> model.layers.14.ln1.weight shape: (1024,)
139
+ Converting v.blk.14.ln2.bias to FP16
140
+ v.blk.14.ln2.bias -> model.layers.14.ln2.bias shape: (1024,)
141
+ Converting v.blk.14.ln2.weight to FP16
142
+ v.blk.14.ln2.weight -> model.layers.14.ln2.weight shape: (1024,)
143
+ Converting v.blk.15.attn_out.bias to FP16
144
+ v.blk.15.attn_out.bias -> model.layers.15.self_attn.o_proj.bias shape: (1024,)
145
+ v.blk.15.attn_out.weight -> model.layers.15.self_attn.o_proj.weight shape: (1024, 1024)
146
+ Converting v.blk.15.attn_qkv.bias to FP16
147
+ v.blk.15.attn_qkv.bias -> model.layers.15.self_attn.qkv_proj.bias shape: (3072,)
148
+ v.blk.15.attn_qkv.weight -> model.layers.15.self_attn.qkv_proj.weight shape: (3072, 1024)
149
+ Converting v.blk.15.ffn_up.bias to FP16
150
+ v.blk.15.ffn_up.bias -> model.layers.15.mlp.up_proj.bias shape: (4096,)
151
+ v.blk.15.ffn_up.weight -> model.layers.15.mlp.up_proj.weight shape: (4096, 1024)
152
+ Converting v.blk.15.ffn_down.bias to FP16
153
+ v.blk.15.ffn_down.bias -> model.layers.15.mlp.down_proj.bias shape: (1024,)
154
+ v.blk.15.ffn_down.weight -> model.layers.15.mlp.down_proj.weight shape: (1024, 4096)
155
+ Converting v.blk.15.ln1.bias to FP16
156
+ v.blk.15.ln1.bias -> model.layers.15.ln1.bias shape: (1024,)
157
+ Converting v.blk.15.ln1.weight to FP16
158
+ v.blk.15.ln1.weight -> model.layers.15.ln1.weight shape: (1024,)
159
+ Converting v.blk.15.ln2.bias to FP16
160
+ v.blk.15.ln2.bias -> model.layers.15.ln2.bias shape: (1024,)
161
+ Converting v.blk.15.ln2.weight to FP16
162
+ v.blk.15.ln2.weight -> model.layers.15.ln2.weight shape: (1024,)
163
+ Converting v.blk.16.attn_out.bias to FP16
164
+ v.blk.16.attn_out.bias -> model.layers.16.self_attn.o_proj.bias shape: (1024,)
165
+ v.blk.16.attn_out.weight -> model.layers.16.self_attn.o_proj.weight shape: (1024, 1024)
166
+ Converting v.blk.16.attn_qkv.bias to FP16
167
+ v.blk.16.attn_qkv.bias -> model.layers.16.self_attn.qkv_proj.bias shape: (3072,)
168
+ v.blk.16.attn_qkv.weight -> model.layers.16.self_attn.qkv_proj.weight shape: (3072, 1024)
169
+ Converting v.blk.16.ffn_up.bias to FP16
170
+ v.blk.16.ffn_up.bias -> model.layers.16.mlp.up_proj.bias shape: (4096,)
171
+ v.blk.16.ffn_up.weight -> model.layers.16.mlp.up_proj.weight shape: (4096, 1024)
172
+ Converting v.blk.16.ffn_down.bias to FP16
173
+ v.blk.16.ffn_down.bias -> model.layers.16.mlp.down_proj.bias shape: (1024,)
174
+ v.blk.16.ffn_down.weight -> model.layers.16.mlp.down_proj.weight shape: (1024, 4096)
175
+ Converting v.blk.16.ln1.bias to FP16
176
+ v.blk.16.ln1.bias -> model.layers.16.ln1.bias shape: (1024,)
177
+ Converting v.blk.16.ln1.weight to FP16
178
+ v.blk.16.ln1.weight -> model.layers.16.ln1.weight shape: (1024,)
179
+ Converting v.blk.16.ln2.bias to FP16
180
+ v.blk.16.ln2.bias -> model.layers.16.ln2.bias shape: (1024,)
181
+ Converting v.blk.16.ln2.weight to FP16
182
+ v.blk.16.ln2.weight -> model.layers.16.ln2.weight shape: (1024,)
183
+ Converting v.blk.17.attn_out.bias to FP16
184
+ v.blk.17.attn_out.bias -> model.layers.17.self_attn.o_proj.bias shape: (1024,)
185
+ v.blk.17.attn_out.weight -> model.layers.17.self_attn.o_proj.weight shape: (1024, 1024)
186
+ Converting v.blk.17.attn_qkv.bias to FP16
187
+ v.blk.17.attn_qkv.bias -> model.layers.17.self_attn.qkv_proj.bias shape: (3072,)
188
+ v.blk.17.attn_qkv.weight -> model.layers.17.self_attn.qkv_proj.weight shape: (3072, 1024)
189
+ Converting v.blk.17.ffn_up.bias to FP16
190
+ v.blk.17.ffn_up.bias -> model.layers.17.mlp.up_proj.bias shape: (4096,)
191
+ v.blk.17.ffn_up.weight -> model.layers.17.mlp.up_proj.weight shape: (4096, 1024)
192
+ Converting v.blk.17.ffn_down.bias to FP16
193
+ v.blk.17.ffn_down.bias -> model.layers.17.mlp.down_proj.bias shape: (1024,)
194
+ v.blk.17.ffn_down.weight -> model.layers.17.mlp.down_proj.weight shape: (1024, 4096)
195
+ Converting v.blk.17.ln1.bias to FP16
196
+ v.blk.17.ln1.bias -> model.layers.17.ln1.bias shape: (1024,)
197
+ Converting v.blk.17.ln1.weight to FP16
198
+ v.blk.17.ln1.weight -> model.layers.17.ln1.weight shape: (1024,)
199
+ Converting v.blk.17.ln2.bias to FP16
200
+ v.blk.17.ln2.bias -> model.layers.17.ln2.bias shape: (1024,)
201
+ Converting v.blk.17.ln2.weight to FP16
202
+ v.blk.17.ln2.weight -> model.layers.17.ln2.weight shape: (1024,)
203
+ Converting v.blk.18.attn_out.bias to FP16
204
+ v.blk.18.attn_out.bias -> model.layers.18.self_attn.o_proj.bias shape: (1024,)
205
+ v.blk.18.attn_out.weight -> model.layers.18.self_attn.o_proj.weight shape: (1024, 1024)
206
+ Converting v.blk.18.attn_qkv.bias to FP16
207
+ v.blk.18.attn_qkv.bias -> model.layers.18.self_attn.qkv_proj.bias shape: (3072,)
208
+ v.blk.18.attn_qkv.weight -> model.layers.18.self_attn.qkv_proj.weight shape: (3072, 1024)
209
+ Converting v.blk.18.ffn_up.bias to FP16
210
+ v.blk.18.ffn_up.bias -> model.layers.18.mlp.up_proj.bias shape: (4096,)
211
+ v.blk.18.ffn_up.weight -> model.layers.18.mlp.up_proj.weight shape: (4096, 1024)
212
+ Converting v.blk.18.ffn_down.bias to FP16
213
+ v.blk.18.ffn_down.bias -> model.layers.18.mlp.down_proj.bias shape: (1024,)
214
+ v.blk.18.ffn_down.weight -> model.layers.18.mlp.down_proj.weight shape: (1024, 4096)
215
+ Converting v.blk.18.ln1.bias to FP16
216
+ v.blk.18.ln1.bias -> model.layers.18.ln1.bias shape: (1024,)
217
+ Converting v.blk.18.ln1.weight to FP16
218
+ v.blk.18.ln1.weight -> model.layers.18.ln1.weight shape: (1024,)
219
+ Converting v.blk.18.ln2.bias to FP16
220
+ v.blk.18.ln2.bias -> model.layers.18.ln2.bias shape: (1024,)
221
+ Converting v.blk.18.ln2.weight to FP16
222
+ v.blk.18.ln2.weight -> model.layers.18.ln2.weight shape: (1024,)
223
+ Converting v.blk.19.attn_out.bias to FP16
224
+ v.blk.19.attn_out.bias -> model.layers.19.self_attn.o_proj.bias shape: (1024,)
225
+ v.blk.19.attn_out.weight -> model.layers.19.self_attn.o_proj.weight shape: (1024, 1024)
226
+ Converting v.blk.19.attn_qkv.bias to FP16
227
+ v.blk.19.attn_qkv.bias -> model.layers.19.self_attn.qkv_proj.bias shape: (3072,)
228
+ v.blk.19.attn_qkv.weight -> model.layers.19.self_attn.qkv_proj.weight shape: (3072, 1024)
229
+ Converting v.blk.19.ffn_up.bias to FP16
230
+ v.blk.19.ffn_up.bias -> model.layers.19.mlp.up_proj.bias shape: (4096,)
231
+ v.blk.19.ffn_up.weight -> model.layers.19.mlp.up_proj.weight shape: (4096, 1024)
232
+ Converting v.blk.19.ffn_down.bias to FP16
233
+ v.blk.19.ffn_down.bias -> model.layers.19.mlp.down_proj.bias shape: (1024,)
234
+ v.blk.19.ffn_down.weight -> model.layers.19.mlp.down_proj.weight shape: (1024, 4096)
235
+ Converting v.blk.19.ln1.bias to FP16
236
+ v.blk.19.ln1.bias -> model.layers.19.ln1.bias shape: (1024,)
237
+ Converting v.blk.19.ln1.weight to FP16
238
+ v.blk.19.ln1.weight -> model.layers.19.ln1.weight shape: (1024,)
239
+ Converting v.blk.19.ln2.bias to FP16
240
+ v.blk.19.ln2.bias -> model.layers.19.ln2.bias shape: (1024,)
241
+ Converting v.blk.19.ln2.weight to FP16
242
+ v.blk.19.ln2.weight -> model.layers.19.ln2.weight shape: (1024,)
243
+ Converting v.blk.2.attn_out.bias to FP16
244
+ v.blk.2.attn_out.bias -> model.layers.2.self_attn.o_proj.bias shape: (1024,)
245
+ v.blk.2.attn_out.weight -> model.layers.2.self_attn.o_proj.weight shape: (1024, 1024)
246
+ Converting v.blk.2.attn_qkv.bias to FP16
247
+ v.blk.2.attn_qkv.bias -> model.layers.2.self_attn.qkv_proj.bias shape: (3072,)
248
+ v.blk.2.attn_qkv.weight -> model.layers.2.self_attn.qkv_proj.weight shape: (3072, 1024)
249
+ Converting v.blk.2.ffn_up.bias to FP16
250
+ v.blk.2.ffn_up.bias -> model.layers.2.mlp.up_proj.bias shape: (4096,)
251
+ v.blk.2.ffn_up.weight -> model.layers.2.mlp.up_proj.weight shape: (4096, 1024)
252
+ Converting v.blk.2.ffn_down.bias to FP16
253
+ v.blk.2.ffn_down.bias -> model.layers.2.mlp.down_proj.bias shape: (1024,)
254
+ v.blk.2.ffn_down.weight -> model.layers.2.mlp.down_proj.weight shape: (1024, 4096)
255
+ Converting v.blk.2.ln1.bias to FP16
256
+ v.blk.2.ln1.bias -> model.layers.2.ln1.bias shape: (1024,)
257
+ Converting v.blk.2.ln1.weight to FP16
258
+ v.blk.2.ln1.weight -> model.layers.2.ln1.weight shape: (1024,)
259
+ Converting v.blk.2.ln2.bias to FP16
260
+ v.blk.2.ln2.bias -> model.layers.2.ln2.bias shape: (1024,)
261
+ Converting v.blk.2.ln2.weight to FP16
262
+ v.blk.2.ln2.weight -> model.layers.2.ln2.weight shape: (1024,)
263
+ Converting v.blk.20.attn_out.bias to FP16
264
+ v.blk.20.attn_out.bias -> model.layers.20.self_attn.o_proj.bias shape: (1024,)
265
+ v.blk.20.attn_out.weight -> model.layers.20.self_attn.o_proj.weight shape: (1024, 1024)
266
+ Converting v.blk.20.attn_qkv.bias to FP16
267
+ v.blk.20.attn_qkv.bias -> model.layers.20.self_attn.qkv_proj.bias shape: (3072,)
268
+ v.blk.20.attn_qkv.weight -> model.layers.20.self_attn.qkv_proj.weight shape: (3072, 1024)
269
+ Converting v.blk.20.ffn_up.bias to FP16
270
+ v.blk.20.ffn_up.bias -> model.layers.20.mlp.up_proj.bias shape: (4096,)
271
+ v.blk.20.ffn_up.weight -> model.layers.20.mlp.up_proj.weight shape: (4096, 1024)
272
+ Converting v.blk.20.ffn_down.bias to FP16
273
+ v.blk.20.ffn_down.bias -> model.layers.20.mlp.down_proj.bias shape: (1024,)
274
+ v.blk.20.ffn_down.weight -> model.layers.20.mlp.down_proj.weight shape: (1024, 4096)
275
+ Converting v.blk.20.ln1.bias to FP16
276
+ v.blk.20.ln1.bias -> model.layers.20.ln1.bias shape: (1024,)
277
+ Converting v.blk.20.ln1.weight to FP16
278
+ v.blk.20.ln1.weight -> model.layers.20.ln1.weight shape: (1024,)
279
+ Converting v.blk.20.ln2.bias to FP16
280
+ v.blk.20.ln2.bias -> model.layers.20.ln2.bias shape: (1024,)
281
+ Converting v.blk.20.ln2.weight to FP16
282
+ v.blk.20.ln2.weight -> model.layers.20.ln2.weight shape: (1024,)
283
+ Converting v.blk.21.attn_out.bias to FP16
284
+ v.blk.21.attn_out.bias -> model.layers.21.self_attn.o_proj.bias shape: (1024,)
285
+ v.blk.21.attn_out.weight -> model.layers.21.self_attn.o_proj.weight shape: (1024, 1024)
286
+ Converting v.blk.21.attn_qkv.bias to FP16
287
+ v.blk.21.attn_qkv.bias -> model.layers.21.self_attn.qkv_proj.bias shape: (3072,)
288
+ v.blk.21.attn_qkv.weight -> model.layers.21.self_attn.qkv_proj.weight shape: (3072, 1024)
289
+ Converting v.blk.21.ffn_up.bias to FP16
290
+ v.blk.21.ffn_up.bias -> model.layers.21.mlp.up_proj.bias shape: (4096,)
291
+ v.blk.21.ffn_up.weight -> model.layers.21.mlp.up_proj.weight shape: (4096, 1024)
292
+ Converting v.blk.21.ffn_down.bias to FP16
293
+ v.blk.21.ffn_down.bias -> model.layers.21.mlp.down_proj.bias shape: (1024,)
294
+ v.blk.21.ffn_down.weight -> model.layers.21.mlp.down_proj.weight shape: (1024, 4096)
295
+ Converting v.blk.21.ln1.bias to FP16
296
+ v.blk.21.ln1.bias -> model.layers.21.ln1.bias shape: (1024,)
297
+ Converting v.blk.21.ln1.weight to FP16
298
+ v.blk.21.ln1.weight -> model.layers.21.ln1.weight shape: (1024,)
299
+ Converting v.blk.21.ln2.bias to FP16
300
+ v.blk.21.ln2.bias -> model.layers.21.ln2.bias shape: (1024,)
301
+ Converting v.blk.21.ln2.weight to FP16
302
+ v.blk.21.ln2.weight -> model.layers.21.ln2.weight shape: (1024,)
303
+ Converting v.blk.22.attn_out.bias to FP16
304
+ v.blk.22.attn_out.bias -> model.layers.22.self_attn.o_proj.bias shape: (1024,)
305
+ v.blk.22.attn_out.weight -> model.layers.22.self_attn.o_proj.weight shape: (1024, 1024)
306
+ Converting v.blk.22.attn_qkv.bias to FP16
307
+ v.blk.22.attn_qkv.bias -> model.layers.22.self_attn.qkv_proj.bias shape: (3072,)
308
+ v.blk.22.attn_qkv.weight -> model.layers.22.self_attn.qkv_proj.weight shape: (3072, 1024)
309
+ Converting v.blk.22.ffn_up.bias to FP16
310
+ v.blk.22.ffn_up.bias -> model.layers.22.mlp.up_proj.bias shape: (4096,)
311
+ v.blk.22.ffn_up.weight -> model.layers.22.mlp.up_proj.weight shape: (4096, 1024)
312
+ Converting v.blk.22.ffn_down.bias to FP16
313
+ v.blk.22.ffn_down.bias -> model.layers.22.mlp.down_proj.bias shape: (1024,)
314
+ v.blk.22.ffn_down.weight -> model.layers.22.mlp.down_proj.weight shape: (1024, 4096)
315
+ Converting v.blk.22.ln1.bias to FP16
316
+ v.blk.22.ln1.bias -> model.layers.22.ln1.bias shape: (1024,)
317
+ Converting v.blk.22.ln1.weight to FP16
318
+ v.blk.22.ln1.weight -> model.layers.22.ln1.weight shape: (1024,)
319
+ Converting v.blk.22.ln2.bias to FP16
320
+ v.blk.22.ln2.bias -> model.layers.22.ln2.bias shape: (1024,)
321
+ Converting v.blk.22.ln2.weight to FP16
322
+ v.blk.22.ln2.weight -> model.layers.22.ln2.weight shape: (1024,)
323
+ Converting v.blk.23.attn_out.bias to FP16
324
+ v.blk.23.attn_out.bias -> model.layers.23.self_attn.o_proj.bias shape: (1024,)
325
+ v.blk.23.attn_out.weight -> model.layers.23.self_attn.o_proj.weight shape: (1024, 1024)
326
+ Converting v.blk.23.attn_qkv.bias to FP16
327
+ v.blk.23.attn_qkv.bias -> model.layers.23.self_attn.qkv_proj.bias shape: (3072,)
328
+ v.blk.23.attn_qkv.weight -> model.layers.23.self_attn.qkv_proj.weight shape: (3072, 1024)
329
+ Converting v.blk.23.ffn_up.bias to FP16
330
+ v.blk.23.ffn_up.bias -> model.layers.23.mlp.up_proj.bias shape: (4096,)
331
+ v.blk.23.ffn_up.weight -> model.layers.23.mlp.up_proj.weight shape: (4096, 1024)
332
+ Converting v.blk.23.ffn_down.bias to FP16
333
+ v.blk.23.ffn_down.bias -> model.layers.23.mlp.down_proj.bias shape: (1024,)
334
+ v.blk.23.ffn_down.weight -> model.layers.23.mlp.down_proj.weight shape: (1024, 4096)
335
+ Converting v.blk.23.ln1.bias to FP16
336
+ v.blk.23.ln1.bias -> model.layers.23.ln1.bias shape: (1024,)
337
+ Converting v.blk.23.ln1.weight to FP16
338
+ v.blk.23.ln1.weight -> model.layers.23.ln1.weight shape: (1024,)
339
+ Converting v.blk.23.ln2.bias to FP16
340
+ v.blk.23.ln2.bias -> model.layers.23.ln2.bias shape: (1024,)
341
+ Converting v.blk.23.ln2.weight to FP16
342
+ v.blk.23.ln2.weight -> model.layers.23.ln2.weight shape: (1024,)
343
+ Converting v.blk.3.attn_out.bias to FP16
344
+ v.blk.3.attn_out.bias -> model.layers.3.self_attn.o_proj.bias shape: (1024,)
345
+ v.blk.3.attn_out.weight -> model.layers.3.self_attn.o_proj.weight shape: (1024, 1024)
346
+ Converting v.blk.3.attn_qkv.bias to FP16
347
+ v.blk.3.attn_qkv.bias -> model.layers.3.self_attn.qkv_proj.bias shape: (3072,)
348
+ v.blk.3.attn_qkv.weight -> model.layers.3.self_attn.qkv_proj.weight shape: (3072, 1024)
349
+ Converting v.blk.3.ffn_up.bias to FP16
350
+ v.blk.3.ffn_up.bias -> model.layers.3.mlp.up_proj.bias shape: (4096,)
351
+ v.blk.3.ffn_up.weight -> model.layers.3.mlp.up_proj.weight shape: (4096, 1024)
352
+ Converting v.blk.3.ffn_down.bias to FP16
353
+ v.blk.3.ffn_down.bias -> model.layers.3.mlp.down_proj.bias shape: (1024,)
354
+ v.blk.3.ffn_down.weight -> model.layers.3.mlp.down_proj.weight shape: (1024, 4096)
355
+ Converting v.blk.3.ln1.bias to FP16
356
+ v.blk.3.ln1.bias -> model.layers.3.ln1.bias shape: (1024,)
357
+ Converting v.blk.3.ln1.weight to FP16
358
+ v.blk.3.ln1.weight -> model.layers.3.ln1.weight shape: (1024,)
359
+ Converting v.blk.3.ln2.bias to FP16
360
+ v.blk.3.ln2.bias -> model.layers.3.ln2.bias shape: (1024,)
361
+ Converting v.blk.3.ln2.weight to FP16
362
+ v.blk.3.ln2.weight -> model.layers.3.ln2.weight shape: (1024,)
363
+ Converting v.blk.4.attn_out.bias to FP16
364
+ v.blk.4.attn_out.bias -> model.layers.4.self_attn.o_proj.bias shape: (1024,)
365
+ v.blk.4.attn_out.weight -> model.layers.4.self_attn.o_proj.weight shape: (1024, 1024)
366
+ Converting v.blk.4.attn_qkv.bias to FP16
367
+ v.blk.4.attn_qkv.bias -> model.layers.4.self_attn.qkv_proj.bias shape: (3072,)
368
+ v.blk.4.attn_qkv.weight -> model.layers.4.self_attn.qkv_proj.weight shape: (3072, 1024)
369
+ Converting v.blk.4.ffn_up.bias to FP16
370
+ v.blk.4.ffn_up.bias -> model.layers.4.mlp.up_proj.bias shape: (4096,)
371
+ v.blk.4.ffn_up.weight -> model.layers.4.mlp.up_proj.weight shape: (4096, 1024)
372
+ Converting v.blk.4.ffn_down.bias to FP16
373
+ v.blk.4.ffn_down.bias -> model.layers.4.mlp.down_proj.bias shape: (1024,)
374
+ v.blk.4.ffn_down.weight -> model.layers.4.mlp.down_proj.weight shape: (1024, 4096)
375
+ Converting v.blk.4.ln1.bias to FP16
376
+ v.blk.4.ln1.bias -> model.layers.4.ln1.bias shape: (1024,)
377
+ Converting v.blk.4.ln1.weight to FP16
378
+ v.blk.4.ln1.weight -> model.layers.4.ln1.weight shape: (1024,)
379
+ Converting v.blk.4.ln2.bias to FP16
380
+ v.blk.4.ln2.bias -> model.layers.4.ln2.bias shape: (1024,)
381
+ Converting v.blk.4.ln2.weight to FP16
382
+ v.blk.4.ln2.weight -> model.layers.4.ln2.weight shape: (1024,)
383
+ Converting v.blk.5.attn_out.bias to FP16
384
+ v.blk.5.attn_out.bias -> model.layers.5.self_attn.o_proj.bias shape: (1024,)
385
+ v.blk.5.attn_out.weight -> model.layers.5.self_attn.o_proj.weight shape: (1024, 1024)
386
+ Converting v.blk.5.attn_qkv.bias to FP16
387
+ v.blk.5.attn_qkv.bias -> model.layers.5.self_attn.qkv_proj.bias shape: (3072,)
388
+ v.blk.5.attn_qkv.weight -> model.layers.5.self_attn.qkv_proj.weight shape: (3072, 1024)
389
+ Converting v.blk.5.ffn_up.bias to FP16
390
+ v.blk.5.ffn_up.bias -> model.layers.5.mlp.up_proj.bias shape: (4096,)
391
+ v.blk.5.ffn_up.weight -> model.layers.5.mlp.up_proj.weight shape: (4096, 1024)
392
+ Converting v.blk.5.ffn_down.bias to FP16
393
+ v.blk.5.ffn_down.bias -> model.layers.5.mlp.down_proj.bias shape: (1024,)
394
+ v.blk.5.ffn_down.weight -> model.layers.5.mlp.down_proj.weight shape: (1024, 4096)
395
+ Converting v.blk.5.ln1.bias to FP16
396
+ v.blk.5.ln1.bias -> model.layers.5.ln1.bias shape: (1024,)
397
+ Converting v.blk.5.ln1.weight to FP16
398
+ v.blk.5.ln1.weight -> model.layers.5.ln1.weight shape: (1024,)
399
+ Converting v.blk.5.ln2.bias to FP16
400
+ v.blk.5.ln2.bias -> model.layers.5.ln2.bias shape: (1024,)
401
+ Converting v.blk.5.ln2.weight to FP16
402
+ v.blk.5.ln2.weight -> model.layers.5.ln2.weight shape: (1024,)
403
+ Converting v.blk.6.attn_out.bias to FP16
404
+ v.blk.6.attn_out.bias -> model.layers.6.self_attn.o_proj.bias shape: (1024,)
405
+ v.blk.6.attn_out.weight -> model.layers.6.self_attn.o_proj.weight shape: (1024, 1024)
406
+ Converting v.blk.6.attn_qkv.bias to FP16
407
+ v.blk.6.attn_qkv.bias -> model.layers.6.self_attn.qkv_proj.bias shape: (3072,)
408
+ v.blk.6.attn_qkv.weight -> model.layers.6.self_attn.qkv_proj.weight shape: (3072, 1024)
409
+ Converting v.blk.6.ffn_up.bias to FP16
410
+ v.blk.6.ffn_up.bias -> model.layers.6.mlp.up_proj.bias shape: (4096,)
411
+ v.blk.6.ffn_up.weight -> model.layers.6.mlp.up_proj.weight shape: (4096, 1024)
412
+ Converting v.blk.6.ffn_down.bias to FP16
413
+ v.blk.6.ffn_down.bias -> model.layers.6.mlp.down_proj.bias shape: (1024,)
414
+ v.blk.6.ffn_down.weight -> model.layers.6.mlp.down_proj.weight shape: (1024, 4096)
415
+ Converting v.blk.6.ln1.bias to FP16
416
+ v.blk.6.ln1.bias -> model.layers.6.ln1.bias shape: (1024,)
417
+ Converting v.blk.6.ln1.weight to FP16
418
+ v.blk.6.ln1.weight -> model.layers.6.ln1.weight shape: (1024,)
419
+ Converting v.blk.6.ln2.bias to FP16
420
+ v.blk.6.ln2.bias -> model.layers.6.ln2.bias shape: (1024,)
421
+ Converting v.blk.6.ln2.weight to FP16
422
+ v.blk.6.ln2.weight -> model.layers.6.ln2.weight shape: (1024,)
423
+ Converting v.blk.7.attn_out.bias to FP16
424
+ v.blk.7.attn_out.bias -> model.layers.7.self_attn.o_proj.bias shape: (1024,)
425
+ v.blk.7.attn_out.weight -> model.layers.7.self_attn.o_proj.weight shape: (1024, 1024)
426
+ Converting v.blk.7.attn_qkv.bias to FP16
427
+ v.blk.7.attn_qkv.bias -> model.layers.7.self_attn.qkv_proj.bias shape: (3072,)
428
+ v.blk.7.attn_qkv.weight -> model.layers.7.self_attn.qkv_proj.weight shape: (3072, 1024)
+ Converting v.blk.7.ffn_up.bias to FP16
+ v.blk.7.ffn_up.bias -> model.layers.7.mlp.up_proj.bias shape: (4096,)
+ v.blk.7.ffn_up.weight -> model.layers.7.mlp.up_proj.weight shape: (4096, 1024)
+ Converting v.blk.7.ffn_down.bias to FP16
+ v.blk.7.ffn_down.bias -> model.layers.7.mlp.down_proj.bias shape: (1024,)
+ v.blk.7.ffn_down.weight -> model.layers.7.mlp.down_proj.weight shape: (1024, 4096)
+ Converting v.blk.7.ln1.bias to FP16
+ v.blk.7.ln1.bias -> model.layers.7.ln1.bias shape: (1024,)
+ Converting v.blk.7.ln1.weight to FP16
+ v.blk.7.ln1.weight -> model.layers.7.ln1.weight shape: (1024,)
+ Converting v.blk.7.ln2.bias to FP16
+ v.blk.7.ln2.bias -> model.layers.7.ln2.bias shape: (1024,)
+ Converting v.blk.7.ln2.weight to FP16
+ v.blk.7.ln2.weight -> model.layers.7.ln2.weight shape: (1024,)
+ Converting v.blk.8.attn_out.bias to FP16
+ v.blk.8.attn_out.bias -> model.layers.8.self_attn.o_proj.bias shape: (1024,)
+ v.blk.8.attn_out.weight -> model.layers.8.self_attn.o_proj.weight shape: (1024, 1024)
+ Converting v.blk.8.attn_qkv.bias to FP16
+ v.blk.8.attn_qkv.bias -> model.layers.8.self_attn.qkv_proj.bias shape: (3072,)
+ v.blk.8.attn_qkv.weight -> model.layers.8.self_attn.qkv_proj.weight shape: (3072, 1024)
+ Converting v.blk.8.ffn_up.bias to FP16
+ v.blk.8.ffn_up.bias -> model.layers.8.mlp.up_proj.bias shape: (4096,)
+ v.blk.8.ffn_up.weight -> model.layers.8.mlp.up_proj.weight shape: (4096, 1024)
+ Converting v.blk.8.ffn_down.bias to FP16
+ v.blk.8.ffn_down.bias -> model.layers.8.mlp.down_proj.bias shape: (1024,)
+ v.blk.8.ffn_down.weight -> model.layers.8.mlp.down_proj.weight shape: (1024, 4096)
+ Converting v.blk.8.ln1.bias to FP16
+ v.blk.8.ln1.bias -> model.layers.8.ln1.bias shape: (1024,)
+ Converting v.blk.8.ln1.weight to FP16
+ v.blk.8.ln1.weight -> model.layers.8.ln1.weight shape: (1024,)
+ Converting v.blk.8.ln2.bias to FP16
+ v.blk.8.ln2.bias -> model.layers.8.ln2.bias shape: (1024,)
+ Converting v.blk.8.ln2.weight to FP16
+ v.blk.8.ln2.weight -> model.layers.8.ln2.weight shape: (1024,)
+ Converting v.blk.9.attn_out.bias to FP16
+ v.blk.9.attn_out.bias -> model.layers.9.self_attn.o_proj.bias shape: (1024,)
+ v.blk.9.attn_out.weight -> model.layers.9.self_attn.o_proj.weight shape: (1024, 1024)
+ Converting v.blk.9.attn_qkv.bias to FP16
+ v.blk.9.attn_qkv.bias -> model.layers.9.self_attn.qkv_proj.bias shape: (3072,)
+ v.blk.9.attn_qkv.weight -> model.layers.9.self_attn.qkv_proj.weight shape: (3072, 1024)
+ Converting v.blk.9.ffn_up.bias to FP16
+ v.blk.9.ffn_up.bias -> model.layers.9.mlp.up_proj.bias shape: (4096,)
+ v.blk.9.ffn_up.weight -> model.layers.9.mlp.up_proj.weight shape: (4096, 1024)
+ Converting v.blk.9.ffn_down.bias to FP16
+ v.blk.9.ffn_down.bias -> model.layers.9.mlp.down_proj.bias shape: (1024,)
+ v.blk.9.ffn_down.weight -> model.layers.9.mlp.down_proj.weight shape: (1024, 4096)
+ Converting v.blk.9.ln1.bias to FP16
+ v.blk.9.ln1.bias -> model.layers.9.ln1.bias shape: (1024,)
+ Converting v.blk.9.ln1.weight to FP16
+ v.blk.9.ln1.weight -> model.layers.9.ln1.weight shape: (1024,)
+ Converting v.blk.9.ln2.bias to FP16
+ v.blk.9.ln2.bias -> model.layers.9.ln2.bias shape: (1024,)
+ Converting v.blk.9.ln2.weight to FP16
+ v.blk.9.ln2.weight -> model.layers.9.ln2.weight shape: (1024,)
+ Converting v.deepstack.5.fc1.bias to FP16
+ v.deepstack.5.fc1.bias -> model.deepstack.5.fc1.bias shape: (4096,)
+ v.deepstack.5.fc1.weight -> model.deepstack.5.fc1.weight shape: (4096, 4096)
+ Converting v.deepstack.5.fc2.bias to FP16
+ v.deepstack.5.fc2.bias -> model.deepstack.5.fc2.bias shape: (2560,)
+ v.deepstack.5.fc2.weight -> model.deepstack.5.fc2.weight shape: (2560, 4096)
+ Converting v.deepstack.5.norm.bias to FP16
+ v.deepstack.5.norm.bias -> model.deepstack.5.norm.bias shape: (4096,)
+ Converting v.deepstack.5.norm.weight to FP16
+ v.deepstack.5.norm.weight -> model.deepstack.5.norm.weight shape: (4096,)
+ Converting v.deepstack.11.fc1.bias to FP16
+ v.deepstack.11.fc1.bias -> model.deepstack.11.fc1.bias shape: (4096,)
+ v.deepstack.11.fc1.weight -> model.deepstack.11.fc1.weight shape: (4096, 4096)
+ Converting v.deepstack.11.fc2.bias to FP16
+ v.deepstack.11.fc2.bias -> model.deepstack.11.fc2.bias shape: (2560,)
+ v.deepstack.11.fc2.weight -> model.deepstack.11.fc2.weight shape: (2560, 4096)
+ Converting v.deepstack.11.norm.bias to FP16
+ v.deepstack.11.norm.bias -> model.deepstack.11.norm.bias shape: (4096,)
+ Converting v.deepstack.11.norm.weight to FP16
+ v.deepstack.11.norm.weight -> model.deepstack.11.norm.weight shape: (4096,)
+ Converting v.deepstack.17.fc1.bias to FP16
+ v.deepstack.17.fc1.bias -> model.deepstack.17.fc1.bias shape: (4096,)
+ v.deepstack.17.fc1.weight -> model.deepstack.17.fc1.weight shape: (4096, 4096)
+ Converting v.deepstack.17.fc2.bias to FP16
+ v.deepstack.17.fc2.bias -> model.deepstack.17.fc2.bias shape: (2560,)
+ v.deepstack.17.fc2.weight -> model.deepstack.17.fc2.weight shape: (2560, 4096)
+ Converting v.deepstack.17.norm.bias to FP16
+ v.deepstack.17.norm.bias -> model.deepstack.17.norm.bias shape: (4096,)
+ Converting v.deepstack.17.norm.weight to FP16
+ v.deepstack.17.norm.weight -> model.deepstack.17.norm.weight shape: (4096,)
+ Converting mm.0.bias to FP16
+ mm.0.bias -> model.mm.0.bias shape: (4096,)
+ mm.0.weight -> model.mm.0.weight shape: (4096, 4096)
+ Converting mm.2.bias to FP16
+ mm.2.bias -> model.mm.2.bias shape: (2560,)
+ mm.2.weight -> model.mm.2.weight shape: (2560, 4096)
+ Converting v.post_ln.bias to FP16
+ v.post_ln.bias -> model.post_ln.bias shape: (1024,)
+ Converting v.post_ln.weight to FP16
+ v.post_ln.weight -> model.post_ln.weight shape: (1024,)
+ Converting v.patch_embd.bias to FP16
+ v.patch_embd.bias -> model.patch_embd.bias shape: (1024,)
+ v.patch_embd.weight -> model.patch_embd.weight shape: (1024, 3, 16, 16)
+ v.patch_embd.weight.1 -> model.patch_embd.weight.1 shape: (1024, 3, 16, 16)
+ Converting v.position_embd.weight to FP16
+ v.position_embd.weight -> model.position_embd.weight shape: (2304, 1024)
+
+ Converted 316 tensors
+
+ All required tensors present!
+
+ Saving to qwen3-vl-4b/mmproj-fp16.npz...
+ Output file size: 0.60 GB
+
+ Conversion complete!
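The log above implies a systematic rename from GGUF vision-tower tensor names (`v.blk.N.*`, `v.deepstack.N.*`, `mm.*`) to the `model.*` layout in the npz. A minimal sketch of that mapping, inferred only from the log lines (the `remap_name` function and its regex are assumptions, not the actual converter's code):

```python
# Hypothetical reconstruction of the GGUF -> npz tensor-name remapping
# suggested by the conversion log; not the converter's real implementation.
import re

# Per-block sub-module renames observed in the log.
PART_MAP = {
    "attn_out": "self_attn.o_proj",
    "attn_qkv": "self_attn.qkv_proj",
    "ffn_up": "mlp.up_proj",
    "ffn_down": "mlp.down_proj",
    "ln1": "ln1",
    "ln2": "ln2",
}

def remap_name(gguf_name: str) -> str:
    """Map a GGUF tensor name to the model.* name shown in the log."""
    # v.blk.<N>.<part>.<weight|bias> -> model.layers.<N>.<mapped part>.<weight|bias>
    m = re.match(r"v\.blk\.(\d+)\.(\w+)\.(weight|bias)$", gguf_name)
    if m:
        layer, part, kind = m.groups()
        return f"model.layers.{layer}.{PART_MAP[part]}.{kind}"
    # v.deepstack.*, v.post_ln.*, v.patch_embd.*, v.position_embd.*:
    # the "v." prefix is simply replaced with "model."
    if gguf_name.startswith("v."):
        return "model." + gguf_name[len("v."):]
    # mm.* projector tensors just gain the "model." prefix.
    return "model." + gguf_name
```

For example, `remap_name("v.blk.8.ffn_down.weight")` reproduces the log's `model.layers.8.mlp.down_proj.weight`.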
qwen3-vl-4b/model.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:3109e254938ff3d66477b10880bda5bf744bfc9be66c08755765fa5d67fad30c
+ size 8045090783
qwen3-vl-4b/out-fp16.npz ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:978c95d567adbd14e55f2703dcabac4b1148b7c722ea839ab53eb879df1be8e5
+ size 6797257649
qwen3-vl-4b/out.npz ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:fa2c56277a413cb044389d87723af357c16d2cf3e4e4cbd120e63d177d9ec3b2
+ size 2927132949
qwen3-vl-4b/scale.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:dcaf2e8164bc08707382108563f164c79a67aa315a10918eec8de7b4189e2f96
+ size 4566483
qwen3-vl-4b/smooth.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:5a4772a5bc2c0594bade56d31693cee385c522bc1773278ca9c18dbec22f14f6
+ size 2773543
qwen3-vl-4b/wgts.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:cdde16b81c020527f418e855715261a92f4aca0a994c54cbdb9dcb14f1bcbf3c
+ size 4519327