jianzongwu committed
Commit
4271c2c
1 Parent(s): 18c56fa

Upload 42 files

Files changed (42)
  1. image_generator/clip_image_encoder/config.json +23 -0
  2. image_generator/clip_image_encoder/model.safetensors +3 -0
  3. image_generator/image_proj_model/pytorch_model.bin +3 -0
  4. image_generator/magi_image_encoder/config.json +84 -0
  5. image_generator/magi_image_encoder/model.safetensors +3 -0
  6. image_generator/model_index.json +34 -0
  7. image_generator/scheduler/scheduler_config.json +18 -0
  8. image_generator/text_encoder/config.json +24 -0
  9. image_generator/text_encoder/model.safetensors +3 -0
  10. image_generator/text_encoder_2/config.json +24 -0
  11. image_generator/text_encoder_2/model.safetensors +3 -0
  12. image_generator/tokenizer/merges.txt +0 -0
  13. image_generator/tokenizer/special_tokens_map.json +24 -0
  14. image_generator/tokenizer/tokenizer_config.json +33 -0
  15. image_generator/tokenizer/vocab.json +0 -0
  16. image_generator/tokenizer_2/merges.txt +0 -0
  17. image_generator/tokenizer_2/special_tokens_map.json +24 -0
  18. image_generator/tokenizer_2/tokenizer_config.json +33 -0
  19. image_generator/tokenizer_2/vocab.json +0 -0
  20. image_generator/unet/config.json +70 -0
  21. image_generator/unet/diffsensei_unet.safetensors +3 -0
  22. image_generator/vae/config.json +32 -0
  23. image_generator/vae/diffusion_pytorch_model.safetensors +3 -0
  24. mllm/agent/pytorch_model.bin +3 -0
  25. mllm/llm/config.json +31 -0
  26. mllm/llm/generation_config.json +9 -0
  27. mllm/llm/model-00001-of-00011.safetensors +3 -0
  28. mllm/llm/model-00002-of-00011.safetensors +3 -0
  29. mllm/llm/model-00003-of-00011.safetensors +3 -0
  30. mllm/llm/model-00004-of-00011.safetensors +3 -0
  31. mllm/llm/model-00005-of-00011.safetensors +3 -0
  32. mllm/llm/model-00006-of-00011.safetensors +3 -0
  33. mllm/llm/model-00007-of-00011.safetensors +3 -0
  34. mllm/llm/model-00008-of-00011.safetensors +3 -0
  35. mllm/llm/model-00009-of-00011.safetensors +3 -0
  36. mllm/llm/model-00010-of-00011.safetensors +3 -0
  37. mllm/llm/model-00011-of-00011.safetensors +3 -0
  38. mllm/llm/model.safetensors.index.json +410 -0
  39. mllm/tokenizer/added_tokens.json +332 -0
  40. mllm/tokenizer/special_tokens_map.json +24 -0
  41. mllm/tokenizer/tokenizer.model +3 -0
  42. mllm/tokenizer/tokenizer_config.json +34 -0
image_generator/clip_image_encoder/config.json ADDED
@@ -0,0 +1,23 @@
+ {
+   "_name_or_path": "./image_encoder",
+   "architectures": [
+     "CLIPVisionModelWithProjection"
+   ],
+   "attention_dropout": 0.0,
+   "dropout": 0.0,
+   "hidden_act": "gelu",
+   "hidden_size": 1280,
+   "image_size": 224,
+   "initializer_factor": 1.0,
+   "initializer_range": 0.02,
+   "intermediate_size": 5120,
+   "layer_norm_eps": 1e-05,
+   "model_type": "clip_vision_model",
+   "num_attention_heads": 16,
+   "num_channels": 3,
+   "num_hidden_layers": 32,
+   "patch_size": 14,
+   "projection_dim": 1024,
+   "torch_dtype": "float16",
+   "transformers_version": "4.28.0.dev0"
+ }
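This is a ViT-H/14-sized CLIP vision tower (32 layers, hidden size 1280, 1024-d projection). A minimal loading sketch, assuming a local checkout of this repo at checkpoints/diffsensei (a hypothetical path; only mllm/llm/config.json below records such a prefix):

import torch
from transformers import CLIPVisionModelWithProjection

# Load the image encoder from its subfolder; dtype matches "torch_dtype": "float16".
clip_image_encoder = CLIPVisionModelWithProjection.from_pretrained(
    "checkpoints/diffsensei/image_generator/clip_image_encoder",
    torch_dtype=torch.float16,
)
# image_embeds from a forward pass are 1024-d, per "projection_dim": 1024.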
image_generator/clip_image_encoder/model.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:6ca9667da1ca9e0b0f75e46bb030f7e011f44f86cbfb8d5a36590fcd7507b030
+ size 2528373448
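The .safetensors and .bin entries in this commit are Git LFS pointer files: three lines recording the LFS spec version, the blob's sha256, and its byte size. A minimal sketch for checking a pulled blob against its pointer (paths assumed relative to the repo root):

import hashlib

def sha256_of(path: str) -> str:
    # Stream the file in 1 MiB chunks so multi-GB blobs don't load into RAM.
    h = hashlib.sha256()
    with open(path, "rb") as f:
        for chunk in iter(lambda: f.read(1 << 20), b""):
            h.update(chunk)
    return h.hexdigest()

expected = "6ca9667da1ca9e0b0f75e46bb030f7e011f44f86cbfb8d5a36590fcd7507b030"
assert sha256_of("image_generator/clip_image_encoder/model.safetensors") == expected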
image_generator/image_proj_model/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:e5620c45d343deb1ac090419de50f87c51af77b85890adfa06318ed195949aa3
+ size 335934224
image_generator/magi_image_encoder/config.json ADDED
@@ -0,0 +1,84 @@
+ {
+   "_name_or_path": "checkpoints/vit-mae-base",
+   "add_cross_attention": false,
+   "architectures": [
+     "ViTMAEForPreTraining"
+   ],
+   "attention_probs_dropout_prob": 0.0,
+   "bad_words_ids": null,
+   "begin_suppress_tokens": null,
+   "bos_token_id": null,
+   "chunk_size_feed_forward": 0,
+   "cross_attention_hidden_size": null,
+   "decoder_hidden_size": 512,
+   "decoder_intermediate_size": 2048,
+   "decoder_num_attention_heads": 16,
+   "decoder_num_hidden_layers": 8,
+   "decoder_start_token_id": null,
+   "diversity_penalty": 0.0,
+   "do_sample": false,
+   "early_stopping": false,
+   "encoder_no_repeat_ngram_size": 0,
+   "eos_token_id": null,
+   "exponential_decay_length_penalty": null,
+   "finetuning_task": null,
+   "forced_bos_token_id": null,
+   "forced_eos_token_id": null,
+   "hidden_act": "gelu",
+   "hidden_dropout_prob": 0.0,
+   "hidden_size": 768,
+   "id2label": {
+     "0": "LABEL_0",
+     "1": "LABEL_1"
+   },
+   "image_size": 224,
+   "initializer_range": 0.02,
+   "intermediate_size": 3072,
+   "is_decoder": false,
+   "is_encoder_decoder": false,
+   "label2id": {
+     "LABEL_0": 0,
+     "LABEL_1": 1
+   },
+   "layer_norm_eps": 1e-12,
+   "length_penalty": 1.0,
+   "mask_ratio": 0.75,
+   "max_length": 20,
+   "min_length": 0,
+   "model_type": "",
+   "no_repeat_ngram_size": 0,
+   "norm_pix_loss": false,
+   "num_attention_heads": 12,
+   "num_beam_groups": 1,
+   "num_beams": 1,
+   "num_channels": 3,
+   "num_hidden_layers": 12,
+   "num_return_sequences": 1,
+   "output_attentions": false,
+   "output_hidden_states": false,
+   "output_scores": false,
+   "pad_token_id": null,
+   "patch_size": 16,
+   "prefix": null,
+   "problem_type": null,
+   "pruned_heads": {},
+   "qkv_bias": true,
+   "remove_invalid_values": false,
+   "repetition_penalty": 1.0,
+   "return_dict": true,
+   "return_dict_in_generate": false,
+   "sep_token_id": null,
+   "suppress_tokens": null,
+   "task_specific_params": null,
+   "temperature": 1.0,
+   "tf_legacy_loss": false,
+   "tie_encoder_decoder": false,
+   "tie_word_embeddings": true,
+   "tokenizer_class": null,
+   "top_k": 50,
+   "top_p": 1.0,
+   "torch_dtype": "float32",
+   "torchscript": false,
+   "typical_p": 1.0,
+   "use_bfloat16": false
+ }
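Per "_name_or_path", this is a vit-mae-base encoder (the Magi character image encoder). Note the empty "model_type", which can trip up the Auto* classes, so a sketch would load the concrete ViT-MAE class directly (same assumed local checkout as above; transformers may warn about the blank model_type):

from transformers import ViTMAEModel

magi_image_encoder = ViTMAEModel.from_pretrained(
    "checkpoints/diffsensei/image_generator/magi_image_encoder"
)
# 12 layers, hidden size 768, 16x16 patches, per the config above.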
image_generator/magi_image_encoder/model.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:a64913540d219494187ec8ed6716a99bd8b050f33118087f1537d36c22f5ef74
+ size 343216848
image_generator/model_index.json ADDED
@@ -0,0 +1,34 @@
+ {
+   "_class_name": "StableDiffusionXLPipeline",
+   "_diffusers_version": "0.19.0.dev0",
+   "force_zeros_for_empty_prompt": true,
+   "add_watermarker": null,
+   "scheduler": [
+     "diffusers",
+     "EulerDiscreteScheduler"
+   ],
+   "text_encoder": [
+     "transformers",
+     "CLIPTextModel"
+   ],
+   "text_encoder_2": [
+     "transformers",
+     "CLIPTextModelWithProjection"
+   ],
+   "tokenizer": [
+     "transformers",
+     "CLIPTokenizer"
+   ],
+   "tokenizer_2": [
+     "transformers",
+     "CLIPTokenizer"
+   ],
+   "unet": [
+     "diffusers",
+     "UNet2DConditionModel"
+   ],
+   "vae": [
+     "diffusers",
+     "AutoencoderKL"
+   ]
+ }
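model_index.json makes image_generator/ loadable as a stock SDXL pipeline. One caveat: the unet weights below ship as diffsensei_unet.safetensors rather than the default diffusion_pytorch_model.safetensors, so a plain from_pretrained may not find them. A minimal sketch under the same assumed local checkout, passing the unet in as an override (see the unet section below for building it from the renamed weights):

import torch
from diffusers import StableDiffusionXLPipeline

pipe = StableDiffusionXLPipeline.from_pretrained(
    "checkpoints/diffsensei/image_generator",  # assumed local checkout
    unet=unet,  # built separately; see the sketch after unet/config.json
    torch_dtype=torch.float16,
)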
image_generator/scheduler/scheduler_config.json ADDED
@@ -0,0 +1,18 @@
+ {
+   "_class_name": "EulerDiscreteScheduler",
+   "_diffusers_version": "0.19.0.dev0",
+   "beta_end": 0.012,
+   "beta_schedule": "scaled_linear",
+   "beta_start": 0.00085,
+   "clip_sample": false,
+   "interpolation_type": "linear",
+   "num_train_timesteps": 1000,
+   "prediction_type": "epsilon",
+   "sample_max_value": 1.0,
+   "set_alpha_to_one": false,
+   "skip_prk_steps": true,
+   "steps_offset": 1,
+   "timestep_spacing": "leading",
+   "trained_betas": null,
+   "use_karras_sigmas": false
+ }
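The scheduler is fully determined by this config; a minimal sketch rebuilding it and preparing a 30-step schedule (same assumed local checkout):

from diffusers import EulerDiscreteScheduler

scheduler = EulerDiscreteScheduler.from_pretrained(
    "checkpoints/diffsensei/image_generator",
    subfolder="scheduler",
)
# 30 inference steps drawn from 1000 training timesteps with "leading" spacing.
scheduler.set_timesteps(30)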
image_generator/text_encoder/config.json ADDED
@@ -0,0 +1,24 @@
+ {
+   "architectures": [
+     "CLIPTextModel"
+   ],
+   "attention_dropout": 0.0,
+   "bos_token_id": 0,
+   "dropout": 0.0,
+   "eos_token_id": 2,
+   "hidden_act": "quick_gelu",
+   "hidden_size": 768,
+   "initializer_factor": 1.0,
+   "initializer_range": 0.02,
+   "intermediate_size": 3072,
+   "layer_norm_eps": 1e-05,
+   "max_position_embeddings": 77,
+   "model_type": "clip_text_model",
+   "num_attention_heads": 12,
+   "num_hidden_layers": 12,
+   "pad_token_id": 1,
+   "projection_dim": 768,
+   "torch_dtype": "float16",
+   "transformers_version": "4.32.0.dev0",
+   "vocab_size": 49408
+ }
image_generator/text_encoder/model.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:5c3d6454dd2d23414b56aa1b5858a72487a656937847b6fea8d0606d7a42cdbc
+ size 492265168
image_generator/text_encoder_2/config.json ADDED
@@ -0,0 +1,24 @@
+ {
+   "architectures": [
+     "CLIPTextModelWithProjection"
+   ],
+   "attention_dropout": 0.0,
+   "bos_token_id": 0,
+   "dropout": 0.0,
+   "eos_token_id": 2,
+   "hidden_act": "gelu",
+   "hidden_size": 1280,
+   "initializer_factor": 1.0,
+   "initializer_range": 0.02,
+   "intermediate_size": 5120,
+   "layer_norm_eps": 1e-05,
+   "max_position_embeddings": 77,
+   "model_type": "clip_text_model",
+   "num_attention_heads": 20,
+   "num_hidden_layers": 32,
+   "pad_token_id": 1,
+   "projection_dim": 1280,
+   "torch_dtype": "float16",
+   "transformers_version": "4.32.0.dev0",
+   "vocab_size": 49408
+ }
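The two text encoders follow the usual SDXL split: a ViT-L-sized encoder (hidden 768) and a bigG-sized encoder with projection (hidden 1280). A minimal sketch loading both from this layout (same assumed local checkout):

from transformers import CLIPTextModel, CLIPTextModelWithProjection

text_encoder = CLIPTextModel.from_pretrained(
    "checkpoints/diffsensei/image_generator/text_encoder"
)
text_encoder_2 = CLIPTextModelWithProjection.from_pretrained(
    "checkpoints/diffsensei/image_generator/text_encoder_2"
)
# Their hidden states (768 + 1280) concatenate to the unet's
# cross_attention_dim of 2048 (see image_generator/unet/config.json below).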
image_generator/text_encoder_2/model.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:3a6032f63d37ae02bbc74ccd6a27440578cd71701f96532229d0154f55a8d3ff
+ size 2778702264
image_generator/tokenizer/merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
image_generator/tokenizer/special_tokens_map.json ADDED
@@ -0,0 +1,24 @@
+ {
+   "bos_token": {
+     "content": "<|startoftext|>",
+     "lstrip": false,
+     "normalized": true,
+     "rstrip": false,
+     "single_word": false
+   },
+   "eos_token": {
+     "content": "<|endoftext|>",
+     "lstrip": false,
+     "normalized": true,
+     "rstrip": false,
+     "single_word": false
+   },
+   "pad_token": "<|endoftext|>",
+   "unk_token": {
+     "content": "<|endoftext|>",
+     "lstrip": false,
+     "normalized": true,
+     "rstrip": false,
+     "single_word": false
+   }
+ }
image_generator/tokenizer/tokenizer_config.json ADDED
@@ -0,0 +1,33 @@
+ {
+   "add_prefix_space": false,
+   "bos_token": {
+     "__type": "AddedToken",
+     "content": "<|startoftext|>",
+     "lstrip": false,
+     "normalized": true,
+     "rstrip": false,
+     "single_word": false
+   },
+   "clean_up_tokenization_spaces": true,
+   "do_lower_case": true,
+   "eos_token": {
+     "__type": "AddedToken",
+     "content": "<|endoftext|>",
+     "lstrip": false,
+     "normalized": true,
+     "rstrip": false,
+     "single_word": false
+   },
+   "errors": "replace",
+   "model_max_length": 77,
+   "pad_token": "<|endoftext|>",
+   "tokenizer_class": "CLIPTokenizer",
+   "unk_token": {
+     "__type": "AddedToken",
+     "content": "<|endoftext|>",
+     "lstrip": false,
+     "normalized": true,
+     "rstrip": false,
+     "single_word": false
+   }
+ }
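Both tokenizers are standard CLIP BPE tokenizers capped at 77 tokens; they differ only in pad_token ("<|endoftext|>" here; tokenizer_2 below uses "!"). A minimal sketch (same assumed local checkout):

from transformers import CLIPTokenizer

tokenizer = CLIPTokenizer.from_pretrained(
    "checkpoints/diffsensei/image_generator/tokenizer"
)
# Pad to the full 77-token context, as SDXL's text encoders expect.
ids = tokenizer("a manga panel", padding="max_length", max_length=77).input_ids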
image_generator/tokenizer/vocab.json ADDED
The diff for this file is too large to render. See raw diff
 
image_generator/tokenizer_2/merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
image_generator/tokenizer_2/special_tokens_map.json ADDED
@@ -0,0 +1,24 @@
+ {
+   "bos_token": {
+     "content": "<|startoftext|>",
+     "lstrip": false,
+     "normalized": true,
+     "rstrip": false,
+     "single_word": false
+   },
+   "eos_token": {
+     "content": "<|endoftext|>",
+     "lstrip": false,
+     "normalized": true,
+     "rstrip": false,
+     "single_word": false
+   },
+   "pad_token": "!",
+   "unk_token": {
+     "content": "<|endoftext|>",
+     "lstrip": false,
+     "normalized": true,
+     "rstrip": false,
+     "single_word": false
+   }
+ }
image_generator/tokenizer_2/tokenizer_config.json ADDED
@@ -0,0 +1,33 @@
+ {
+   "add_prefix_space": false,
+   "bos_token": {
+     "__type": "AddedToken",
+     "content": "<|startoftext|>",
+     "lstrip": false,
+     "normalized": true,
+     "rstrip": false,
+     "single_word": false
+   },
+   "clean_up_tokenization_spaces": true,
+   "do_lower_case": true,
+   "eos_token": {
+     "__type": "AddedToken",
+     "content": "<|endoftext|>",
+     "lstrip": false,
+     "normalized": true,
+     "rstrip": false,
+     "single_word": false
+   },
+   "errors": "replace",
+   "model_max_length": 77,
+   "pad_token": "!",
+   "tokenizer_class": "CLIPTokenizer",
+   "unk_token": {
+     "__type": "AddedToken",
+     "content": "<|endoftext|>",
+     "lstrip": false,
+     "normalized": true,
+     "rstrip": false,
+     "single_word": false
+   }
+ }
image_generator/tokenizer_2/vocab.json ADDED
The diff for this file is too large to render. See raw diff
 
image_generator/unet/config.json ADDED
@@ -0,0 +1,70 @@
+ {
+   "_class_name": "UNet2DConditionModel",
+   "_diffusers_version": "0.19.0.dev0",
+   "act_fn": "silu",
+   "addition_embed_type": "text_time",
+   "addition_embed_type_num_heads": 64,
+   "addition_time_embed_dim": 256,
+   "attention_head_dim": [
+     5,
+     10,
+     20
+   ],
+   "block_out_channels": [
+     320,
+     640,
+     1280
+   ],
+   "center_input_sample": false,
+   "class_embed_type": null,
+   "class_embeddings_concat": false,
+   "conv_in_kernel": 3,
+   "conv_out_kernel": 3,
+   "cross_attention_dim": 2048,
+   "cross_attention_norm": null,
+   "down_block_types": [
+     "DownBlock2D",
+     "CrossAttnDownBlock2D",
+     "CrossAttnDownBlock2D"
+   ],
+   "downsample_padding": 1,
+   "dual_cross_attention": false,
+   "encoder_hid_dim": null,
+   "encoder_hid_dim_type": null,
+   "flip_sin_to_cos": true,
+   "freq_shift": 0,
+   "in_channels": 4,
+   "layers_per_block": 2,
+   "mid_block_only_cross_attention": null,
+   "mid_block_scale_factor": 1,
+   "mid_block_type": "UNetMidBlock2DCrossAttn",
+   "norm_eps": 1e-05,
+   "norm_num_groups": 32,
+   "num_attention_heads": null,
+   "num_class_embeds": null,
+   "only_cross_attention": false,
+   "out_channels": 4,
+   "projection_class_embeddings_input_dim": 2816,
+   "resnet_out_scale_factor": 1.0,
+   "resnet_skip_time_act": false,
+   "resnet_time_scale_shift": "default",
+   "sample_size": 128,
+   "time_cond_proj_dim": null,
+   "time_embedding_act_fn": null,
+   "time_embedding_dim": null,
+   "time_embedding_type": "positional",
+   "timestep_post_act": null,
+   "transformer_layers_per_block": [
+     1,
+     2,
+     10
+   ],
+   "up_block_types": [
+     "CrossAttnUpBlock2D",
+     "CrossAttnUpBlock2D",
+     "UpBlock2D"
+   ],
+   "upcast_attention": null,
+   "use_linear_projection": true
+ }
+
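Because the weights ship under the non-default name diffsensei_unet.safetensors, a sketch that builds the unet from this config and loads the state dict explicitly (same assumed local checkout; strict=False hedges for any DiffSensei-specific attention weights beyond the base SDXL config):

import torch
from diffusers import UNet2DConditionModel
from safetensors.torch import load_file

unet_dir = "checkpoints/diffsensei/image_generator/unet"
# Instantiate from config.json, then load the renamed weight file by hand.
unet = UNet2DConditionModel.from_config(UNet2DConditionModel.load_config(unet_dir))
state = load_file(f"{unet_dir}/diffsensei_unet.safetensors")
missing, unexpected = unet.load_state_dict(state, strict=False)
unet = unet.to(torch.float16)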
image_generator/unet/diffsensei_unet.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:f5b715d2d9405739999039ef474e28ce6991d7bf8f169186114d97adb8dca630
+ size 11633249944
image_generator/vae/config.json ADDED
@@ -0,0 +1,32 @@
+ {
+   "_class_name": "AutoencoderKL",
+   "_diffusers_version": "0.20.0.dev0",
+   "_name_or_path": "../sdxl-vae/",
+   "act_fn": "silu",
+   "block_out_channels": [
+     128,
+     256,
+     512,
+     512
+   ],
+   "down_block_types": [
+     "DownEncoderBlock2D",
+     "DownEncoderBlock2D",
+     "DownEncoderBlock2D",
+     "DownEncoderBlock2D"
+   ],
+   "force_upcast": true,
+   "in_channels": 3,
+   "latent_channels": 4,
+   "layers_per_block": 2,
+   "norm_num_groups": 32,
+   "out_channels": 3,
+   "sample_size": 1024,
+   "scaling_factor": 0.13025,
+   "up_block_types": [
+     "UpDecoderBlock2D",
+     "UpDecoderBlock2D",
+     "UpDecoderBlock2D",
+     "UpDecoderBlock2D"
+   ]
+ }
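This is the stock SDXL VAE (scaling_factor 0.13025, 8x downsampling from 1024-pixel samples to 128x128 latents). A minimal decoding sketch (same assumed local checkout; the random latents stand in for denoised unet output):

import torch
from diffusers import AutoencoderKL

vae = AutoencoderKL.from_pretrained("checkpoints/diffsensei/image_generator/vae")
latents = torch.randn(1, 4, 128, 128)  # 4 latent channels, 1024 / 8 spatial
with torch.no_grad():
    # Undo the latent scaling before decoding, per diffusers convention.
    image = vae.decode(latents / vae.config.scaling_factor).sample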
image_generator/vae/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:1598f3d24932bcfe6634e8b618ea1e30ab1d57f5aad13a6d2de446d2199f2341
+ size 334643268
mllm/agent/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:9b3fff6d4968d9a192a8b4476bf3f65a5fbe930e55c280649a943a33202da50d
+ size 574332016
mllm/llm/config.json ADDED
@@ -0,0 +1,31 @@
+ {
+   "_name_or_path": "checkpoints/diffsensei/mllm/llm",
+   "architectures": [
+     "LlamaForCausalLM"
+   ],
+   "attention_bias": false,
+   "attention_dropout": 0.0,
+   "bos_token_id": 1,
+   "eos_token_id": 2,
+   "head_dim": 128,
+   "hidden_act": "silu",
+   "hidden_size": 5120,
+   "initializer_range": 0.02,
+   "intermediate_size": 13824,
+   "max_position_embeddings": 2048,
+   "mlp_bias": false,
+   "model_type": "llama",
+   "num_attention_heads": 40,
+   "num_hidden_layers": 40,
+   "num_key_value_heads": 40,
+   "pad_token_id": 0,
+   "pretraining_tp": 1,
+   "rms_norm_eps": 1e-05,
+   "rope_scaling": null,
+   "rope_theta": 10000.0,
+   "tie_word_embeddings": false,
+   "torch_dtype": "float32",
+   "transformers_version": "4.45.2",
+   "use_cache": true,
+   "vocab_size": 32330
+ }
mllm/llm/generation_config.json ADDED
@@ -0,0 +1,9 @@
+ {
+   "_from_model_config": true,
+   "bos_token_id": 1,
+   "eos_token_id": 2,
+   "pad_token_id": 0,
+   "temperature": 0.9,
+   "top_p": 0.6,
+   "transformers_version": "4.45.2"
+ }
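The LLM is a LLaMA-style 13B-class model (40 layers, hidden size 5120, vocab extended to 32330 for the added tokens below). The index file after the shards lets transformers resolve all eleven of them automatically; a minimal sketch (same assumed local checkout; the float32 weights total ~52 GB, so halving the dtype is the pragmatic default for inference):

import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("checkpoints/diffsensei/mllm/tokenizer")
llm = AutoModelForCausalLM.from_pretrained(
    "checkpoints/diffsensei/mllm/llm",
    torch_dtype=torch.float16,
)
# generation_config.json above supplies temperature=0.9 and top_p=0.6,
# which take effect when generate() is called with do_sample=True.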
mllm/llm/model-00001-of-00011.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:d905c280ae7f88642fe72152edf6c89b6371e9323bda028da065c29cd155c0c9
+ size 4888007736
mllm/llm/model-00002-of-00011.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:01ecd53547d8eb4b6d4e7b66fd9ad8a06413be551b0b287194bf59e8255c36cf
+ size 4970419224
mllm/llm/model-00003-of-00011.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:9f46b554fc1a8b263678319445c1fb5d3607aa17c92bba1a34583d6784c80bfd
+ size 4970419608
mllm/llm/model-00004-of-00011.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:594ecad28d8c3d4d45d53634caa890487e9e3fec0621e3865c4488580811e693
+ size 4970419632
mllm/llm/model-00005-of-00011.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:8644d993edf4b955e3ee8e340c2c0a16fc75c3a3e0c380e0e5ca22ebb4d89f6a
+ size 4970419632
mllm/llm/model-00006-of-00011.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:49dd56edadd559d3007129ac7c5f84dfd4c018e899f5f3415610417018f5d5b1
+ size 4792120528
mllm/llm/model-00007-of-00011.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:53e3286378ee51b9e70d671341bbe2e2d3f8e0553bc23b8a98ea02ceff45087a
+ size 4792161712
mllm/llm/model-00008-of-00011.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:d118a0ddd4d84efff4c11d9e87732e6de84a928cf691e69032c494ded0930e40
+ size 4792161712
mllm/llm/model-00009-of-00011.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:5ce15d5270fd141ca3ac6b825d88fc2674ab41e138324ebe6541a28099a4fd90
+ size 4970419264
mllm/llm/model-00010-of-00011.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:7a8ed033aa0e45c32cb4ff5d606b39908a593b73d0b2c279fdc19c34f76b7b26
+ size 4970419632
mllm/llm/model-00011-of-00011.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:98f3a2e11569fbe313f430111f46a08eff47b58c18ffda835ed5ae5276740928
+ size 2990062328
mllm/llm/model.safetensors.index.json ADDED
@@ -0,0 +1,410 @@
+ {
+   "metadata": {
+     "total_size": 52076984320
+   },
+   "weight_map": {
+     "lm_head.weight": "model-00011-of-00011.safetensors",
+     "model.embed_tokens.weight": "model-00001-of-00011.safetensors",
+     "model.layers.0.input_layernorm.weight": "model-00001-of-00011.safetensors",
+     "model.layers.0.mlp.down_proj.weight": "model-00001-of-00011.safetensors",
+     "model.layers.0.mlp.gate_proj.weight": "model-00001-of-00011.safetensors",
+     "model.layers.0.mlp.up_proj.weight": "model-00001-of-00011.safetensors",
+     "model.layers.0.post_attention_layernorm.weight": "model-00001-of-00011.safetensors",
+     "model.layers.0.self_attn.k_proj.weight": "model-00001-of-00011.safetensors",
+     "model.layers.0.self_attn.o_proj.weight": "model-00001-of-00011.safetensors",
+     "model.layers.0.self_attn.q_proj.weight": "model-00001-of-00011.safetensors",
+     "model.layers.0.self_attn.rotary_emb.inv_freq": "model-00001-of-00011.safetensors",
+     "model.layers.0.self_attn.v_proj.weight": "model-00001-of-00011.safetensors",
+     "model.layers.1.input_layernorm.weight": "model-00001-of-00011.safetensors",
+     "model.layers.1.mlp.down_proj.weight": "model-00001-of-00011.safetensors",
+     "model.layers.1.mlp.gate_proj.weight": "model-00001-of-00011.safetensors",
+     "model.layers.1.mlp.up_proj.weight": "model-00001-of-00011.safetensors",
+     "model.layers.1.post_attention_layernorm.weight": "model-00001-of-00011.safetensors",
+     "model.layers.1.self_attn.k_proj.weight": "model-00001-of-00011.safetensors",
+     "model.layers.1.self_attn.o_proj.weight": "model-00001-of-00011.safetensors",
+     "model.layers.1.self_attn.q_proj.weight": "model-00001-of-00011.safetensors",
+     "model.layers.1.self_attn.rotary_emb.inv_freq": "model-00001-of-00011.safetensors",
+     "model.layers.1.self_attn.v_proj.weight": "model-00001-of-00011.safetensors",
+     "model.layers.10.input_layernorm.weight": "model-00003-of-00011.safetensors",
+     "model.layers.10.mlp.down_proj.weight": "model-00003-of-00011.safetensors",
+     "model.layers.10.mlp.gate_proj.weight": "model-00003-of-00011.safetensors",
+     "model.layers.10.mlp.up_proj.weight": "model-00003-of-00011.safetensors",
+     "model.layers.10.post_attention_layernorm.weight": "model-00003-of-00011.safetensors",
+     "model.layers.10.self_attn.k_proj.weight": "model-00003-of-00011.safetensors",
+     "model.layers.10.self_attn.o_proj.weight": "model-00003-of-00011.safetensors",
+     "model.layers.10.self_attn.q_proj.weight": "model-00003-of-00011.safetensors",
+     "model.layers.10.self_attn.rotary_emb.inv_freq": "model-00003-of-00011.safetensors",
+     "model.layers.10.self_attn.v_proj.weight": "model-00003-of-00011.safetensors",
+     "model.layers.11.input_layernorm.weight": "model-00004-of-00011.safetensors",
+     "model.layers.11.mlp.down_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.11.mlp.gate_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.11.mlp.up_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.11.post_attention_layernorm.weight": "model-00004-of-00011.safetensors",
+     "model.layers.11.self_attn.k_proj.weight": "model-00003-of-00011.safetensors",
+     "model.layers.11.self_attn.o_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.11.self_attn.q_proj.weight": "model-00003-of-00011.safetensors",
+     "model.layers.11.self_attn.rotary_emb.inv_freq": "model-00004-of-00011.safetensors",
+     "model.layers.11.self_attn.v_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.12.input_layernorm.weight": "model-00004-of-00011.safetensors",
+     "model.layers.12.mlp.down_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.12.mlp.gate_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.12.mlp.up_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.12.post_attention_layernorm.weight": "model-00004-of-00011.safetensors",
+     "model.layers.12.self_attn.k_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.12.self_attn.o_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.12.self_attn.q_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.12.self_attn.rotary_emb.inv_freq": "model-00004-of-00011.safetensors",
+     "model.layers.12.self_attn.v_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.13.input_layernorm.weight": "model-00004-of-00011.safetensors",
+     "model.layers.13.mlp.down_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.13.mlp.gate_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.13.mlp.up_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.13.post_attention_layernorm.weight": "model-00004-of-00011.safetensors",
+     "model.layers.13.self_attn.k_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.13.self_attn.o_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.13.self_attn.q_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.13.self_attn.rotary_emb.inv_freq": "model-00004-of-00011.safetensors",
+     "model.layers.13.self_attn.v_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.14.input_layernorm.weight": "model-00004-of-00011.safetensors",
+     "model.layers.14.mlp.down_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.14.mlp.gate_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.14.mlp.up_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.14.post_attention_layernorm.weight": "model-00004-of-00011.safetensors",
+     "model.layers.14.self_attn.k_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.14.self_attn.o_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.14.self_attn.q_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.14.self_attn.rotary_emb.inv_freq": "model-00004-of-00011.safetensors",
+     "model.layers.14.self_attn.v_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.15.input_layernorm.weight": "model-00005-of-00011.safetensors",
+     "model.layers.15.mlp.down_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.15.mlp.gate_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.15.mlp.up_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.15.post_attention_layernorm.weight": "model-00005-of-00011.safetensors",
+     "model.layers.15.self_attn.k_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.15.self_attn.o_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.15.self_attn.q_proj.weight": "model-00004-of-00011.safetensors",
+     "model.layers.15.self_attn.rotary_emb.inv_freq": "model-00005-of-00011.safetensors",
+     "model.layers.15.self_attn.v_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.16.input_layernorm.weight": "model-00005-of-00011.safetensors",
+     "model.layers.16.mlp.down_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.16.mlp.gate_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.16.mlp.up_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.16.post_attention_layernorm.weight": "model-00005-of-00011.safetensors",
+     "model.layers.16.self_attn.k_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.16.self_attn.o_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.16.self_attn.q_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.16.self_attn.rotary_emb.inv_freq": "model-00005-of-00011.safetensors",
+     "model.layers.16.self_attn.v_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.17.input_layernorm.weight": "model-00005-of-00011.safetensors",
+     "model.layers.17.mlp.down_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.17.mlp.gate_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.17.mlp.up_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.17.post_attention_layernorm.weight": "model-00005-of-00011.safetensors",
+     "model.layers.17.self_attn.k_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.17.self_attn.o_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.17.self_attn.q_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.17.self_attn.rotary_emb.inv_freq": "model-00005-of-00011.safetensors",
+     "model.layers.17.self_attn.v_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.18.input_layernorm.weight": "model-00005-of-00011.safetensors",
+     "model.layers.18.mlp.down_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.18.mlp.gate_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.18.mlp.up_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.18.post_attention_layernorm.weight": "model-00005-of-00011.safetensors",
+     "model.layers.18.self_attn.k_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.18.self_attn.o_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.18.self_attn.q_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.18.self_attn.rotary_emb.inv_freq": "model-00005-of-00011.safetensors",
+     "model.layers.18.self_attn.v_proj.weight": "model-00005-of-00011.safetensors",
+     "model.layers.19.input_layernorm.weight": "model-00006-of-00011.safetensors",
+     "model.layers.19.mlp.down_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.19.mlp.gate_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.19.mlp.up_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.19.post_attention_layernorm.weight": "model-00006-of-00011.safetensors",
+     "model.layers.19.self_attn.k_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.19.self_attn.o_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.19.self_attn.q_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.19.self_attn.rotary_emb.inv_freq": "model-00006-of-00011.safetensors",
+     "model.layers.19.self_attn.v_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.2.input_layernorm.weight": "model-00001-of-00011.safetensors",
+     "model.layers.2.mlp.down_proj.weight": "model-00001-of-00011.safetensors",
+     "model.layers.2.mlp.gate_proj.weight": "model-00001-of-00011.safetensors",
+     "model.layers.2.mlp.up_proj.weight": "model-00001-of-00011.safetensors",
+     "model.layers.2.post_attention_layernorm.weight": "model-00001-of-00011.safetensors",
+     "model.layers.2.self_attn.k_proj.weight": "model-00001-of-00011.safetensors",
+     "model.layers.2.self_attn.o_proj.weight": "model-00001-of-00011.safetensors",
+     "model.layers.2.self_attn.q_proj.weight": "model-00001-of-00011.safetensors",
+     "model.layers.2.self_attn.rotary_emb.inv_freq": "model-00001-of-00011.safetensors",
+     "model.layers.2.self_attn.v_proj.weight": "model-00001-of-00011.safetensors",
+     "model.layers.20.input_layernorm.weight": "model-00006-of-00011.safetensors",
+     "model.layers.20.mlp.down_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.20.mlp.gate_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.20.mlp.up_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.20.post_attention_layernorm.weight": "model-00006-of-00011.safetensors",
+     "model.layers.20.self_attn.k_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.20.self_attn.o_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.20.self_attn.q_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.20.self_attn.rotary_emb.inv_freq": "model-00006-of-00011.safetensors",
+     "model.layers.20.self_attn.v_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.21.input_layernorm.weight": "model-00006-of-00011.safetensors",
+     "model.layers.21.mlp.down_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.21.mlp.gate_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.21.mlp.up_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.21.post_attention_layernorm.weight": "model-00006-of-00011.safetensors",
+     "model.layers.21.self_attn.k_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.21.self_attn.o_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.21.self_attn.q_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.21.self_attn.rotary_emb.inv_freq": "model-00006-of-00011.safetensors",
+     "model.layers.21.self_attn.v_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.22.input_layernorm.weight": "model-00007-of-00011.safetensors",
+     "model.layers.22.mlp.down_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.22.mlp.gate_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.22.mlp.up_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.22.post_attention_layernorm.weight": "model-00007-of-00011.safetensors",
+     "model.layers.22.self_attn.k_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.22.self_attn.o_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.22.self_attn.q_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.22.self_attn.rotary_emb.inv_freq": "model-00006-of-00011.safetensors",
+     "model.layers.22.self_attn.v_proj.weight": "model-00006-of-00011.safetensors",
+     "model.layers.23.input_layernorm.weight": "model-00007-of-00011.safetensors",
+     "model.layers.23.mlp.down_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.23.mlp.gate_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.23.mlp.up_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.23.post_attention_layernorm.weight": "model-00007-of-00011.safetensors",
+     "model.layers.23.self_attn.k_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.23.self_attn.o_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.23.self_attn.q_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.23.self_attn.rotary_emb.inv_freq": "model-00007-of-00011.safetensors",
+     "model.layers.23.self_attn.v_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.24.input_layernorm.weight": "model-00007-of-00011.safetensors",
+     "model.layers.24.mlp.down_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.24.mlp.gate_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.24.mlp.up_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.24.post_attention_layernorm.weight": "model-00007-of-00011.safetensors",
+     "model.layers.24.self_attn.k_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.24.self_attn.o_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.24.self_attn.q_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.24.self_attn.rotary_emb.inv_freq": "model-00007-of-00011.safetensors",
+     "model.layers.24.self_attn.v_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.25.input_layernorm.weight": "model-00007-of-00011.safetensors",
+     "model.layers.25.mlp.down_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.25.mlp.gate_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.25.mlp.up_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.25.post_attention_layernorm.weight": "model-00007-of-00011.safetensors",
+     "model.layers.25.self_attn.k_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.25.self_attn.o_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.25.self_attn.q_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.25.self_attn.rotary_emb.inv_freq": "model-00007-of-00011.safetensors",
+     "model.layers.25.self_attn.v_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.26.input_layernorm.weight": "model-00008-of-00011.safetensors",
+     "model.layers.26.mlp.down_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.26.mlp.gate_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.26.mlp.up_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.26.post_attention_layernorm.weight": "model-00008-of-00011.safetensors",
+     "model.layers.26.self_attn.k_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.26.self_attn.o_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.26.self_attn.q_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.26.self_attn.rotary_emb.inv_freq": "model-00007-of-00011.safetensors",
+     "model.layers.26.self_attn.v_proj.weight": "model-00007-of-00011.safetensors",
+     "model.layers.27.input_layernorm.weight": "model-00008-of-00011.safetensors",
+     "model.layers.27.mlp.down_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.27.mlp.gate_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.27.mlp.up_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.27.post_attention_layernorm.weight": "model-00008-of-00011.safetensors",
+     "model.layers.27.self_attn.k_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.27.self_attn.o_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.27.self_attn.q_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.27.self_attn.rotary_emb.inv_freq": "model-00008-of-00011.safetensors",
+     "model.layers.27.self_attn.v_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.28.input_layernorm.weight": "model-00008-of-00011.safetensors",
+     "model.layers.28.mlp.down_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.28.mlp.gate_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.28.mlp.up_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.28.post_attention_layernorm.weight": "model-00008-of-00011.safetensors",
+     "model.layers.28.self_attn.k_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.28.self_attn.o_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.28.self_attn.q_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.28.self_attn.rotary_emb.inv_freq": "model-00008-of-00011.safetensors",
+     "model.layers.28.self_attn.v_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.29.input_layernorm.weight": "model-00008-of-00011.safetensors",
+     "model.layers.29.mlp.down_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.29.mlp.gate_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.29.mlp.up_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.29.post_attention_layernorm.weight": "model-00008-of-00011.safetensors",
+     "model.layers.29.self_attn.k_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.29.self_attn.o_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.29.self_attn.q_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.29.self_attn.rotary_emb.inv_freq": "model-00008-of-00011.safetensors",
+     "model.layers.29.self_attn.v_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.3.input_layernorm.weight": "model-00002-of-00011.safetensors",
+     "model.layers.3.mlp.down_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.3.mlp.gate_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.3.mlp.up_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.3.post_attention_layernorm.weight": "model-00002-of-00011.safetensors",
+     "model.layers.3.self_attn.k_proj.weight": "model-00001-of-00011.safetensors",
+     "model.layers.3.self_attn.o_proj.weight": "model-00001-of-00011.safetensors",
+     "model.layers.3.self_attn.q_proj.weight": "model-00001-of-00011.safetensors",
+     "model.layers.3.self_attn.rotary_emb.inv_freq": "model-00001-of-00011.safetensors",
+     "model.layers.3.self_attn.v_proj.weight": "model-00001-of-00011.safetensors",
+     "model.layers.30.input_layernorm.weight": "model-00009-of-00011.safetensors",
+     "model.layers.30.mlp.down_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.30.mlp.gate_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.30.mlp.up_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.30.post_attention_layernorm.weight": "model-00009-of-00011.safetensors",
+     "model.layers.30.self_attn.k_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.30.self_attn.o_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.30.self_attn.q_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.30.self_attn.rotary_emb.inv_freq": "model-00008-of-00011.safetensors",
+     "model.layers.30.self_attn.v_proj.weight": "model-00008-of-00011.safetensors",
+     "model.layers.31.input_layernorm.weight": "model-00009-of-00011.safetensors",
+     "model.layers.31.mlp.down_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.31.mlp.gate_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.31.mlp.up_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.31.post_attention_layernorm.weight": "model-00009-of-00011.safetensors",
+     "model.layers.31.self_attn.k_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.31.self_attn.o_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.31.self_attn.q_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.31.self_attn.rotary_emb.inv_freq": "model-00009-of-00011.safetensors",
+     "model.layers.31.self_attn.v_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.32.input_layernorm.weight": "model-00009-of-00011.safetensors",
+     "model.layers.32.mlp.down_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.32.mlp.gate_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.32.mlp.up_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.32.post_attention_layernorm.weight": "model-00009-of-00011.safetensors",
+     "model.layers.32.self_attn.k_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.32.self_attn.o_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.32.self_attn.q_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.32.self_attn.rotary_emb.inv_freq": "model-00009-of-00011.safetensors",
+     "model.layers.32.self_attn.v_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.33.input_layernorm.weight": "model-00009-of-00011.safetensors",
+     "model.layers.33.mlp.down_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.33.mlp.gate_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.33.mlp.up_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.33.post_attention_layernorm.weight": "model-00009-of-00011.safetensors",
+     "model.layers.33.self_attn.k_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.33.self_attn.o_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.33.self_attn.q_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.33.self_attn.rotary_emb.inv_freq": "model-00009-of-00011.safetensors",
+     "model.layers.33.self_attn.v_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.34.input_layernorm.weight": "model-00010-of-00011.safetensors",
+     "model.layers.34.mlp.down_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.34.mlp.gate_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.34.mlp.up_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.34.post_attention_layernorm.weight": "model-00010-of-00011.safetensors",
+     "model.layers.34.self_attn.k_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.34.self_attn.o_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.34.self_attn.q_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.34.self_attn.rotary_emb.inv_freq": "model-00010-of-00011.safetensors",
+     "model.layers.34.self_attn.v_proj.weight": "model-00009-of-00011.safetensors",
+     "model.layers.35.input_layernorm.weight": "model-00010-of-00011.safetensors",
+     "model.layers.35.mlp.down_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.35.mlp.gate_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.35.mlp.up_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.35.post_attention_layernorm.weight": "model-00010-of-00011.safetensors",
+     "model.layers.35.self_attn.k_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.35.self_attn.o_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.35.self_attn.q_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.35.self_attn.rotary_emb.inv_freq": "model-00010-of-00011.safetensors",
+     "model.layers.35.self_attn.v_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.36.input_layernorm.weight": "model-00010-of-00011.safetensors",
+     "model.layers.36.mlp.down_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.36.mlp.gate_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.36.mlp.up_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.36.post_attention_layernorm.weight": "model-00010-of-00011.safetensors",
+     "model.layers.36.self_attn.k_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.36.self_attn.o_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.36.self_attn.q_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.36.self_attn.rotary_emb.inv_freq": "model-00010-of-00011.safetensors",
+     "model.layers.36.self_attn.v_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.37.input_layernorm.weight": "model-00010-of-00011.safetensors",
+     "model.layers.37.mlp.down_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.37.mlp.gate_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.37.mlp.up_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.37.post_attention_layernorm.weight": "model-00010-of-00011.safetensors",
+     "model.layers.37.self_attn.k_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.37.self_attn.o_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.37.self_attn.q_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.37.self_attn.rotary_emb.inv_freq": "model-00010-of-00011.safetensors",
+     "model.layers.37.self_attn.v_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.38.input_layernorm.weight": "model-00011-of-00011.safetensors",
+     "model.layers.38.mlp.down_proj.weight": "model-00011-of-00011.safetensors",
+     "model.layers.38.mlp.gate_proj.weight": "model-00011-of-00011.safetensors",
+     "model.layers.38.mlp.up_proj.weight": "model-00011-of-00011.safetensors",
+     "model.layers.38.post_attention_layernorm.weight": "model-00011-of-00011.safetensors",
+     "model.layers.38.self_attn.k_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.38.self_attn.o_proj.weight": "model-00011-of-00011.safetensors",
+     "model.layers.38.self_attn.q_proj.weight": "model-00010-of-00011.safetensors",
+     "model.layers.38.self_attn.rotary_emb.inv_freq": "model-00011-of-00011.safetensors",
+     "model.layers.38.self_attn.v_proj.weight": "model-00011-of-00011.safetensors",
+     "model.layers.39.input_layernorm.weight": "model-00011-of-00011.safetensors",
+     "model.layers.39.mlp.down_proj.weight": "model-00011-of-00011.safetensors",
+     "model.layers.39.mlp.gate_proj.weight": "model-00011-of-00011.safetensors",
+     "model.layers.39.mlp.up_proj.weight": "model-00011-of-00011.safetensors",
+     "model.layers.39.post_attention_layernorm.weight": "model-00011-of-00011.safetensors",
+     "model.layers.39.self_attn.k_proj.weight": "model-00011-of-00011.safetensors",
+     "model.layers.39.self_attn.o_proj.weight": "model-00011-of-00011.safetensors",
+     "model.layers.39.self_attn.q_proj.weight": "model-00011-of-00011.safetensors",
+     "model.layers.39.self_attn.rotary_emb.inv_freq": "model-00011-of-00011.safetensors",
+     "model.layers.39.self_attn.v_proj.weight": "model-00011-of-00011.safetensors",
+     "model.layers.4.input_layernorm.weight": "model-00002-of-00011.safetensors",
+     "model.layers.4.mlp.down_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.4.mlp.gate_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.4.mlp.up_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.4.post_attention_layernorm.weight": "model-00002-of-00011.safetensors",
+     "model.layers.4.self_attn.k_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.4.self_attn.o_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.4.self_attn.q_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.4.self_attn.rotary_emb.inv_freq": "model-00002-of-00011.safetensors",
+     "model.layers.4.self_attn.v_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.5.input_layernorm.weight": "model-00002-of-00011.safetensors",
+     "model.layers.5.mlp.down_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.5.mlp.gate_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.5.mlp.up_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.5.post_attention_layernorm.weight": "model-00002-of-00011.safetensors",
+     "model.layers.5.self_attn.k_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.5.self_attn.o_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.5.self_attn.q_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.5.self_attn.rotary_emb.inv_freq": "model-00002-of-00011.safetensors",
+     "model.layers.5.self_attn.v_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.6.input_layernorm.weight": "model-00002-of-00011.safetensors",
+     "model.layers.6.mlp.down_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.6.mlp.gate_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.6.mlp.up_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.6.post_attention_layernorm.weight": "model-00002-of-00011.safetensors",
+     "model.layers.6.self_attn.k_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.6.self_attn.o_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.6.self_attn.q_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.6.self_attn.rotary_emb.inv_freq": "model-00002-of-00011.safetensors",
+     "model.layers.6.self_attn.v_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.7.input_layernorm.weight": "model-00003-of-00011.safetensors",
+     "model.layers.7.mlp.down_proj.weight": "model-00003-of-00011.safetensors",
+     "model.layers.7.mlp.gate_proj.weight": "model-00003-of-00011.safetensors",
+     "model.layers.7.mlp.up_proj.weight": "model-00003-of-00011.safetensors",
+     "model.layers.7.post_attention_layernorm.weight": "model-00003-of-00011.safetensors",
+     "model.layers.7.self_attn.k_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.7.self_attn.o_proj.weight": "model-00003-of-00011.safetensors",
+     "model.layers.7.self_attn.q_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.7.self_attn.rotary_emb.inv_freq": "model-00003-of-00011.safetensors",
+     "model.layers.7.self_attn.v_proj.weight": "model-00002-of-00011.safetensors",
+     "model.layers.8.input_layernorm.weight": "model-00003-of-00011.safetensors",
+     "model.layers.8.mlp.down_proj.weight": "model-00003-of-00011.safetensors",
+     "model.layers.8.mlp.gate_proj.weight": "model-00003-of-00011.safetensors",
+     "model.layers.8.mlp.up_proj.weight": "model-00003-of-00011.safetensors",
+     "model.layers.8.post_attention_layernorm.weight": "model-00003-of-00011.safetensors",
+     "model.layers.8.self_attn.k_proj.weight": "model-00003-of-00011.safetensors",
+     "model.layers.8.self_attn.o_proj.weight": "model-00003-of-00011.safetensors",
+     "model.layers.8.self_attn.q_proj.weight": "model-00003-of-00011.safetensors",
+     "model.layers.8.self_attn.rotary_emb.inv_freq": "model-00003-of-00011.safetensors",
+     "model.layers.8.self_attn.v_proj.weight": "model-00003-of-00011.safetensors",
+     "model.layers.9.input_layernorm.weight": "model-00003-of-00011.safetensors",
+     "model.layers.9.mlp.down_proj.weight": "model-00003-of-00011.safetensors",
+     "model.layers.9.mlp.gate_proj.weight": "model-00003-of-00011.safetensors",
+     "model.layers.9.mlp.up_proj.weight": "model-00003-of-00011.safetensors",
+     "model.layers.9.post_attention_layernorm.weight": "model-00003-of-00011.safetensors",
+     "model.layers.9.self_attn.k_proj.weight": "model-00003-of-00011.safetensors",
+     "model.layers.9.self_attn.o_proj.weight": "model-00003-of-00011.safetensors",
+     "model.layers.9.self_attn.q_proj.weight": "model-00003-of-00011.safetensors",
+     "model.layers.9.self_attn.rotary_emb.inv_freq": "model-00003-of-00011.safetensors",
+     "model.layers.9.self_attn.v_proj.weight": "model-00003-of-00011.safetensors",
+     "model.norm.weight": "model-00011-of-00011.safetensors"
+   }
+ }
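The weight map also allows reading single tensors without materializing the whole ~52 GB model; a minimal sketch (same assumed local checkout):

import json
from safetensors import safe_open

base = "checkpoints/diffsensei/mllm/llm"
with open(f"{base}/model.safetensors.index.json") as f:
    index = json.load(f)

# Look up which of the eleven shards holds the embedding table, then read it alone.
shard = index["weight_map"]["model.embed_tokens.weight"]  # model-00001-of-00011.safetensors
with safe_open(f"{base}/{shard}", framework="pt") as f:
    embed = f.get_tensor("model.embed_tokens.weight")  # shape (32330, 5120)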
mllm/tokenizer/added_tokens.json ADDED
@@ -0,0 +1,332 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
+ {
+ "</img>": 32101,
+ "</patch>": 32103,
+ "<box_end>": 32329,
+ "<box_start>": 32328,
+ "<img>": 32100,
+ "<img_00000>": 32000,
+ "<img_00001>": 32001,
+ "<img_00002>": 32002,
+ "<img_00003>": 32003,
+ "<img_00004>": 32004,
+ "<img_00005>": 32005,
+ "<img_00006>": 32006,
+ "<img_00007>": 32007,
+ "<img_00008>": 32008,
+ "<img_00009>": 32009,
+ "<img_00010>": 32010,
+ "<img_00011>": 32011,
+ "<img_00012>": 32012,
+ "<img_00013>": 32013,
+ "<img_00014>": 32014,
+ "<img_00015>": 32015,
+ "<img_00016>": 32016,
+ "<img_00017>": 32017,
+ "<img_00018>": 32018,
+ "<img_00019>": 32019,
+ "<img_00020>": 32020,
+ "<img_00021>": 32021,
+ "<img_00022>": 32022,
+ "<img_00023>": 32023,
+ "<img_00024>": 32024,
+ "<img_00025>": 32025,
+ "<img_00026>": 32026,
+ "<img_00027>": 32027,
+ "<img_00028>": 32028,
+ "<img_00029>": 32029,
+ "<img_00030>": 32030,
+ "<img_00031>": 32031,
+ "<img_00032>": 32032,
+ "<img_00033>": 32033,
+ "<img_00034>": 32034,
+ "<img_00035>": 32035,
+ "<img_00036>": 32036,
+ "<img_00037>": 32037,
+ "<img_00038>": 32038,
+ "<img_00039>": 32039,
+ "<img_00040>": 32040,
+ "<img_00041>": 32041,
+ "<img_00042>": 32042,
+ "<img_00043>": 32043,
+ "<img_00044>": 32044,
+ "<img_00045>": 32045,
+ "<img_00046>": 32046,
+ "<img_00047>": 32047,
+ "<img_00048>": 32048,
+ "<img_00049>": 32049,
+ "<img_00050>": 32050,
+ "<img_00051>": 32051,
+ "<img_00052>": 32052,
+ "<img_00053>": 32053,
+ "<img_00054>": 32054,
+ "<img_00055>": 32055,
+ "<img_00056>": 32056,
+ "<img_00057>": 32057,
+ "<img_00058>": 32058,
+ "<img_00059>": 32059,
+ "<img_00060>": 32060,
+ "<img_00061>": 32061,
+ "<img_00062>": 32062,
+ "<img_00063>": 32063,
+ "<img_00064>": 32064,
+ "<img_00065>": 32065,
+ "<img_00066>": 32066,
+ "<img_00067>": 32067,
+ "<img_00068>": 32068,
+ "<img_00069>": 32069,
+ "<img_00070>": 32070,
+ "<img_00071>": 32071,
+ "<img_00072>": 32072,
+ "<img_00073>": 32073,
+ "<img_00074>": 32074,
+ "<img_00075>": 32075,
+ "<img_00076>": 32076,
+ "<img_00077>": 32077,
+ "<img_00078>": 32078,
+ "<img_00079>": 32079,
+ "<img_00080>": 32080,
+ "<img_00081>": 32081,
+ "<img_00082>": 32082,
+ "<img_00083>": 32083,
+ "<img_00084>": 32084,
+ "<img_00085>": 32085,
+ "<img_00086>": 32086,
+ "<img_00087>": 32087,
+ "<img_00088>": 32088,
+ "<img_00089>": 32089,
+ "<img_00090>": 32090,
+ "<img_00091>": 32091,
+ "<img_00092>": 32092,
+ "<img_00093>": 32093,
+ "<img_00094>": 32094,
+ "<img_00095>": 32095,
+ "<img_00096>": 32096,
+ "<img_00097>": 32097,
+ "<img_00098>": 32098,
+ "<img_00099>": 32099,
+ "<loc-0>": 32104,
+ "<loc-100>": 32204,
+ "<loc-101>": 32205,
+ "<loc-102>": 32206,
+ "<loc-103>": 32207,
+ "<loc-104>": 32208,
+ "<loc-105>": 32209,
+ "<loc-106>": 32210,
+ "<loc-107>": 32211,
+ "<loc-108>": 32212,
+ "<loc-109>": 32213,
+ "<loc-10>": 32114,
+ "<loc-110>": 32214,
+ "<loc-111>": 32215,
+ "<loc-112>": 32216,
+ "<loc-113>": 32217,
+ "<loc-114>": 32218,
+ "<loc-115>": 32219,
+ "<loc-116>": 32220,
+ "<loc-117>": 32221,
+ "<loc-118>": 32222,
+ "<loc-119>": 32223,
+ "<loc-11>": 32115,
+ "<loc-120>": 32224,
+ "<loc-121>": 32225,
+ "<loc-122>": 32226,
+ "<loc-123>": 32227,
+ "<loc-124>": 32228,
+ "<loc-125>": 32229,
+ "<loc-126>": 32230,
+ "<loc-127>": 32231,
+ "<loc-128>": 32232,
+ "<loc-129>": 32233,
+ "<loc-12>": 32116,
+ "<loc-130>": 32234,
+ "<loc-131>": 32235,
+ "<loc-132>": 32236,
+ "<loc-133>": 32237,
+ "<loc-134>": 32238,
+ "<loc-135>": 32239,
+ "<loc-136>": 32240,
+ "<loc-137>": 32241,
+ "<loc-138>": 32242,
+ "<loc-139>": 32243,
+ "<loc-13>": 32117,
+ "<loc-140>": 32244,
+ "<loc-141>": 32245,
+ "<loc-142>": 32246,
+ "<loc-143>": 32247,
+ "<loc-144>": 32248,
+ "<loc-145>": 32249,
+ "<loc-146>": 32250,
+ "<loc-147>": 32251,
+ "<loc-148>": 32252,
+ "<loc-149>": 32253,
+ "<loc-14>": 32118,
+ "<loc-150>": 32254,
+ "<loc-151>": 32255,
+ "<loc-152>": 32256,
+ "<loc-153>": 32257,
+ "<loc-154>": 32258,
+ "<loc-155>": 32259,
+ "<loc-156>": 32260,
+ "<loc-157>": 32261,
+ "<loc-158>": 32262,
+ "<loc-159>": 32263,
+ "<loc-15>": 32119,
+ "<loc-160>": 32264,
+ "<loc-161>": 32265,
+ "<loc-162>": 32266,
+ "<loc-163>": 32267,
+ "<loc-164>": 32268,
+ "<loc-165>": 32269,
+ "<loc-166>": 32270,
+ "<loc-167>": 32271,
+ "<loc-168>": 32272,
+ "<loc-169>": 32273,
+ "<loc-16>": 32120,
+ "<loc-170>": 32274,
+ "<loc-171>": 32275,
+ "<loc-172>": 32276,
+ "<loc-173>": 32277,
+ "<loc-174>": 32278,
+ "<loc-175>": 32279,
+ "<loc-176>": 32280,
+ "<loc-177>": 32281,
+ "<loc-178>": 32282,
+ "<loc-179>": 32283,
+ "<loc-17>": 32121,
+ "<loc-180>": 32284,
+ "<loc-181>": 32285,
+ "<loc-182>": 32286,
+ "<loc-183>": 32287,
+ "<loc-184>": 32288,
+ "<loc-185>": 32289,
+ "<loc-186>": 32290,
+ "<loc-187>": 32291,
+ "<loc-188>": 32292,
+ "<loc-189>": 32293,
+ "<loc-18>": 32122,
+ "<loc-190>": 32294,
+ "<loc-191>": 32295,
+ "<loc-192>": 32296,
+ "<loc-193>": 32297,
+ "<loc-194>": 32298,
+ "<loc-195>": 32299,
+ "<loc-196>": 32300,
+ "<loc-197>": 32301,
+ "<loc-198>": 32302,
+ "<loc-199>": 32303,
+ "<loc-19>": 32123,
+ "<loc-1>": 32105,
+ "<loc-200>": 32304,
+ "<loc-201>": 32305,
+ "<loc-202>": 32306,
+ "<loc-203>": 32307,
+ "<loc-204>": 32308,
+ "<loc-205>": 32309,
+ "<loc-206>": 32310,
+ "<loc-207>": 32311,
+ "<loc-208>": 32312,
+ "<loc-209>": 32313,
+ "<loc-20>": 32124,
+ "<loc-210>": 32314,
+ "<loc-211>": 32315,
+ "<loc-212>": 32316,
+ "<loc-213>": 32317,
+ "<loc-214>": 32318,
+ "<loc-215>": 32319,
+ "<loc-216>": 32320,
+ "<loc-217>": 32321,
+ "<loc-218>": 32322,
+ "<loc-219>": 32323,
+ "<loc-21>": 32125,
+ "<loc-220>": 32324,
+ "<loc-221>": 32325,
+ "<loc-222>": 32326,
+ "<loc-223>": 32327,
+ "<loc-22>": 32126,
+ "<loc-23>": 32127,
+ "<loc-24>": 32128,
+ "<loc-25>": 32129,
+ "<loc-26>": 32130,
+ "<loc-27>": 32131,
+ "<loc-28>": 32132,
+ "<loc-29>": 32133,
+ "<loc-2>": 32106,
+ "<loc-30>": 32134,
+ "<loc-31>": 32135,
+ "<loc-32>": 32136,
+ "<loc-33>": 32137,
+ "<loc-34>": 32138,
+ "<loc-35>": 32139,
+ "<loc-36>": 32140,
+ "<loc-37>": 32141,
+ "<loc-38>": 32142,
+ "<loc-39>": 32143,
+ "<loc-3>": 32107,
+ "<loc-40>": 32144,
+ "<loc-41>": 32145,
+ "<loc-42>": 32146,
+ "<loc-43>": 32147,
+ "<loc-44>": 32148,
+ "<loc-45>": 32149,
+ "<loc-46>": 32150,
+ "<loc-47>": 32151,
+ "<loc-48>": 32152,
+ "<loc-49>": 32153,
+ "<loc-4>": 32108,
+ "<loc-50>": 32154,
+ "<loc-51>": 32155,
+ "<loc-52>": 32156,
+ "<loc-53>": 32157,
+ "<loc-54>": 32158,
+ "<loc-55>": 32159,
+ "<loc-56>": 32160,
+ "<loc-57>": 32161,
+ "<loc-58>": 32162,
+ "<loc-59>": 32163,
+ "<loc-5>": 32109,
+ "<loc-60>": 32164,
+ "<loc-61>": 32165,
+ "<loc-62>": 32166,
+ "<loc-63>": 32167,
+ "<loc-64>": 32168,
+ "<loc-65>": 32169,
+ "<loc-66>": 32170,
+ "<loc-67>": 32171,
+ "<loc-68>": 32172,
+ "<loc-69>": 32173,
+ "<loc-6>": 32110,
+ "<loc-70>": 32174,
+ "<loc-71>": 32175,
+ "<loc-72>": 32176,
+ "<loc-73>": 32177,
+ "<loc-74>": 32178,
+ "<loc-75>": 32179,
+ "<loc-76>": 32180,
+ "<loc-77>": 32181,
+ "<loc-78>": 32182,
+ "<loc-79>": 32183,
+ "<loc-7>": 32111,
+ "<loc-80>": 32184,
+ "<loc-81>": 32185,
+ "<loc-82>": 32186,
+ "<loc-83>": 32187,
+ "<loc-84>": 32188,
+ "<loc-85>": 32189,
+ "<loc-86>": 32190,
+ "<loc-87>": 32191,
+ "<loc-88>": 32192,
+ "<loc-89>": 32193,
+ "<loc-8>": 32112,
+ "<loc-90>": 32194,
+ "<loc-91>": 32195,
+ "<loc-92>": 32196,
+ "<loc-93>": 32197,
+ "<loc-94>": 32198,
+ "<loc-95>": 32199,
+ "<loc-96>": 32200,
+ "<loc-97>": 32201,
+ "<loc-98>": 32202,
+ "<loc-99>": 32203,
+ "<loc-9>": 32113,
+ "<patch>": 32102
+ }
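A minimal sketch of what this file adds, assuming the tokenizer directory above is checked out locally as mllm/tokenizer: the base 32000-entry Llama vocabulary gains 330 tokens, namely <img_00000>..<img_00099> (ids 32000-32099) as image-embedding placeholders, <img>/</img> and <patch>/</patch> delimiters (32100-32103), 224 location bins <loc-0>..<loc-223> (32104-32327), and <box_start>/<box_end> (32328/32329). The box string below is a hypothetical illustration of spelling a quantized bounding box with these tokens, not a format confirmed by the source.

from transformers import LlamaTokenizer

tokenizer = LlamaTokenizer.from_pretrained("mllm/tokenizer")

print(tokenizer.convert_tokens_to_ids("<img>"))        # 32100
print(tokenizer.convert_tokens_to_ids("<box_start>"))  # 32328

# Hypothetical: bracket four quantized coordinates with the box markers.
box = "<box_start><loc-12><loc-34><loc-120><loc-200><box_end>"
print(tokenizer.convert_tokens_to_ids(tokenizer.tokenize(box)))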
mllm/tokenizer/special_tokens_map.json ADDED
@@ -0,0 +1,24 @@
+ {
+ "bos_token": {
+ "content": "<s>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "eos_token": {
+ "content": "</s>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "pad_token": "<unk>",
+ "unk_token": {
+ "content": "<unk>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ }
+ }
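A short sketch of the effect of this map at load time (same assumed local mllm/tokenizer path): padding is aliased to <unk>, so padded batches reuse the unknown-token id instead of adding a dedicated pad token to the vocabulary.

from transformers import LlamaTokenizer

tokenizer = LlamaTokenizer.from_pretrained("mllm/tokenizer")
print(tokenizer.bos_token, tokenizer.eos_token)      # <s> </s>
print(tokenizer.pad_token_id == tokenizer.unk_token_id)  # True: pad aliased to <unk>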
mllm/tokenizer/tokenizer.model ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347
+ size 499723
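The three lines above are a Git LFS pointer, not the SentencePiece model itself. A minimal sketch to check that the real blob was fetched: its byte size and SHA-256 digest must match the pointer's "size" and "oid" fields.

import hashlib
from pathlib import Path

blob = Path("mllm/tokenizer/tokenizer.model").read_bytes()
# A pointer stub is ~130 bytes; the real model is 499723 bytes.
assert len(blob) == 499723, "still a pointer stub? run `git lfs pull`"
assert hashlib.sha256(blob).hexdigest() == (
    "9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347"
)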
mllm/tokenizer/tokenizer_config.json ADDED
@@ -0,0 +1,34 @@
+ {
+ "add_bos_token": true,
+ "add_eos_token": false,
+ "bos_token": {
+ "__type": "AddedToken",
+ "content": "<s>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "clean_up_tokenization_spaces": false,
+ "eos_token": {
+ "__type": "AddedToken",
+ "content": "</s>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "legacy": false,
+ "model_max_length": 1000000000000000019884624838656,
+ "pad_token": null,
+ "sp_model_kwargs": {},
+ "tokenizer_class": "LlamaTokenizer",
+ "unk_token": {
+ "__type": "AddedToken",
+ "content": "<unk>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ }
+ }
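A minimal sketch of the encoding behavior this config pins down, again assuming the local mllm/tokenizer path: "add_bos_token": true and "add_eos_token": false mean every encoded sequence starts with <s> and gets no trailing </s>, and the astronomically large "model_max_length" is the transformers sentinel for "no length limit configured".

from transformers import LlamaTokenizer

tokenizer = LlamaTokenizer.from_pretrained("mllm/tokenizer")
ids = tokenizer("a manga panel").input_ids
print(ids[0] == tokenizer.bos_token_id)   # True: BOS prepended
print(ids[-1] == tokenizer.eos_token_id)  # False: no EOS appended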