Image-to-Text
Transformers
Safetensors
Japanese
llava-jp
text-generation
vision
image-captioning
VQA
Inference Endpoints
ConvLLaVA-JP-1.3b-768 / model.safetensors.index.json
toshi456's picture
Upload 8 files
5d355b8 verified
raw
history blame
64.2 kB
{
"metadata": {
"total_size": 7061942656
},
"weight_map": {
"lm_head.weight": "model-00002-of-00002.safetensors",
"model.mm_projector.0.bias": "model-00002-of-00002.safetensors",
"model.mm_projector.0.weight": "model-00002-of-00002.safetensors",
"model.mm_projector.2.bias": "model-00002-of-00002.safetensors",
"model.mm_projector.2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.0.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.0.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.0.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.0.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.0.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.0.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.0.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.0.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.0.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.1.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.1.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.1.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.1.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.1.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.1.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.1.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.1.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.2.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.2.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.2.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.2.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.2.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.2.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.2.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.2.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.0.blocks.2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.0.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.0.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.0.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.0.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.0.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.0.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.0.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.0.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.0.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.1.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.1.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.1.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.1.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.1.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.1.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.1.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.1.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.2.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.2.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.2.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.2.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.2.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.2.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.2.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.2.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.blocks.2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.downsample.0.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.downsample.0.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.downsample.1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.1.downsample.1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.0.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.0.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.0.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.0.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.0.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.0.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.0.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.0.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.0.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.1.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.1.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.1.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.1.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.1.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.1.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.1.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.1.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.10.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.10.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.10.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.10.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.10.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.10.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.10.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.10.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.10.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.11.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.11.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.11.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.11.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.11.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.11.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.11.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.11.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.11.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.12.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.12.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.12.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.12.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.12.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.12.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.12.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.12.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.12.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.13.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.13.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.13.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.13.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.13.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.13.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.13.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.13.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.13.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.14.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.14.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.14.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.14.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.14.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.14.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.14.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.14.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.14.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.15.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.15.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.15.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.15.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.15.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.15.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.15.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.15.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.15.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.16.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.16.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.16.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.16.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.16.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.16.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.16.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.16.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.16.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.17.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.17.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.17.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.17.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.17.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.17.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.17.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.17.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.17.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.18.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.18.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.18.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.18.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.18.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.18.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.18.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.18.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.18.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.19.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.19.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.19.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.19.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.19.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.19.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.19.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.19.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.19.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.2.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.2.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.2.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.2.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.2.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.2.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.2.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.2.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.20.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.20.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.20.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.20.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.20.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.20.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.20.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.20.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.20.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.21.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.21.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.21.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.21.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.21.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.21.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.21.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.21.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.21.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.22.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.22.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.22.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.22.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.22.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.22.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.22.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.22.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.22.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.23.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.23.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.23.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.23.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.23.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.23.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.23.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.23.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.23.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.24.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.24.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.24.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.24.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.24.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.24.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.24.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.24.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.24.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.25.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.25.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.25.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.25.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.25.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.25.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.25.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.25.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.25.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.26.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.26.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.26.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.26.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.26.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.26.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.26.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.26.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.26.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.3.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.3.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.3.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.3.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.3.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.3.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.3.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.3.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.3.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.4.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.4.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.4.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.4.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.4.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.4.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.4.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.4.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.4.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.5.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.5.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.5.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.5.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.5.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.5.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.5.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.5.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.5.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.6.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.6.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.6.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.6.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.6.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.6.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.6.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.6.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.6.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.7.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.7.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.7.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.7.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.7.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.7.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.7.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.7.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.7.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.8.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.8.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.8.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.8.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.8.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.8.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.8.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.8.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.8.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.9.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.9.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.9.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.9.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.9.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.9.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.9.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.9.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.blocks.9.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.downsample.0.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.downsample.0.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.downsample.1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.2.downsample.1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.0.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.0.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.0.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.0.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.0.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.0.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.0.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.0.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.0.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.1.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.1.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.1.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.1.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.1.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.1.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.1.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.1.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.2.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.2.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.2.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.2.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.2.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.2.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.2.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.2.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.blocks.2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.downsample.0.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.downsample.0.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.downsample.1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.3.downsample.1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.0.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.0.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.0.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.0.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.0.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.0.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.0.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.0.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.0.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.1.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.1.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.1.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.1.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.1.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.1.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.1.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.1.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.2.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.2.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.2.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.2.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.2.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.2.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.2.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.2.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.3.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.3.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.3.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.3.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.3.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.3.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.3.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.3.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.3.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.4.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.4.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.4.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.4.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.4.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.4.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.4.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.4.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.4.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.5.conv_dw.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.5.conv_dw.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.5.mlp.fc1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.5.mlp.fc1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.5.mlp.fc2.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.5.mlp.fc2.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.5.norm.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.5.norm.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.blocks.5.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.downsample.0.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.downsample.0.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.downsample.1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stages.4.downsample.1.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stem.0.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stem.0.weight": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stem.1.bias": "model-00002-of-00002.safetensors",
"model.vision_tower.vision_tower.stem.1.weight": "model-00002-of-00002.safetensors",
"transformer.h.0.attn.c_attn.bias": "model-00001-of-00002.safetensors",
"transformer.h.0.attn.c_attn.weight": "model-00001-of-00002.safetensors",
"transformer.h.0.attn.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.0.attn.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.0.ln_1.bias": "model-00001-of-00002.safetensors",
"transformer.h.0.ln_1.weight": "model-00001-of-00002.safetensors",
"transformer.h.0.ln_2.bias": "model-00001-of-00002.safetensors",
"transformer.h.0.ln_2.weight": "model-00001-of-00002.safetensors",
"transformer.h.0.mlp.c_fc.bias": "model-00001-of-00002.safetensors",
"transformer.h.0.mlp.c_fc.weight": "model-00001-of-00002.safetensors",
"transformer.h.0.mlp.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.0.mlp.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.1.attn.c_attn.bias": "model-00001-of-00002.safetensors",
"transformer.h.1.attn.c_attn.weight": "model-00001-of-00002.safetensors",
"transformer.h.1.attn.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.1.attn.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.1.ln_1.bias": "model-00001-of-00002.safetensors",
"transformer.h.1.ln_1.weight": "model-00001-of-00002.safetensors",
"transformer.h.1.ln_2.bias": "model-00001-of-00002.safetensors",
"transformer.h.1.ln_2.weight": "model-00001-of-00002.safetensors",
"transformer.h.1.mlp.c_fc.bias": "model-00001-of-00002.safetensors",
"transformer.h.1.mlp.c_fc.weight": "model-00001-of-00002.safetensors",
"transformer.h.1.mlp.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.1.mlp.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.10.attn.c_attn.bias": "model-00001-of-00002.safetensors",
"transformer.h.10.attn.c_attn.weight": "model-00001-of-00002.safetensors",
"transformer.h.10.attn.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.10.attn.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.10.ln_1.bias": "model-00001-of-00002.safetensors",
"transformer.h.10.ln_1.weight": "model-00001-of-00002.safetensors",
"transformer.h.10.ln_2.bias": "model-00001-of-00002.safetensors",
"transformer.h.10.ln_2.weight": "model-00001-of-00002.safetensors",
"transformer.h.10.mlp.c_fc.bias": "model-00001-of-00002.safetensors",
"transformer.h.10.mlp.c_fc.weight": "model-00001-of-00002.safetensors",
"transformer.h.10.mlp.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.10.mlp.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.11.attn.c_attn.bias": "model-00001-of-00002.safetensors",
"transformer.h.11.attn.c_attn.weight": "model-00001-of-00002.safetensors",
"transformer.h.11.attn.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.11.attn.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.11.ln_1.bias": "model-00001-of-00002.safetensors",
"transformer.h.11.ln_1.weight": "model-00001-of-00002.safetensors",
"transformer.h.11.ln_2.bias": "model-00001-of-00002.safetensors",
"transformer.h.11.ln_2.weight": "model-00001-of-00002.safetensors",
"transformer.h.11.mlp.c_fc.bias": "model-00001-of-00002.safetensors",
"transformer.h.11.mlp.c_fc.weight": "model-00001-of-00002.safetensors",
"transformer.h.11.mlp.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.11.mlp.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.12.attn.c_attn.bias": "model-00001-of-00002.safetensors",
"transformer.h.12.attn.c_attn.weight": "model-00001-of-00002.safetensors",
"transformer.h.12.attn.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.12.attn.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.12.ln_1.bias": "model-00001-of-00002.safetensors",
"transformer.h.12.ln_1.weight": "model-00001-of-00002.safetensors",
"transformer.h.12.ln_2.bias": "model-00001-of-00002.safetensors",
"transformer.h.12.ln_2.weight": "model-00001-of-00002.safetensors",
"transformer.h.12.mlp.c_fc.bias": "model-00001-of-00002.safetensors",
"transformer.h.12.mlp.c_fc.weight": "model-00001-of-00002.safetensors",
"transformer.h.12.mlp.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.12.mlp.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.13.attn.c_attn.bias": "model-00001-of-00002.safetensors",
"transformer.h.13.attn.c_attn.weight": "model-00001-of-00002.safetensors",
"transformer.h.13.attn.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.13.attn.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.13.ln_1.bias": "model-00001-of-00002.safetensors",
"transformer.h.13.ln_1.weight": "model-00001-of-00002.safetensors",
"transformer.h.13.ln_2.bias": "model-00001-of-00002.safetensors",
"transformer.h.13.ln_2.weight": "model-00001-of-00002.safetensors",
"transformer.h.13.mlp.c_fc.bias": "model-00001-of-00002.safetensors",
"transformer.h.13.mlp.c_fc.weight": "model-00001-of-00002.safetensors",
"transformer.h.13.mlp.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.13.mlp.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.14.attn.c_attn.bias": "model-00001-of-00002.safetensors",
"transformer.h.14.attn.c_attn.weight": "model-00001-of-00002.safetensors",
"transformer.h.14.attn.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.14.attn.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.14.ln_1.bias": "model-00001-of-00002.safetensors",
"transformer.h.14.ln_1.weight": "model-00001-of-00002.safetensors",
"transformer.h.14.ln_2.bias": "model-00001-of-00002.safetensors",
"transformer.h.14.ln_2.weight": "model-00001-of-00002.safetensors",
"transformer.h.14.mlp.c_fc.bias": "model-00001-of-00002.safetensors",
"transformer.h.14.mlp.c_fc.weight": "model-00001-of-00002.safetensors",
"transformer.h.14.mlp.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.14.mlp.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.15.attn.c_attn.bias": "model-00001-of-00002.safetensors",
"transformer.h.15.attn.c_attn.weight": "model-00001-of-00002.safetensors",
"transformer.h.15.attn.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.15.attn.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.15.ln_1.bias": "model-00001-of-00002.safetensors",
"transformer.h.15.ln_1.weight": "model-00001-of-00002.safetensors",
"transformer.h.15.ln_2.bias": "model-00001-of-00002.safetensors",
"transformer.h.15.ln_2.weight": "model-00001-of-00002.safetensors",
"transformer.h.15.mlp.c_fc.bias": "model-00001-of-00002.safetensors",
"transformer.h.15.mlp.c_fc.weight": "model-00001-of-00002.safetensors",
"transformer.h.15.mlp.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.15.mlp.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.16.attn.c_attn.bias": "model-00001-of-00002.safetensors",
"transformer.h.16.attn.c_attn.weight": "model-00001-of-00002.safetensors",
"transformer.h.16.attn.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.16.attn.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.16.ln_1.bias": "model-00001-of-00002.safetensors",
"transformer.h.16.ln_1.weight": "model-00001-of-00002.safetensors",
"transformer.h.16.ln_2.bias": "model-00001-of-00002.safetensors",
"transformer.h.16.ln_2.weight": "model-00001-of-00002.safetensors",
"transformer.h.16.mlp.c_fc.bias": "model-00001-of-00002.safetensors",
"transformer.h.16.mlp.c_fc.weight": "model-00001-of-00002.safetensors",
"transformer.h.16.mlp.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.16.mlp.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.17.attn.c_attn.bias": "model-00001-of-00002.safetensors",
"transformer.h.17.attn.c_attn.weight": "model-00001-of-00002.safetensors",
"transformer.h.17.attn.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.17.attn.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.17.ln_1.bias": "model-00001-of-00002.safetensors",
"transformer.h.17.ln_1.weight": "model-00001-of-00002.safetensors",
"transformer.h.17.ln_2.bias": "model-00001-of-00002.safetensors",
"transformer.h.17.ln_2.weight": "model-00001-of-00002.safetensors",
"transformer.h.17.mlp.c_fc.bias": "model-00001-of-00002.safetensors",
"transformer.h.17.mlp.c_fc.weight": "model-00001-of-00002.safetensors",
"transformer.h.17.mlp.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.17.mlp.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.18.attn.c_attn.bias": "model-00001-of-00002.safetensors",
"transformer.h.18.attn.c_attn.weight": "model-00001-of-00002.safetensors",
"transformer.h.18.attn.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.18.attn.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.18.ln_1.bias": "model-00001-of-00002.safetensors",
"transformer.h.18.ln_1.weight": "model-00001-of-00002.safetensors",
"transformer.h.18.ln_2.bias": "model-00001-of-00002.safetensors",
"transformer.h.18.ln_2.weight": "model-00001-of-00002.safetensors",
"transformer.h.18.mlp.c_fc.bias": "model-00001-of-00002.safetensors",
"transformer.h.18.mlp.c_fc.weight": "model-00001-of-00002.safetensors",
"transformer.h.18.mlp.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.18.mlp.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.19.attn.c_attn.bias": "model-00001-of-00002.safetensors",
"transformer.h.19.attn.c_attn.weight": "model-00001-of-00002.safetensors",
"transformer.h.19.attn.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.19.attn.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.19.ln_1.bias": "model-00001-of-00002.safetensors",
"transformer.h.19.ln_1.weight": "model-00001-of-00002.safetensors",
"transformer.h.19.ln_2.bias": "model-00001-of-00002.safetensors",
"transformer.h.19.ln_2.weight": "model-00001-of-00002.safetensors",
"transformer.h.19.mlp.c_fc.bias": "model-00001-of-00002.safetensors",
"transformer.h.19.mlp.c_fc.weight": "model-00001-of-00002.safetensors",
"transformer.h.19.mlp.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.19.mlp.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.2.attn.c_attn.bias": "model-00001-of-00002.safetensors",
"transformer.h.2.attn.c_attn.weight": "model-00001-of-00002.safetensors",
"transformer.h.2.attn.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.2.attn.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.2.ln_1.bias": "model-00001-of-00002.safetensors",
"transformer.h.2.ln_1.weight": "model-00001-of-00002.safetensors",
"transformer.h.2.ln_2.bias": "model-00001-of-00002.safetensors",
"transformer.h.2.ln_2.weight": "model-00001-of-00002.safetensors",
"transformer.h.2.mlp.c_fc.bias": "model-00001-of-00002.safetensors",
"transformer.h.2.mlp.c_fc.weight": "model-00001-of-00002.safetensors",
"transformer.h.2.mlp.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.2.mlp.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.20.attn.c_attn.bias": "model-00001-of-00002.safetensors",
"transformer.h.20.attn.c_attn.weight": "model-00001-of-00002.safetensors",
"transformer.h.20.attn.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.20.attn.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.20.ln_1.bias": "model-00001-of-00002.safetensors",
"transformer.h.20.ln_1.weight": "model-00001-of-00002.safetensors",
"transformer.h.20.ln_2.bias": "model-00001-of-00002.safetensors",
"transformer.h.20.ln_2.weight": "model-00001-of-00002.safetensors",
"transformer.h.20.mlp.c_fc.bias": "model-00001-of-00002.safetensors",
"transformer.h.20.mlp.c_fc.weight": "model-00001-of-00002.safetensors",
"transformer.h.20.mlp.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.20.mlp.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.21.attn.c_attn.bias": "model-00001-of-00002.safetensors",
"transformer.h.21.attn.c_attn.weight": "model-00001-of-00002.safetensors",
"transformer.h.21.attn.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.21.attn.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.21.ln_1.bias": "model-00001-of-00002.safetensors",
"transformer.h.21.ln_1.weight": "model-00001-of-00002.safetensors",
"transformer.h.21.ln_2.bias": "model-00001-of-00002.safetensors",
"transformer.h.21.ln_2.weight": "model-00001-of-00002.safetensors",
"transformer.h.21.mlp.c_fc.bias": "model-00001-of-00002.safetensors",
"transformer.h.21.mlp.c_fc.weight": "model-00001-of-00002.safetensors",
"transformer.h.21.mlp.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.21.mlp.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.22.attn.c_attn.bias": "model-00001-of-00002.safetensors",
"transformer.h.22.attn.c_attn.weight": "model-00001-of-00002.safetensors",
"transformer.h.22.attn.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.22.attn.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.22.ln_1.bias": "model-00001-of-00002.safetensors",
"transformer.h.22.ln_1.weight": "model-00001-of-00002.safetensors",
"transformer.h.22.ln_2.bias": "model-00001-of-00002.safetensors",
"transformer.h.22.ln_2.weight": "model-00001-of-00002.safetensors",
"transformer.h.22.mlp.c_fc.bias": "model-00001-of-00002.safetensors",
"transformer.h.22.mlp.c_fc.weight": "model-00001-of-00002.safetensors",
"transformer.h.22.mlp.c_proj.bias": "model-00002-of-00002.safetensors",
"transformer.h.22.mlp.c_proj.weight": "model-00002-of-00002.safetensors",
"transformer.h.23.attn.c_attn.bias": "model-00002-of-00002.safetensors",
"transformer.h.23.attn.c_attn.weight": "model-00002-of-00002.safetensors",
"transformer.h.23.attn.c_proj.bias": "model-00002-of-00002.safetensors",
"transformer.h.23.attn.c_proj.weight": "model-00002-of-00002.safetensors",
"transformer.h.23.ln_1.bias": "model-00002-of-00002.safetensors",
"transformer.h.23.ln_1.weight": "model-00002-of-00002.safetensors",
"transformer.h.23.ln_2.bias": "model-00002-of-00002.safetensors",
"transformer.h.23.ln_2.weight": "model-00002-of-00002.safetensors",
"transformer.h.23.mlp.c_fc.bias": "model-00002-of-00002.safetensors",
"transformer.h.23.mlp.c_fc.weight": "model-00002-of-00002.safetensors",
"transformer.h.23.mlp.c_proj.bias": "model-00002-of-00002.safetensors",
"transformer.h.23.mlp.c_proj.weight": "model-00002-of-00002.safetensors",
"transformer.h.3.attn.c_attn.bias": "model-00001-of-00002.safetensors",
"transformer.h.3.attn.c_attn.weight": "model-00001-of-00002.safetensors",
"transformer.h.3.attn.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.3.attn.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.3.ln_1.bias": "model-00001-of-00002.safetensors",
"transformer.h.3.ln_1.weight": "model-00001-of-00002.safetensors",
"transformer.h.3.ln_2.bias": "model-00001-of-00002.safetensors",
"transformer.h.3.ln_2.weight": "model-00001-of-00002.safetensors",
"transformer.h.3.mlp.c_fc.bias": "model-00001-of-00002.safetensors",
"transformer.h.3.mlp.c_fc.weight": "model-00001-of-00002.safetensors",
"transformer.h.3.mlp.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.3.mlp.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.4.attn.c_attn.bias": "model-00001-of-00002.safetensors",
"transformer.h.4.attn.c_attn.weight": "model-00001-of-00002.safetensors",
"transformer.h.4.attn.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.4.attn.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.4.ln_1.bias": "model-00001-of-00002.safetensors",
"transformer.h.4.ln_1.weight": "model-00001-of-00002.safetensors",
"transformer.h.4.ln_2.bias": "model-00001-of-00002.safetensors",
"transformer.h.4.ln_2.weight": "model-00001-of-00002.safetensors",
"transformer.h.4.mlp.c_fc.bias": "model-00001-of-00002.safetensors",
"transformer.h.4.mlp.c_fc.weight": "model-00001-of-00002.safetensors",
"transformer.h.4.mlp.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.4.mlp.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.5.attn.c_attn.bias": "model-00001-of-00002.safetensors",
"transformer.h.5.attn.c_attn.weight": "model-00001-of-00002.safetensors",
"transformer.h.5.attn.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.5.attn.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.5.ln_1.bias": "model-00001-of-00002.safetensors",
"transformer.h.5.ln_1.weight": "model-00001-of-00002.safetensors",
"transformer.h.5.ln_2.bias": "model-00001-of-00002.safetensors",
"transformer.h.5.ln_2.weight": "model-00001-of-00002.safetensors",
"transformer.h.5.mlp.c_fc.bias": "model-00001-of-00002.safetensors",
"transformer.h.5.mlp.c_fc.weight": "model-00001-of-00002.safetensors",
"transformer.h.5.mlp.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.5.mlp.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.6.attn.c_attn.bias": "model-00001-of-00002.safetensors",
"transformer.h.6.attn.c_attn.weight": "model-00001-of-00002.safetensors",
"transformer.h.6.attn.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.6.attn.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.6.ln_1.bias": "model-00001-of-00002.safetensors",
"transformer.h.6.ln_1.weight": "model-00001-of-00002.safetensors",
"transformer.h.6.ln_2.bias": "model-00001-of-00002.safetensors",
"transformer.h.6.ln_2.weight": "model-00001-of-00002.safetensors",
"transformer.h.6.mlp.c_fc.bias": "model-00001-of-00002.safetensors",
"transformer.h.6.mlp.c_fc.weight": "model-00001-of-00002.safetensors",
"transformer.h.6.mlp.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.6.mlp.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.7.attn.c_attn.bias": "model-00001-of-00002.safetensors",
"transformer.h.7.attn.c_attn.weight": "model-00001-of-00002.safetensors",
"transformer.h.7.attn.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.7.attn.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.7.ln_1.bias": "model-00001-of-00002.safetensors",
"transformer.h.7.ln_1.weight": "model-00001-of-00002.safetensors",
"transformer.h.7.ln_2.bias": "model-00001-of-00002.safetensors",
"transformer.h.7.ln_2.weight": "model-00001-of-00002.safetensors",
"transformer.h.7.mlp.c_fc.bias": "model-00001-of-00002.safetensors",
"transformer.h.7.mlp.c_fc.weight": "model-00001-of-00002.safetensors",
"transformer.h.7.mlp.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.7.mlp.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.8.attn.c_attn.bias": "model-00001-of-00002.safetensors",
"transformer.h.8.attn.c_attn.weight": "model-00001-of-00002.safetensors",
"transformer.h.8.attn.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.8.attn.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.8.ln_1.bias": "model-00001-of-00002.safetensors",
"transformer.h.8.ln_1.weight": "model-00001-of-00002.safetensors",
"transformer.h.8.ln_2.bias": "model-00001-of-00002.safetensors",
"transformer.h.8.ln_2.weight": "model-00001-of-00002.safetensors",
"transformer.h.8.mlp.c_fc.bias": "model-00001-of-00002.safetensors",
"transformer.h.8.mlp.c_fc.weight": "model-00001-of-00002.safetensors",
"transformer.h.8.mlp.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.8.mlp.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.9.attn.c_attn.bias": "model-00001-of-00002.safetensors",
"transformer.h.9.attn.c_attn.weight": "model-00001-of-00002.safetensors",
"transformer.h.9.attn.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.9.attn.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.h.9.ln_1.bias": "model-00001-of-00002.safetensors",
"transformer.h.9.ln_1.weight": "model-00001-of-00002.safetensors",
"transformer.h.9.ln_2.bias": "model-00001-of-00002.safetensors",
"transformer.h.9.ln_2.weight": "model-00001-of-00002.safetensors",
"transformer.h.9.mlp.c_fc.bias": "model-00001-of-00002.safetensors",
"transformer.h.9.mlp.c_fc.weight": "model-00001-of-00002.safetensors",
"transformer.h.9.mlp.c_proj.bias": "model-00001-of-00002.safetensors",
"transformer.h.9.mlp.c_proj.weight": "model-00001-of-00002.safetensors",
"transformer.ln_f.bias": "model-00002-of-00002.safetensors",
"transformer.ln_f.weight": "model-00002-of-00002.safetensors",
"transformer.wpe.weight": "model-00001-of-00002.safetensors",
"transformer.wte.weight": "model-00001-of-00002.safetensors"
}
}