File size: 1,350 Bytes
fd45719
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
{
    "aligner_config": {
        "cls": "MlpProjector",
        "model_type": "aligner",
        "params": {
            "depth": 2,
            "input_dim": 1024,
            "n_embed": 2048,
            "projector_type": "mlp_gelu"
        }
    },
    "architectures": [
        "MultiModalityCausalLM"
    ],
    "language_config": {
        "hidden_size": 2048,
        "intermediate_size": 5632,
        "max_position_embeddings": 16384,
        "model_type": "llama",
        "num_attention_heads": 16,
        "num_hidden_layers": 24,
        "num_key_value_heads": 16,
        "torch_dtype": "float16",
        "vocab_size": 102400
    },
    "model_type": "multi_modality",
    "quantization": {
        "group_size": 64,
        "bits": 4
    },
    "torch_dtype": "float16",
    "transformers_version": "4.38.2",
    "vision_config": {
        "cls": "CLIPVisionTower",
        "model_type": "vision",
        "params": {
            "image_size": 384,
            "model_name": "siglip_large_patch16_384",
            "pixel_mean": [
                0.5,
                0.5,
                0.5
            ],
            "pixel_std": [
                0.5,
                0.5,
                0.5
            ],
            "select_feature": "same",
            "select_layer": -1
        },
        "intermediate_size": 4096
    }
}