Image-Text-to-Text
Transformers
Safetensors
English
idefics2
pretraining
multimodal
vision
Inference Endpoints
5 papers
amyeroberts HF staff committed on
Commit
bc364a7
1 Parent(s): 3392312

Upload folder using huggingface_hub

Browse files
generation_config.json CHANGED
@@ -2,7 +2,7 @@
2
  "_from_model_config": true,
3
  "bad_words_ids": [[32000], [32001]],
4
  "bos_token_id": 1,
5
- "eos_token_id": [2, 32002],
6
  "pad_token_id": 0,
7
  "transformers_version": "4.39.0.dev0"
8
  }
 
2
  "_from_model_config": true,
3
  "bad_words_ids": [[32000], [32001]],
4
  "bos_token_id": 1,
5
+ "eos_token_id": 2,
6
  "pad_token_id": 0,
7
  "transformers_version": "4.39.0.dev0"
8
  }
model-00001-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3e22bce3bf26ed85382d419b6484210f95dd82c1c74ab49e5be3c4dd4fc56399
3
- size 4644107280
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09856b75a67fbe0ee15190901f7bd9a14ddadeedb73a47fa05bde0c3952c3266
3
+ size 4644107632
model.safetensors.index.json CHANGED
@@ -4,41 +4,41 @@
4
  },
5
  "weight_map": {
6
  "lm_head.weight": "model-00007-of-00007.safetensors",
7
- "model.modality_projection.down_proj.weight": "model-00001-of-00007.safetensors",
8
- "model.modality_projection.gate_proj.weight": "model-00001-of-00007.safetensors",
9
- "model.modality_projection.up_proj.weight": "model-00001-of-00007.safetensors",
10
- "model.perceiver_resampler.latents": "model-00001-of-00007.safetensors",
11
- "model.perceiver_resampler.layers.0.input_context_norm.weight": "model-00001-of-00007.safetensors",
12
- "model.perceiver_resampler.layers.0.input_latents_norm.weight": "model-00001-of-00007.safetensors",
13
- "model.perceiver_resampler.layers.0.mlp.down_proj.weight": "model-00001-of-00007.safetensors",
14
- "model.perceiver_resampler.layers.0.mlp.gate_proj.weight": "model-00001-of-00007.safetensors",
15
- "model.perceiver_resampler.layers.0.mlp.up_proj.weight": "model-00001-of-00007.safetensors",
16
- "model.perceiver_resampler.layers.0.post_attention_layernorm.weight": "model-00001-of-00007.safetensors",
17
- "model.perceiver_resampler.layers.0.self_attn.k_proj.weight": "model-00001-of-00007.safetensors",
18
- "model.perceiver_resampler.layers.0.self_attn.o_proj.weight": "model-00001-of-00007.safetensors",
19
- "model.perceiver_resampler.layers.0.self_attn.q_proj.weight": "model-00001-of-00007.safetensors",
20
- "model.perceiver_resampler.layers.0.self_attn.v_proj.weight": "model-00001-of-00007.safetensors",
21
- "model.perceiver_resampler.layers.1.input_context_norm.weight": "model-00001-of-00007.safetensors",
22
- "model.perceiver_resampler.layers.1.input_latents_norm.weight": "model-00001-of-00007.safetensors",
23
- "model.perceiver_resampler.layers.1.mlp.down_proj.weight": "model-00001-of-00007.safetensors",
24
- "model.perceiver_resampler.layers.1.mlp.gate_proj.weight": "model-00001-of-00007.safetensors",
25
- "model.perceiver_resampler.layers.1.mlp.up_proj.weight": "model-00001-of-00007.safetensors",
26
- "model.perceiver_resampler.layers.1.post_attention_layernorm.weight": "model-00001-of-00007.safetensors",
27
- "model.perceiver_resampler.layers.1.self_attn.k_proj.weight": "model-00001-of-00007.safetensors",
28
- "model.perceiver_resampler.layers.1.self_attn.o_proj.weight": "model-00001-of-00007.safetensors",
29
- "model.perceiver_resampler.layers.1.self_attn.q_proj.weight": "model-00001-of-00007.safetensors",
30
- "model.perceiver_resampler.layers.1.self_attn.v_proj.weight": "model-00001-of-00007.safetensors",
31
- "model.perceiver_resampler.layers.2.input_context_norm.weight": "model-00001-of-00007.safetensors",
32
- "model.perceiver_resampler.layers.2.input_latents_norm.weight": "model-00001-of-00007.safetensors",
33
- "model.perceiver_resampler.layers.2.mlp.down_proj.weight": "model-00001-of-00007.safetensors",
34
- "model.perceiver_resampler.layers.2.mlp.gate_proj.weight": "model-00001-of-00007.safetensors",
35
- "model.perceiver_resampler.layers.2.mlp.up_proj.weight": "model-00001-of-00007.safetensors",
36
- "model.perceiver_resampler.layers.2.post_attention_layernorm.weight": "model-00001-of-00007.safetensors",
37
- "model.perceiver_resampler.layers.2.self_attn.k_proj.weight": "model-00001-of-00007.safetensors",
38
- "model.perceiver_resampler.layers.2.self_attn.o_proj.weight": "model-00001-of-00007.safetensors",
39
- "model.perceiver_resampler.layers.2.self_attn.q_proj.weight": "model-00001-of-00007.safetensors",
40
- "model.perceiver_resampler.layers.2.self_attn.v_proj.weight": "model-00001-of-00007.safetensors",
41
- "model.perceiver_resampler.norm.weight": "model-00001-of-00007.safetensors",
42
  "model.text_model.embed_tokens.weight": "model-00002-of-00007.safetensors",
43
  "model.text_model.layers.0.input_layernorm.weight": "model-00002-of-00007.safetensors",
44
  "model.text_model.layers.0.mlp.down_proj.weight": "model-00002-of-00007.safetensors",
 
4
  },
5
  "weight_map": {
6
  "lm_head.weight": "model-00007-of-00007.safetensors",
7
+ "model.connector.modality_projection.down_proj.weight": "model-00001-of-00007.safetensors",
8
+ "model.connector.modality_projection.gate_proj.weight": "model-00001-of-00007.safetensors",
9
+ "model.connector.modality_projection.up_proj.weight": "model-00001-of-00007.safetensors",
10
+ "model.connector.perceiver_resampler.latents": "model-00001-of-00007.safetensors",
11
+ "model.connector.perceiver_resampler.layers.0.input_context_norm.weight": "model-00001-of-00007.safetensors",
12
+ "model.connector.perceiver_resampler.layers.0.input_latents_norm.weight": "model-00001-of-00007.safetensors",
13
+ "model.connector.perceiver_resampler.layers.0.mlp.down_proj.weight": "model-00001-of-00007.safetensors",
14
+ "model.connector.perceiver_resampler.layers.0.mlp.gate_proj.weight": "model-00001-of-00007.safetensors",
15
+ "model.connector.perceiver_resampler.layers.0.mlp.up_proj.weight": "model-00001-of-00007.safetensors",
16
+ "model.connector.perceiver_resampler.layers.0.post_attention_layernorm.weight": "model-00001-of-00007.safetensors",
17
+ "model.connector.perceiver_resampler.layers.0.self_attn.k_proj.weight": "model-00001-of-00007.safetensors",
18
+ "model.connector.perceiver_resampler.layers.0.self_attn.o_proj.weight": "model-00001-of-00007.safetensors",
19
+ "model.connector.perceiver_resampler.layers.0.self_attn.q_proj.weight": "model-00001-of-00007.safetensors",
20
+ "model.connector.perceiver_resampler.layers.0.self_attn.v_proj.weight": "model-00001-of-00007.safetensors",
21
+ "model.connector.perceiver_resampler.layers.1.input_context_norm.weight": "model-00001-of-00007.safetensors",
22
+ "model.connector.perceiver_resampler.layers.1.input_latents_norm.weight": "model-00001-of-00007.safetensors",
23
+ "model.connector.perceiver_resampler.layers.1.mlp.down_proj.weight": "model-00001-of-00007.safetensors",
24
+ "model.connector.perceiver_resampler.layers.1.mlp.gate_proj.weight": "model-00001-of-00007.safetensors",
25
+ "model.connector.perceiver_resampler.layers.1.mlp.up_proj.weight": "model-00001-of-00007.safetensors",
26
+ "model.connector.perceiver_resampler.layers.1.post_attention_layernorm.weight": "model-00001-of-00007.safetensors",
27
+ "model.connector.perceiver_resampler.layers.1.self_attn.k_proj.weight": "model-00001-of-00007.safetensors",
28
+ "model.connector.perceiver_resampler.layers.1.self_attn.o_proj.weight": "model-00001-of-00007.safetensors",
29
+ "model.connector.perceiver_resampler.layers.1.self_attn.q_proj.weight": "model-00001-of-00007.safetensors",
30
+ "model.connector.perceiver_resampler.layers.1.self_attn.v_proj.weight": "model-00001-of-00007.safetensors",
31
+ "model.connector.perceiver_resampler.layers.2.input_context_norm.weight": "model-00001-of-00007.safetensors",
32
+ "model.connector.perceiver_resampler.layers.2.input_latents_norm.weight": "model-00001-of-00007.safetensors",
33
+ "model.connector.perceiver_resampler.layers.2.mlp.down_proj.weight": "model-00001-of-00007.safetensors",
34
+ "model.connector.perceiver_resampler.layers.2.mlp.gate_proj.weight": "model-00001-of-00007.safetensors",
35
+ "model.connector.perceiver_resampler.layers.2.mlp.up_proj.weight": "model-00001-of-00007.safetensors",
36
+ "model.connector.perceiver_resampler.layers.2.post_attention_layernorm.weight": "model-00001-of-00007.safetensors",
37
+ "model.connector.perceiver_resampler.layers.2.self_attn.k_proj.weight": "model-00001-of-00007.safetensors",
38
+ "model.connector.perceiver_resampler.layers.2.self_attn.o_proj.weight": "model-00001-of-00007.safetensors",
39
+ "model.connector.perceiver_resampler.layers.2.self_attn.q_proj.weight": "model-00001-of-00007.safetensors",
40
+ "model.connector.perceiver_resampler.layers.2.self_attn.v_proj.weight": "model-00001-of-00007.safetensors",
41
+ "model.connector.perceiver_resampler.norm.weight": "model-00001-of-00007.safetensors",
42
  "model.text_model.embed_tokens.weight": "model-00002-of-00007.safetensors",
43
  "model.text_model.layers.0.input_layernorm.weight": "model-00002-of-00007.safetensors",
44
  "model.text_model.layers.0.mlp.down_proj.weight": "model-00002-of-00007.safetensors",