nielsr HF staff committed on
Commit
f19dc2a
1 Parent(s): 8c4f501

Update P model

Browse files
Files changed (1) hide show
  1. config.json +12 -4
config.json CHANGED
@@ -3,12 +3,12 @@
3
  "PerceiverForImageClassification"
4
  ],
5
  "attention_probs_dropout_prob": 0.1,
 
6
  "cross_attention_shape_for_attention": "kv",
7
  "cross_attention_widening_factor": 1,
8
  "d_latents": 1024,
9
  "d_model": 512,
10
  "hidden_act": "gelu",
11
- "hidden_dropout_prob": 0.1,
12
  "id2label": {
13
  "0": "tench, Tinca tinca",
14
  "1": "goldfish, Carassius auratus",
@@ -1011,6 +1011,7 @@
1011
  "998": "ear, spike, capitulum",
1012
  "999": "toilet tissue, toilet paper, bathroom tissue"
1013
  },
 
1014
  "initializer_range": 0.02,
1015
  "label2id": {
1016
  "Afghan hound, Afghan": 160,
@@ -2014,22 +2015,29 @@
2014
  "zucchini, courgette": 939
2015
  },
2016
  "layer_norm_eps": 1e-12,
 
2017
  "model_type": "perceiver",
2018
  "num_blocks": 8,
2019
  "num_cross_attention_heads": 1,
 
2020
  "num_latents": 512,
2021
  "num_self_attends_per_block": 6,
2022
  "num_self_attention_heads": 8,
2023
- "position_embedding_init_scale": 0.02,
 
 
 
 
 
2024
  "qk_channels": null,
 
2025
  "self_attention_widening_factor": 1,
2026
- "seq_len": 2048,
2027
  "torch_dtype": "float32",
2028
  "train_size": [
2029
  368,
2030
  496
2031
  ],
2032
- "transformers_version": "4.11.0.dev0",
2033
  "use_query_residual": true,
2034
  "v_channels": null,
2035
  "vocab_size": 262
 
3
  "PerceiverForImageClassification"
4
  ],
5
  "attention_probs_dropout_prob": 0.1,
6
+ "audio_samples_per_frame": 1920,
7
  "cross_attention_shape_for_attention": "kv",
8
  "cross_attention_widening_factor": 1,
9
  "d_latents": 1024,
10
  "d_model": 512,
11
  "hidden_act": "gelu",
 
12
  "id2label": {
13
  "0": "tench, Tinca tinca",
14
  "1": "goldfish, Carassius auratus",
 
1011
  "998": "ear, spike, capitulum",
1012
  "999": "toilet tissue, toilet paper, bathroom tissue"
1013
  },
1014
+ "image_size": 224,
1015
  "initializer_range": 0.02,
1016
  "label2id": {
1017
  "Afghan hound, Afghan": 160,
 
2015
  "zucchini, courgette": 939
2016
  },
2017
  "layer_norm_eps": 1e-12,
2018
+ "max_position_embeddings": 2048,
2019
  "model_type": "perceiver",
2020
  "num_blocks": 8,
2021
  "num_cross_attention_heads": 1,
2022
+ "num_frames": 16,
2023
  "num_latents": 512,
2024
  "num_self_attends_per_block": 6,
2025
  "num_self_attention_heads": 8,
2026
+ "output_shape": [
2027
+ 1,
2028
+ 16,
2029
+ 224,
2030
+ 224
2031
+ ],
2032
  "qk_channels": null,
2033
+ "samples_per_patch": 16,
2034
  "self_attention_widening_factor": 1,
 
2035
  "torch_dtype": "float32",
2036
  "train_size": [
2037
  368,
2038
  496
2039
  ],
2040
+ "transformers_version": "4.12.0.dev0",
2041
  "use_query_residual": true,
2042
  "v_channels": null,
2043
  "vocab_size": 262