Update model
Browse files
- config.json +8 -4
config.json
CHANGED
@@ -9,7 +9,6 @@
|
|
9 |
"d_latents": 1024,
|
10 |
"d_model": 261,
|
11 |
"hidden_act": "gelu",
|
12 |
-
"hidden_dropout_prob": 0.1,
|
13 |
"id2label": {
|
14 |
"0": "tench, Tinca tinca",
|
15 |
"1": "goldfish, Carassius auratus",
|
@@ -2016,6 +2015,7 @@
|
|
2016 |
"zucchini, courgette": 939
|
2017 |
},
|
2018 |
"layer_norm_eps": 1e-12,
|
|
|
2019 |
"model_type": "perceiver",
|
2020 |
"num_blocks": 8,
|
2021 |
"num_cross_attention_heads": 1,
|
@@ -2023,17 +2023,21 @@
|
|
2023 |
"num_latents": 512,
|
2024 |
"num_self_attends_per_block": 6,
|
2025 |
"num_self_attention_heads": 8,
|
2026 |
-
"
|
|
|
|
|
|
|
|
|
|
|
2027 |
"qk_channels": null,
|
2028 |
"samples_per_patch": 16,
|
2029 |
"self_attention_widening_factor": 1,
|
2030 |
-
"seq_len": 2048,
|
2031 |
"torch_dtype": "float32",
|
2032 |
"train_size": [
|
2033 |
368,
|
2034 |
496
|
2035 |
],
|
2036 |
-
"transformers_version": "4.…",
|
2037 |
"use_query_residual": true,
|
2038 |
"v_channels": null,
|
2039 |
"vocab_size": 262
|
|
|
9 |
"d_latents": 1024,
|
10 |
"d_model": 261,
|
11 |
"hidden_act": "gelu",
|
|
|
12 |
"id2label": {
|
13 |
"0": "tench, Tinca tinca",
|
14 |
"1": "goldfish, Carassius auratus",
|
|
|
2015 |
"zucchini, courgette": 939
|
2016 |
},
|
2017 |
"layer_norm_eps": 1e-12,
|
2018 |
+
"max_position_embeddings": 2048,
|
2019 |
"model_type": "perceiver",
|
2020 |
"num_blocks": 8,
|
2021 |
"num_cross_attention_heads": 1,
|
|
|
2023 |
"num_latents": 512,
|
2024 |
"num_self_attends_per_block": 6,
|
2025 |
"num_self_attention_heads": 8,
|
2026 |
+
"output_shape": [
|
2027 |
+
1,
|
2028 |
+
16,
|
2029 |
+
224,
|
2030 |
+
224
|
2031 |
+
],
|
2032 |
"qk_channels": null,
|
2033 |
"samples_per_patch": 16,
|
2034 |
"self_attention_widening_factor": 1,
|
|
|
2035 |
"torch_dtype": "float32",
|
2036 |
"train_size": [
|
2037 |
368,
|
2038 |
496
|
2039 |
],
|
2040 |
+
"transformers_version": "4.12.0.dev0",
|
2041 |
"use_query_residual": true,
|
2042 |
"v_channels": null,
|
2043 |
"vocab_size": 262
|