Feature Extraction
Transformers
clip
vision
Inference Endpoints
kimihailv committed on
Commit
51f9f5d
1 Parent(s): c47f742

Upload torch_config.json

Browse files
Files changed (1) hide show
  1. torch_config.json +26 -0
torch_config.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "text_encoder": {
3
+ "model_type": "bert",
4
+ "dim": 768,
5
+ "context_dim": 768,
6
+ "vocab_size": 30522,
7
+ "padding_idx": 0,
8
+ "num_layers": 4,
9
+ "num_heads": 12,
10
+ "embedding_dim": 256,
11
+ "multimodal_layers_ids": [2, 3],
12
+ "head_one_neuron": false,
13
+ "pooling": "cls",
14
+ "max_position_embeddings": 77,
15
+ "dropout_prob": 0.1
16
+ },
17
+ "image_encoder": {
18
+ "dim": 768,
19
+ "patch_size": 16,
20
+ "image_size": 224,
21
+ "num_layers": 12,
22
+ "num_heads": 12,
23
+ "embedding_dim": 256,
24
+ "pooling": "cls"
25
+ }
26
+ }