threeColorFr committed on
Commit
0fb6b45
·
1 Parent(s): 58ea365

Upload 2 files

Browse files
Files changed (2) hide show
  1. latest +1 -0
  2. model_config.json +76 -0
latest ADDED
@@ -0,0 +1 @@
 
 
1
+ 1
model_config.json ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_class": "FineTuneVisualGLMModel",
3
+ "tokenizer_type": "THUDM/chatglm-6b",
4
+ "num_layers": 28,
5
+ "hidden_size": 4096,
6
+ "num_attention_heads": 32,
7
+ "vocab_size": 130528,
8
+ "layernorm_order": "post",
9
+ "model_parallel_size": 1,
10
+ "max_sequence_length": 2048,
11
+ "pre_seq_len": 4,
12
+ "lora_rank": 32,
13
+ "use_ptuning": false,
14
+ "use_lora": true,
15
+ "use_qlora": false,
16
+ "layer_range": [],
17
+ "image_length": 32,
18
+ "eva_args": {
19
+ "num_layers": 39,
20
+ "hidden_size": 1408,
21
+ "num_attention_heads": 16,
22
+ "vocab_size": 1,
23
+ "layernorm_order": "pre",
24
+ "model_parallel_size": 1,
25
+ "max_sequence_length": 257,
26
+ "inner_hidden_size": 6144,
27
+ "use_final_layernorm": false,
28
+ "layernorm_epsilon": 1e-06,
29
+ "image_size": [
30
+ 224,
31
+ 224
32
+ ],
33
+ "pre_len": 1,
34
+ "post_len": 0,
35
+ "in_channels": 3,
36
+ "num_classes": 0,
37
+ "patch_size": 14
38
+ },
39
+ "qformer_args": {
40
+ "num_layers": 12,
41
+ "hidden_size": 768,
42
+ "num_attention_heads": 12,
43
+ "vocab_size": 32,
44
+ "layernorm_order": "post",
45
+ "model_parallel_size": 1,
46
+ "max_sequence_length": 0,
47
+ "is_decoder": [
48
+ true,
49
+ false,
50
+ true,
51
+ false,
52
+ true,
53
+ false,
54
+ true,
55
+ false,
56
+ true,
57
+ false,
58
+ true,
59
+ false
60
+ ],
61
+ "cross_attn_hidden_size": 1408,
62
+ "layernorm_epsilon": 1e-12
63
+ },
64
+ "bos_token_id": 130004,
65
+ "mask_token_id": 130000,
66
+ "gmask_token_id": 130001,
67
+ "pad_token_id": 3,
68
+ "image_size": [
69
+ 224,
70
+ 224
71
+ ],
72
+ "pre_len": 1,
73
+ "post_len": 0,
74
+ "in_channels": 3,
75
+ "patch_size": 14
76
+ }