zawnpn committed on
Commit
732dd91
·
1 Parent(s): 512e24b
Files changed (3) hide show
  1. README.md +5 -1
  2. config.json +40 -0
  3. model.safetensors +3 -0
README.md CHANGED
@@ -3,4 +3,8 @@ license: mit
3
  library_name: transformers
4
  tags:
5
  - autoencoder
6
- ---
 
 
 
 
 
3
  library_name: transformers
4
  tags:
5
  - autoencoder
6
+ ---
7
+
8
+ This model was converted from the pretrained VQGAN of Meta's [Chameleon](https://huggingface.co/facebook/chameleon-7b) and adapted to our [Being-VL](https://github.com/BeingBeyond/Being-VL-0.5) architecture. This VQGAN model is released under the original [Chameleon license](https://ai.meta.com/resources/models-and-libraries/chameleon-license).
9
+
10
+ To use this model, please refer to the [Being-VL documentation](https://github.com/BeingBeyond/Being-VL-0.5).
config.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "ChameleonVQVAE"
4
+ ],
5
+ "attn_resolutions": [],
6
+ "attn_type": "vanilla",
7
+ "base_channels": 128,
8
+ "ch": 128,
9
+ "ch_mult": [
10
+ 1,
11
+ 1,
12
+ 2,
13
+ 2,
14
+ 4
15
+ ],
16
+ "channel_multiplier": [
17
+ 1,
18
+ 1,
19
+ 2,
20
+ 2,
21
+ 4
22
+ ],
23
+ "double_latent": false,
24
+ "double_z": false,
25
+ "dropout": 0.0,
26
+ "embed_dim": 256,
27
+ "in_channels": 3,
28
+ "initializer_range": 0.02,
29
+ "latent_channels": 256,
30
+ "model_type": "chameleon_vqgan",
31
+ "n_embed": 8192,
32
+ "num_embeddings": 8192,
33
+ "num_res_blocks": 2,
34
+ "out_ch": 3,
35
+ "out_channels": 3,
36
+ "resolution": 512,
37
+ "torch_dtype": "bfloat16",
38
+ "transformers_version": "4.45.0.dev0",
39
+ "z_channels": 256
40
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2b651489d0a1076d51cb81b7afcf107d8352b555119246e14473470fffedbd9
3
+ size 137467246