dg845 committed on
Commit
ef5d074
1 Parent(s): 15a8e39

Upload 22 files

Browse files

Update UniDiffuser-v1 small random testing checkpoint (rename image_processor to clip_image_processor)

clip_image_processor/preprocessor_config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "crop_size": {
3
+ "height": 32,
4
+ "width": 32
5
+ },
6
+ "do_center_crop": true,
7
+ "do_convert_rgb": true,
8
+ "do_normalize": true,
9
+ "do_rescale": true,
10
+ "do_resize": true,
11
+ "image_mean": [
12
+ 0.48145466,
13
+ 0.4578275,
14
+ 0.40821073
15
+ ],
16
+ "image_processor_type": "CLIPImageProcessor",
17
+ "image_std": [
18
+ 0.26862954,
19
+ 0.26130258,
20
+ 0.27577711
21
+ ],
22
+ "resample": 3,
23
+ "rescale_factor": 0.00392156862745098,
24
+ "size": {
25
+ "shortest_edge": 32
26
+ }
27
+ }
clip_tokenizer/tokenizer_config.json CHANGED
@@ -8,6 +8,7 @@
8
  "rstrip": false,
9
  "single_word": false
10
  },
 
11
  "do_lower_case": true,
12
  "eos_token": {
13
  "__type": "AddedToken",
@@ -19,9 +20,7 @@
19
  },
20
  "errors": "replace",
21
  "model_max_length": 77,
22
- "name_or_path": "hf-internal-testing/tiny-random-clip",
23
  "pad_token": "<|endoftext|>",
24
- "special_tokens_map_file": "/home/lysandre/.cache/huggingface/transformers/18a566598f286c9139f88160c99f84eec492a26bd22738fa9cb44d5b7e0a5c76.cce1206abbad28826f000510f22f354e53e66a97f7c23745a7dfe27609cc07f5",
25
  "tokenizer_class": "CLIPTokenizer",
26
  "unk_token": {
27
  "__type": "AddedToken",
 
8
  "rstrip": false,
9
  "single_word": false
10
  },
11
+ "clean_up_tokenization_spaces": true,
12
  "do_lower_case": true,
13
  "eos_token": {
14
  "__type": "AddedToken",
 
20
  },
21
  "errors": "replace",
22
  "model_max_length": 77,
 
23
  "pad_token": "<|endoftext|>",
 
24
  "tokenizer_class": "CLIPTokenizer",
25
  "unk_token": {
26
  "__type": "AddedToken",
image_encoder/config.json CHANGED
@@ -18,5 +18,5 @@
18
  "patch_size": 2,
19
  "projection_dim": 32,
20
  "torch_dtype": "float32",
21
- "transformers_version": "4.26.1"
22
  }
 
18
  "patch_size": 2,
19
  "projection_dim": 32,
20
  "torch_dtype": "float32",
21
+ "transformers_version": "4.29.1"
22
  }
model_index.json CHANGED
@@ -1,6 +1,10 @@
1
  {
2
  "_class_name": "UniDiffuserPipeline",
3
- "_diffusers_version": "0.17.0.dev0",
 
 
 
 
4
  "clip_tokenizer": [
5
  "transformers",
6
  "CLIPTokenizer"
@@ -9,10 +13,6 @@
9
  "transformers",
10
  "CLIPVisionModelWithProjection"
11
  ],
12
- "image_processor": [
13
- "transformers",
14
- "CLIPImageProcessor"
15
- ],
16
  "scheduler": [
17
  "diffusers",
18
  "DPMSolverMultistepScheduler"
 
1
  {
2
  "_class_name": "UniDiffuserPipeline",
3
+ "_diffusers_version": "0.21.0.dev0",
4
+ "clip_image_processor": [
5
+ "transformers",
6
+ "CLIPImageProcessor"
7
+ ],
8
  "clip_tokenizer": [
9
  "transformers",
10
  "CLIPTokenizer"
 
13
  "transformers",
14
  "CLIPVisionModelWithProjection"
15
  ],
 
 
 
 
16
  "scheduler": [
17
  "diffusers",
18
  "DPMSolverMultistepScheduler"
scheduler/scheduler_config.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "_class_name": "DPMSolverMultistepScheduler",
3
- "_diffusers_version": "0.17.0.dev0",
4
  "algorithm_type": "dpmsolver++",
5
  "beta_end": 0.012,
6
  "beta_schedule": "scaled_linear",
@@ -13,7 +13,9 @@
13
  "sample_max_value": 1.0,
14
  "solver_order": 3,
15
  "solver_type": "midpoint",
 
16
  "thresholding": false,
 
17
  "trained_betas": null,
18
  "use_karras_sigmas": false,
19
  "variance_type": null
 
1
  {
2
  "_class_name": "DPMSolverMultistepScheduler",
3
+ "_diffusers_version": "0.21.0.dev0",
4
  "algorithm_type": "dpmsolver++",
5
  "beta_end": 0.012,
6
  "beta_schedule": "scaled_linear",
 
13
  "sample_max_value": 1.0,
14
  "solver_order": 3,
15
  "solver_type": "midpoint",
16
+ "steps_offset": 0,
17
  "thresholding": false,
18
+ "timestep_spacing": "linspace",
19
  "trained_betas": null,
20
  "use_karras_sigmas": false,
21
  "variance_type": null
text_decoder/config.json CHANGED
@@ -1,7 +1,6 @@
1
  {
2
  "_class_name": "UniDiffuserTextDecoder",
3
- "_diffusers_version": "0.15.0.dev0",
4
- "_name_or_path": "/home/tamamo/scratch/unidiffuser_test/text_decoder",
5
  "activation_function": "gelu",
6
  "attn_pdrop": 0.1,
7
  "embd_pdrop": 0.1,
 
1
  {
2
  "_class_name": "UniDiffuserTextDecoder",
3
+ "_diffusers_version": "0.21.0.dev0",
 
4
  "activation_function": "gelu",
5
  "attn_pdrop": 0.1,
6
  "embd_pdrop": 0.1,
text_decoder/diffusion_pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8a67163f549e069e9350a75409d34a5ffc4cd7608e6569e6458539db7d60dc7e
3
  size 5679611
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45fc49f24560aab4103739b7d196548121f1a91f9ecaa603d6a97afb6bcc1bbc
3
  size 5679611
text_encoder/config.json CHANGED
@@ -4,7 +4,6 @@
4
  ],
5
  "attention_dropout": 0.0,
6
  "bos_token_id": 0,
7
- "dropout": 0.0,
8
  "eos_token_id": 2,
9
  "hidden_act": "quick_gelu",
10
  "hidden_size": 32,
@@ -19,6 +18,6 @@
19
  "pad_token_id": 1,
20
  "projection_dim": 512,
21
  "torch_dtype": "float32",
22
- "transformers_version": "4.26.1",
23
  "vocab_size": 1000
24
  }
 
4
  ],
5
  "attention_dropout": 0.0,
6
  "bos_token_id": 0,
 
7
  "eos_token_id": 2,
8
  "hidden_act": "quick_gelu",
9
  "hidden_size": 32,
 
18
  "pad_token_id": 1,
19
  "projection_dim": 512,
20
  "torch_dtype": "float32",
21
+ "transformers_version": "4.29.1",
22
  "vocab_size": 1000
23
  }
text_tokenizer/tokenizer_config.json CHANGED
@@ -9,6 +9,7 @@
9
  "rstrip": false,
10
  "single_word": false
11
  },
 
12
  "eos_token": {
13
  "__type": "AddedToken",
14
  "content": "<|endoftext|>",
@@ -19,9 +20,7 @@
19
  },
20
  "errors": "replace",
21
  "model_max_length": 512,
22
- "name_or_path": "/home/tamamo/code/unidiffuser/models/new_gpt_tokenizer",
23
  "pad_token": null,
24
- "special_tokens_map_file": null,
25
  "tokenizer_class": "GPT2Tokenizer",
26
  "unk_token": {
27
  "__type": "AddedToken",
 
9
  "rstrip": false,
10
  "single_word": false
11
  },
12
+ "clean_up_tokenization_spaces": true,
13
  "eos_token": {
14
  "__type": "AddedToken",
15
  "content": "<|endoftext|>",
 
20
  },
21
  "errors": "replace",
22
  "model_max_length": 512,
 
23
  "pad_token": null,
 
24
  "tokenizer_class": "GPT2Tokenizer",
25
  "unk_token": {
26
  "__type": "AddedToken",
unet/config.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "_class_name": "UniDiffuserModel",
3
- "_diffusers_version": "0.17.0.dev0",
4
  "activation_fn": "gelu",
5
  "attention_bias": false,
6
  "attention_head_dim": 8,
 
1
  {
2
  "_class_name": "UniDiffuserModel",
3
+ "_diffusers_version": "0.21.0.dev0",
4
  "activation_fn": "gelu",
5
  "attention_bias": false,
6
  "attention_head_dim": 8,
unet/diffusion_pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c3fb581fccee180478248760437f443b16aca837a3bf1b02ebd0803baa565f48
3
- size 87467
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff85fcccea0e13b2091802eb2f1fab9828cdb8580c346822c020a1c3765b1078
3
+ size 87531
vae/config.json CHANGED
@@ -1,7 +1,6 @@
1
  {
2
  "_class_name": "AutoencoderKL",
3
- "_diffusers_version": "0.15.0.dev0",
4
- "_name_or_path": "/home/tamamo/scratch/unidiffuser_test/vae",
5
  "act_fn": "silu",
6
  "block_out_channels": [
7
  32,
@@ -11,6 +10,7 @@
11
  "DownEncoderBlock2D",
12
  "DownEncoderBlock2D"
13
  ],
 
14
  "in_channels": 3,
15
  "latent_channels": 4,
16
  "layers_per_block": 1,
 
1
  {
2
  "_class_name": "AutoencoderKL",
3
+ "_diffusers_version": "0.21.0.dev0",
 
4
  "act_fn": "silu",
5
  "block_out_channels": [
6
  32,
 
10
  "DownEncoderBlock2D",
11
  "DownEncoderBlock2D"
12
  ],
13
+ "force_upcast": true,
14
  "in_channels": 3,
15
  "latent_channels": 4,
16
  "layers_per_block": 1,
vae/diffusion_pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c72dcad38b28b1a0c043f0e0063feb9e303782f7898c6167af3a5652ecbc1cb5
3
- size 2680745
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e84bb0d30f9de5f723541259119fa2702639a8c73465fe8263085739154eff9f
3
+ size 2681001