boris commited on
Commit
dc79278
1 Parent(s): 335110d

feat: update wandb inference

Browse files
dev/inference/samples.txt CHANGED
@@ -1,6 +1,6 @@
1
  white snow covered mountain under blue sky during daytime
2
- aerial view of the beach at night
3
  aerial view of the beach during daytime
 
4
  a beautiful sunset at a beach with a shell on the shore
5
  a farmhouse surrounded by beautiful flowers
6
  a photo of a fantasy version of New York City
@@ -29,6 +29,7 @@ an avocado armchair flying into space
29
  a cute avocado armchair singing karaoke on stage in front of a crowd of strawberry shaped lamps
30
  an illustration of an avocado in a christmas sweater staring at its reflection in a mirror
31
  illustration of an avocado armchair
 
32
  illustration of an avocado armchair getting married to a pineapple
33
  a muscular banana sitting upright on a bench smoking watching a banana on television, high definition photography
34
  Mohammed Ali and Mike Tyson in a hypothetical match
@@ -48,6 +49,8 @@ a dog eating worthlessness
48
  an elephant made of carrots
49
  an elephant on a unicycle during a circus
50
  photography of a penguin watching television
 
 
51
  rat wearing a crown
52
  a portrait of a nightmare creature watching at you
53
  a white room full of a black substance
@@ -66,6 +69,8 @@ Cartoon of a carrot with big eyes
66
  logo of a robot wearing glasses and reading a book
67
  a bottle of coca-cola on a table
68
  a cactus lifting weights
 
 
69
  a living room with two white armchairs and a painting of the collosseum. The painting is mounted above a modern fireplace.
70
  a long line of alternating green and red blocks
71
  a long line of green blocks on a beach at subset
 
1
  white snow covered mountain under blue sky during daytime
 
2
  aerial view of the beach during daytime
3
+ aerial view of the beach at night
4
  a beautiful sunset at a beach with a shell on the shore
5
  a farmhouse surrounded by beautiful flowers
6
  a photo of a fantasy version of New York City
 
29
  a cute avocado armchair singing karaoke on stage in front of a crowd of strawberry shaped lamps
30
  an illustration of an avocado in a christmas sweater staring at its reflection in a mirror
31
  illustration of an avocado armchair
32
+ illustration of an armchair in the shape of an avocado
33
  illustration of an avocado armchair getting married to a pineapple
34
  a muscular banana sitting upright on a bench smoking watching a banana on television, high definition photography
35
  Mohammed Ali and Mike Tyson in a hypothetical match
 
49
  an elephant made of carrots
50
  an elephant on a unicycle during a circus
51
  photography of a penguin watching television
52
+ a penguin is walking on the Moon, Earth is in the background
53
+ a penguin standing on a tower of books holds onto a rope from a helicopter
54
  rat wearing a crown
55
  a portrait of a nightmare creature watching at you
56
  a white room full of a black substance
 
69
  logo of a robot wearing glasses and reading a book
70
  a bottle of coca-cola on a table
71
  a cactus lifting weights
72
+ illustration of a cactus lifting weigths
73
+ logo of a cactus lifting weights
74
  a living room with two white armchairs and a painting of the collosseum. The painting is mounted above a modern fireplace.
75
  a long line of alternating green and red blocks
76
  a long line of green blocks on a beach at subset
dev/inference/wandb-backend.ipynb CHANGED
@@ -47,7 +47,10 @@
47
  "metadata": {},
48
  "outputs": [],
49
  "source": [
50
- "run_ids = ['k76r0v39']\n",
 
 
 
51
  "ENTITY, PROJECT = 'dalle-mini', 'dalle-mini' # used only for training run\n",
52
  "VQGAN_REPO, VQGAN_COMMIT_ID = 'dalle-mini/vqgan_imagenet_f16_16384', None\n",
53
  "normalize_text = True\n",
@@ -115,16 +118,6 @@
115
  " return logits"
116
  ]
117
  },
118
- {
119
- "cell_type": "code",
120
- "execution_count": null,
121
- "id": "ebf4f7bf-2efa-46cc-b3f4-2d7a54f7b2cb",
122
- "metadata": {},
123
- "outputs": [],
124
- "source": [
125
- "clip_params['logit_scale']"
126
- ]
127
- },
128
  {
129
  "cell_type": "code",
130
  "execution_count": null,
@@ -286,7 +279,8 @@
286
  "\n",
287
  " # generate images\n",
288
  " images = []\n",
289
- " for i in tqdm(range(num_images // jax.device_count()), desc='Generating Images'):\n",
 
290
  " key, subkey = jax.random.split(key)\n",
291
  " encoded_images = p_generate(tokenized_prompt, shard_prng_key(subkey), model_params)\n",
292
  " encoded_images = encoded_images.sequences[..., 1:]\n",
@@ -296,7 +290,7 @@
296
  " images.append(Image.fromarray(np.asarray(img * 255, dtype=np.uint8)))\n",
297
  "\n",
298
  " # get clip scores\n",
299
- " print('Calculating CLIP scores')\n",
300
  " clip_inputs = processor(text=batch, images=images, return_tensors='np', padding='max_length', max_length=77, truncation=True).data\n",
301
  " # each shard will have one prompt, images need to be reorganized to be associated to the correct shard\n",
302
  " images_per_prompt_indices = np.asarray(range(0, len(images), batch_size))\n",
 
47
  "metadata": {},
48
  "outputs": [],
49
  "source": [
50
+ "run_ids = ['he9rrc3q']\n",
51
+ "# poorly shuffled 1nj161cl\n",
52
+ "# well shuffled he9rrc3q\n",
53
+ "# non normalized 1fwxpyfh ! requires changing normalize_text\n",
54
  "ENTITY, PROJECT = 'dalle-mini', 'dalle-mini' # used only for training run\n",
55
  "VQGAN_REPO, VQGAN_COMMIT_ID = 'dalle-mini/vqgan_imagenet_f16_16384', None\n",
56
  "normalize_text = True\n",
 
118
  " return logits"
119
  ]
120
  },
 
 
 
 
 
 
 
 
 
 
121
  {
122
  "cell_type": "code",
123
  "execution_count": null,
 
279
  "\n",
280
  " # generate images\n",
281
  " images = []\n",
282
+ " pbar = tqdm(range(num_images // jax.device_count()), desc='Generating Images', leave=None)\n",
283
+ " for i in pbar:\n",
284
  " key, subkey = jax.random.split(key)\n",
285
  " encoded_images = p_generate(tokenized_prompt, shard_prng_key(subkey), model_params)\n",
286
  " encoded_images = encoded_images.sequences[..., 1:]\n",
 
290
  " images.append(Image.fromarray(np.asarray(img * 255, dtype=np.uint8)))\n",
291
  "\n",
292
  " # get clip scores\n",
293
+ " pbar.set_description('Calculating CLIP scores')\n",
294
  " clip_inputs = processor(text=batch, images=images, return_tensors='np', padding='max_length', max_length=77, truncation=True).data\n",
295
  " # each shard will have one prompt, images need to be reorganized to be associated to the correct shard\n",
296
  " images_per_prompt_indices = np.asarray(range(0, len(images), batch_size))\n",