DongfuJiang commited on
Commit
a952753
1 Parent(s): 5854fc5
Files changed (2) hide show
  1. examples/all_subsets.json +45 -15
  2. examples/test.ipynb +34 -14
examples/all_subsets.json CHANGED
@@ -36,7 +36,9 @@
36
  "from": "gpt",
37
  "value": "visual quality: 3\n object consistency: 3\n dynamic degree: 3\n motion smoothness: 3\n text-to-video alignment: 3\n factual consistency: 3\n overall score: 3\n"
38
  }
39
- ]
 
 
40
  },
41
  {
42
  "id": "real_r100916",
@@ -67,7 +69,9 @@
67
  "from": "gpt",
68
  "value": "visual quality: 3\n object consistency: 3\n dynamic degree: 3\n motion smoothness: 3\n text-to-video alignment: 3\n factual consistency: 3\n overall score: 3\n"
69
  }
70
- ]
 
 
71
  },
72
  {
73
  "id": "real_r004061",
@@ -106,7 +110,9 @@
106
  "from": "gpt",
107
  "value": "visual quality: 3\n object consistency: 3\n dynamic degree: 3\n motion smoothness: 3\n text-to-video alignment: 3\n factual consistency: 3\n overall score: 3\n"
108
  }
109
- ]
 
 
110
  },
111
  {
112
  "id": "worsen_gen_b404675",
@@ -137,7 +143,9 @@
137
  "from": "gpt",
138
  "value": "visual quality: 1\n object consistency: 1\n dynamic degree: 3\n motion smoothness: 3\n text-to-video alignment: 2\n factual consistency: 3\n overall score: 1\n"
139
  }
140
- ]
 
 
141
  },
142
  {
143
  "id": "worsen_gen_b402727",
@@ -168,7 +176,9 @@
168
  "from": "gpt",
169
  "value": "visual quality: 1\n object consistency: 1\n dynamic degree: 3\n motion smoothness: 3\n text-to-video alignment: 3\n factual consistency: 3\n overall score: 1\n"
170
  }
171
- ]
 
 
172
  },
173
  {
174
  "id": "worsen_gen_b304986",
@@ -199,7 +209,9 @@
199
  "from": "gpt",
200
  "value": "visual quality: 3\n object consistency: 1\n dynamic degree: 3\n motion smoothness: 1\n text-to-video alignment: 2\n factual consistency: 3\n overall score: 1\n"
201
  }
202
- ]
 
 
203
  },
204
  {
205
  "id": "static_d500937",
@@ -230,7 +242,9 @@
230
  "from": "gpt",
231
  "value": "visual quality: 1\n object consistency: 3\n dynamic degree: 1\n motion smoothness: 1\n text-to-video alignment: 1\n factual consistency: 1\n overall score: 1\n"
232
  }
233
- ]
 
 
234
  },
235
  {
236
  "id": "static_d500506",
@@ -261,7 +275,9 @@
261
  "from": "gpt",
262
  "value": "visual quality: 1\n object consistency: 3\n dynamic degree: 1\n motion smoothness: 1\n text-to-video alignment: 1\n factual consistency: 1\n overall score: 1\n"
263
  }
264
- ]
 
 
265
  },
266
  {
267
  "id": "static_d401950",
@@ -292,7 +308,9 @@
292
  "from": "gpt",
293
  "value": "visual quality: 1\n object consistency: 3\n dynamic degree: 1\n motion smoothness: 1\n text-to-video alignment: 1\n factual consistency: 1\n overall score: 1\n"
294
  }
295
- ]
 
 
296
  },
297
  {
298
  "id": "insf_a500251",
@@ -323,7 +341,9 @@
323
  "from": "gpt",
324
  "value": "visual quality: 1\n object consistency: 1\n dynamic degree: 3\n motion smoothness: 1\n text-to-video alignment: 1\n factual consistency: 1\n overall score: 1\n"
325
  }
326
- ]
 
 
327
  },
328
  {
329
  "id": "insf_a400480",
@@ -354,7 +374,9 @@
354
  "from": "gpt",
355
  "value": "visual quality: 1\n object consistency: 1\n dynamic degree: 3\n motion smoothness: 1\n text-to-video alignment: 1\n factual consistency: 1\n overall score: 1\n"
356
  }
357
- ]
 
 
358
  },
359
  {
360
  "id": "insf_a500010",
@@ -385,7 +407,9 @@
385
  "from": "gpt",
386
  "value": "visual quality: 1\n object consistency: 1\n dynamic degree: 3\n motion smoothness: 1\n text-to-video alignment: 1\n factual consistency: 1\n overall score: 1\n"
387
  }
388
- ]
 
 
389
  },
390
  {
391
  "id": "lab_3005033",
@@ -416,7 +440,9 @@
416
  "from": "gpt",
417
  "value": "visual quality: 3\n object consistency: 2\n dynamic degree: 3\n motion smoothness: 2\n text-to-video alignment: 2\n factual consistency: 3\n overall score: 2\n"
418
  }
419
- ]
 
 
420
  },
421
  {
422
  "id": "lab_7004180",
@@ -439,7 +465,9 @@
439
  "from": "gpt",
440
  "value": "visual quality: 3\n object consistency: 3\n dynamic degree: 3\n motion smoothness: 3\n text-to-video alignment: 3\n factual consistency: 3\n overall score: 3\n"
441
  }
442
- ]
 
 
443
  },
444
  {
445
  "id": "lab_1006309",
@@ -470,6 +498,8 @@
470
  "from": "gpt",
471
  "value": "visual quality: 3\n object consistency: 2\n dynamic degree: 3\n motion smoothness: 2\n text-to-video alignment: 3\n factual consistency: 2\n overall score: 3\n"
472
  }
473
- ]
 
 
474
  }
475
  ]
 
36
  "from": "gpt",
37
  "value": "visual quality: 3\n object consistency: 3\n dynamic degree: 3\n motion smoothness: 3\n text-to-video alignment: 3\n factual consistency: 3\n overall score: 3\n"
38
  }
39
+ ],
40
+ "video": "r003679.mp4",
41
+ "prompt": "dog rolls over and falls off couch"
42
  },
43
  {
44
  "id": "real_r100916",
 
69
  "from": "gpt",
70
  "value": "visual quality: 3\n object consistency: 3\n dynamic degree: 3\n motion smoothness: 3\n text-to-video alignment: 3\n factual consistency: 3\n overall score: 3\n"
71
  }
72
+ ],
73
+ "video": "r100916.mp4",
74
+ "prompt": "A young man is standing in front of a glacier with mountains in the background."
75
  },
76
  {
77
  "id": "real_r004061",
 
110
  "from": "gpt",
111
  "value": "visual quality: 3\n object consistency: 3\n dynamic degree: 3\n motion smoothness: 3\n text-to-video alignment: 3\n factual consistency: 3\n overall score: 3\n"
112
  }
113
+ ],
114
+ "video": "r004061.mp4",
115
+ "prompt": "a man wearing a striped blanket over his backpack runs behind two other men."
116
  },
117
  {
118
  "id": "worsen_gen_b404675",
 
143
  "from": "gpt",
144
  "value": "visual quality: 1\n object consistency: 1\n dynamic degree: 3\n motion smoothness: 3\n text-to-video alignment: 2\n factual consistency: 3\n overall score: 1\n"
145
  }
146
+ ],
147
+ "video": "b404675.mp4",
148
+ "prompt": "After a few years, Ghulam Muhammad became the owner of his business"
149
  },
150
  {
151
  "id": "worsen_gen_b402727",
 
176
  "from": "gpt",
177
  "value": "visual quality: 1\n object consistency: 1\n dynamic degree: 3\n motion smoothness: 3\n text-to-video alignment: 3\n factual consistency: 3\n overall score: 1\n"
178
  }
179
+ ],
180
+ "video": "b402727.mp4",
181
+ "prompt": "view down to the path in the field, moving forward, night, dark."
182
  },
183
  {
184
  "id": "worsen_gen_b304986",
 
209
  "from": "gpt",
210
  "value": "visual quality: 3\n object consistency: 1\n dynamic degree: 3\n motion smoothness: 1\n text-to-video alignment: 2\n factual consistency: 3\n overall score: 1\n"
211
  }
212
+ ],
213
+ "video": "b304986.mp4",
214
+ "prompt": "Old Philippino man, close up, subtle smile, teats of joy, in old wood room"
215
  },
216
  {
217
  "id": "static_d500937",
 
242
  "from": "gpt",
243
  "value": "visual quality: 1\n object consistency: 3\n dynamic degree: 1\n motion smoothness: 1\n text-to-video alignment: 1\n factual consistency: 1\n overall score: 1\n"
244
  }
245
+ ],
246
+ "video": "d500937.mp4",
247
+ "prompt": "write y in the garden with flowers"
248
  },
249
  {
250
  "id": "static_d500506",
 
275
  "from": "gpt",
276
  "value": "visual quality: 1\n object consistency: 3\n dynamic degree: 1\n motion smoothness: 1\n text-to-video alignment: 1\n factual consistency: 1\n overall score: 1\n"
277
  }
278
+ ],
279
+ "video": "d500506.mp4",
280
+ "prompt": "a boy paiting a beautiful landscape"
281
  },
282
  {
283
  "id": "static_d401950",
 
308
  "from": "gpt",
309
  "value": "visual quality: 1\n object consistency: 3\n dynamic degree: 1\n motion smoothness: 1\n text-to-video alignment: 1\n factual consistency: 1\n overall score: 1\n"
310
  }
311
+ ],
312
+ "video": "d401950.mp4",
313
+ "prompt": "sneaker with exclusive design worth 1 billion"
314
  },
315
  {
316
  "id": "insf_a500251",
 
341
  "from": "gpt",
342
  "value": "visual quality: 1\n object consistency: 1\n dynamic degree: 3\n motion smoothness: 1\n text-to-video alignment: 1\n factual consistency: 1\n overall score: 1\n"
343
  }
344
+ ],
345
+ "video": "a500251.mp4",
346
+ "prompt": ":sci fi war in the moon"
347
  },
348
  {
349
  "id": "insf_a400480",
 
374
  "from": "gpt",
375
  "value": "visual quality: 1\n object consistency: 1\n dynamic degree: 3\n motion smoothness: 1\n text-to-video alignment: 1\n factual consistency: 1\n overall score: 1\n"
376
  }
377
+ ],
378
+ "video": "a400480.mp4",
379
+ "prompt": "for a dog accessories brand a welcome image: brand name: hot doggies"
380
  },
381
  {
382
  "id": "insf_a500010",
 
407
  "from": "gpt",
408
  "value": "visual quality: 1\n object consistency: 1\n dynamic degree: 3\n motion smoothness: 1\n text-to-video alignment: 1\n factual consistency: 1\n overall score: 1\n"
409
  }
410
+ ],
411
+ "video": "a500010.mp4",
412
+ "prompt": "a druid in the forest cinematic"
413
  },
414
  {
415
  "id": "lab_3005033",
 
440
  "from": "gpt",
441
  "value": "visual quality: 3\n object consistency: 2\n dynamic degree: 3\n motion smoothness: 2\n text-to-video alignment: 2\n factual consistency: 3\n overall score: 2\n"
442
  }
443
+ ],
444
+ "video": "3005033.mp4",
445
+ "prompt": "a robot vacuum traveling through southeast asian countries"
446
  },
447
  {
448
  "id": "lab_7004180",
 
465
  "from": "gpt",
466
  "value": "visual quality: 3\n object consistency: 3\n dynamic degree: 3\n motion smoothness: 3\n text-to-video alignment: 3\n factual consistency: 3\n overall score: 3\n"
467
  }
468
+ ],
469
+ "video": "7004180.mp4",
470
+ "prompt": "jiaxuan is the most beautiful \uff0celegant\uff0ccharming girl in the world. billions of boys fell in love with her"
471
  },
472
  {
473
  "id": "lab_1006309",
 
498
  "from": "gpt",
499
  "value": "visual quality: 3\n object consistency: 2\n dynamic degree: 3\n motion smoothness: 2\n text-to-video alignment: 3\n factual consistency: 2\n overall score: 3\n"
500
  }
501
+ ],
502
+ "video": "1006309.mp4",
503
+ "prompt": "scary halloween skeletons are having a conversation with each other"
504
  }
505
  ]
examples/test.ipynb CHANGED
@@ -105,7 +105,7 @@
105
  },
106
  {
107
  "cell_type": "code",
108
- "execution_count": 3,
109
  "metadata": {},
110
  "outputs": [
111
  {
@@ -113,15 +113,35 @@
113
  "output_type": "stream",
114
  "text": [
115
  "dog rolls over and falls off couch\n",
116
- "Created video for r003679\n"
117
- ]
118
- },
119
- {
120
- "name": "stderr",
121
- "output_type": "stream",
122
- "text": [
123
- "[ERROR:0@119.424] global cap_ffmpeg_impl.hpp:3130 open Could not find encoder for codec_id=27, error: Encoder not found\n",
124
- "[ERROR:0@119.424] global cap_ffmpeg_impl.hpp:3208 open VIDEOIO/FFMPEG: Failed to initialize VideoWriter\n"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
125
  ]
126
  }
127
  ],
@@ -148,8 +168,8 @@
148
  " item['prompt'] = prompt.strip()\n",
149
  " \n",
150
  " # Initialize the video writer\n",
151
- " # fourcc = cv2.VideoWriter_fourcc(*'H264') # Codec for .mp4 file|\n",
152
- " fourcc = cv2.VideoWriter_fourcc(*'avc3') # Codec for .mp4 file|\n",
153
  " frame_rate = 8\n",
154
  " video = cv2.VideoWriter(output_file, fourcc, frame_rate, (width, height))\n",
155
  "\n",
@@ -163,13 +183,13 @@
163
  "\n",
164
  " # Release the video writer\n",
165
  " video.release()\n",
166
- " break\n",
167
  " "
168
  ]
169
  },
170
  {
171
  "cell_type": "code",
172
- "execution_count": 26,
173
  "metadata": {},
174
  "outputs": [],
175
  "source": [
 
105
  },
106
  {
107
  "cell_type": "code",
108
+ "execution_count": 6,
109
  "metadata": {},
110
  "outputs": [
111
  {
 
113
  "output_type": "stream",
114
  "text": [
115
  "dog rolls over and falls off couch\n",
116
+ "Created video for r003679\n",
117
+ "A young man is standing in front of a glacier with mountains in the background.\n",
118
+ "Created video for r100916\n",
119
+ "a man wearing a striped blanket over his backpack runs behind two other men.\n",
120
+ "Created video for r004061\n",
121
+ "After a few years, Ghulam Muhammad became the owner of his business \n",
122
+ "Created video for b404675\n",
123
+ "view down to the path in the field, moving forward, night, dark. \n",
124
+ "Created video for b402727\n",
125
+ "Old Philippino man, close up, subtle smile, teats of joy, in old wood room \n",
126
+ "Created video for b304986\n",
127
+ "write y in the garden with flowers \n",
128
+ "Created video for d500937\n",
129
+ "a boy paiting a beautiful landscape \n",
130
+ "Created video for d500506\n",
131
+ "sneaker with exclusive design worth 1 billion \n",
132
+ "Created video for d401950\n",
133
+ ":sci fi war in the moon \n",
134
+ "Created video for a500251\n",
135
+ "for a dog accessories brand a welcome image: brand name: hot doggies \n",
136
+ "Created video for a400480\n",
137
+ "a druid in the forest cinematic \n",
138
+ "Created video for a500010\n",
139
+ "a robot vacuum traveling through southeast asian countries \n",
140
+ "Created video for 3005033\n",
141
+ "jiaxuan is the most beautiful ,elegant,charming girl in the world. billions of boys fell in love with her \n",
142
+ "Created video for 7004180\n",
143
+ "scary halloween skeletons are having a conversation with each other \n",
144
+ "Created video for 1006309\n"
145
  ]
146
  }
147
  ],
 
168
  " item['prompt'] = prompt.strip()\n",
169
  " \n",
170
  " # Initialize the video writer\n",
171
+ " fourcc = cv2.VideoWriter_fourcc(*'mp4v') # Codec for .mp4 file|\n",
172
+ " # fourcc = cv2.VideoWriter_fourcc(*'avc3') # Codec for .mp4 file|\n",
173
  " frame_rate = 8\n",
174
  " video = cv2.VideoWriter(output_file, fourcc, frame_rate, (width, height))\n",
175
  "\n",
 
183
  "\n",
184
  " # Release the video writer\n",
185
  " video.release()\n",
186
+ " # break\n",
187
  " "
188
  ]
189
  },
190
  {
191
  "cell_type": "code",
192
+ "execution_count": 7,
193
  "metadata": {},
194
  "outputs": [],
195
  "source": [