weathon
commited on
Commit
·
46edcef
1
Parent(s):
71ff04e
- app.py +18 -15
- image_neg_prompt.ipynb +325 -0
- sample_prompts.json +1153 -0
- src/__pycache__/sd3_pipeline.cpython-310.pyc +0 -0
- src/sd3_pipeline.py +18 -13
- wheel.webp +0 -0
app.py
CHANGED
|
@@ -15,7 +15,6 @@ from diffusers import AutoencoderKLWan
|
|
| 15 |
from vsfwan.pipeline import WanPipeline
|
| 16 |
from vsfwan.processor import WanAttnProcessor2_0
|
| 17 |
from diffusers import WanVACEPipeline
|
| 18 |
-
from diffusers.utils import export_to_video
|
| 19 |
import uuid
|
| 20 |
|
| 21 |
import sys
|
|
@@ -73,7 +72,7 @@ pipe = pipe.to("cuda")
|
|
| 73 |
nag_pipe = nag_pipe.to("cuda")
|
| 74 |
import os
|
| 75 |
@spaces.GPU
|
| 76 |
-
def
|
| 77 |
global pipe, nag_pipe
|
| 78 |
lambda total: progress.tqdm(range(total))
|
| 79 |
|
|
@@ -142,12 +141,12 @@ def load_sample():
|
|
| 142 |
with open("anti_aesthetics.json", "r") as f:
|
| 143 |
anti_aesthetics_prompts = json.load(f)
|
| 144 |
|
| 145 |
-
def load_anti_aesthetics_sample():
|
| 146 |
sample = np.random.choice(anti_aesthetics_prompts)
|
| 147 |
return sample['prompt'], sample['missing_element']
|
| 148 |
|
| 149 |
nouns = ["cat", "dog", "car", "bicycle", "tree", "house", "computer", "phone", "book", "chair", "table", "lamp", "flower", "mountain", "river", "ocean", "cloud", "bird", "fish", "butterfly", "sun", "moon", "planet", "robot", "alien", "castle", "dragon", "unicorn", "fairy", "wizard"]
|
| 150 |
-
methods = ["painting", "sketch", "drawing", "watercolor", "oil painting", "low poly art", "color pencil drawing", "crayon art"]
|
| 151 |
def load_abstract_prompt():
|
| 152 |
noun = np.random.choice(nouns)
|
| 153 |
method = np.random.choice(methods)
|
|
@@ -182,12 +181,12 @@ from PIL import Image
|
|
| 182 |
|
| 183 |
|
| 184 |
with gr.Blocks(title="Value Sign Flip SD3.5 Demo") as demo:
|
| 185 |
-
gr.Markdown("# Value Sign Flip SD3.5 Demo \n\n This demo is based on SD3.5-L-Turbo model and uses Value Sign Flip technique to generate
|
| 186 |
gr.Markdown("To help with further research, all generations will be logged anonymously. If you do not wish to participate, please do not use the demo. Please keep prompts safe for work and non-offensive. ")
|
| 187 |
gr.Markdown("This project is supported by [Lambda Cloud](https://lambda.ai/), [Weathon Software](https://weasoft.com), and [Canada Foundation for Innovation](https://www.innovation.ca/). ")
|
| 188 |
-
gr.Markdown("Using negative prompts for abstract arts and anti-aesthetics arts are also one of our contributions and can be applied to either VSF or NAG techniques. Details in papaer appendix N or [this paper](https://www.researchgate.net/publication/397595102)")
|
| 189 |
|
| 190 |
-
# gr.Markdown("# Value Sign Flip Wan 2.1 Demo \n\n This demo is based on Wan 2.1 T2V model and uses Value Sign Flip technique to generate
|
| 191 |
|
| 192 |
with gr.Row(min_height=200):
|
| 193 |
pos = gr.Textbox(label="Positive Prompt", value="A polished bicycle frame leans against a weathered brick wall under soft morning light.", lines=5)
|
|
@@ -195,7 +194,7 @@ with gr.Blocks(title="Value Sign Flip SD3.5 Demo") as demo:
|
|
| 195 |
|
| 196 |
# rephase = gr.Button("Rephrase Prompt")
|
| 197 |
with gr.Row():
|
| 198 |
-
sample = gr.Button("Load A Sample Prompt")
|
| 199 |
sample.click(fn=load_sample, inputs=[], outputs=[pos, neg])
|
| 200 |
anti_aesthetic_sample = gr.Button("Load An Anti-Aesthetic Sample Prompt (Could Cause Unease)")
|
| 201 |
anti_aesthetic_sample.click(fn=load_anti_aesthetics_sample, inputs=[], outputs=[pos, neg])
|
|
@@ -211,20 +210,24 @@ with gr.Blocks(title="Value Sign Flip SD3.5 Demo") as demo:
|
|
| 211 |
seed = gr.Number(label="Seed", value=0, precision=0)
|
| 212 |
randomize_seed = gr.Button("Randomize Seed")
|
| 213 |
randomize_seed.click(fn=lambda : np.random.randint(0, 1000000), inputs=[], outputs=[seed])
|
| 214 |
-
set_strong_vsf = gr.Button("
|
| 215 |
set_strong_vsf.click(fn=lambda : (3.8, 0.2), inputs=[], outputs=[guidance, bias])
|
| 216 |
-
|
| 217 |
-
|
|
|
|
|
|
|
| 218 |
|
| 219 |
with gr.Row():
|
| 220 |
gr.Markdown("## NAG Generation Parameters")
|
| 221 |
nag_guidance = gr.Slider(1, 12, step=0.1, label="Guidance Scale", value=5)
|
| 222 |
nag_alpha = gr.Slider(0.1, 1.0, step=0.01, label="Alpha", value=0.25)
|
| 223 |
nag_tau = gr.Slider(1, 10, step=0.01, label="Tau", value=3.0)
|
| 224 |
-
nag_step = gr.Slider(4, 15, step=1, label="Step", value=
|
| 225 |
-
set_strong = gr.Button("
|
| 226 |
set_strong.click(fn=lambda : (11, 0.5, 5.0), inputs=[], outputs=[nag_guidance, nag_alpha, nag_tau])
|
| 227 |
-
|
|
|
|
|
|
|
| 228 |
set_mild.click(fn=lambda : (4, 0.125, 2.5), inputs=[], outputs=[nag_guidance, nag_alpha, nag_tau])
|
| 229 |
|
| 230 |
|
|
@@ -235,7 +238,7 @@ with gr.Blocks(title="Value Sign Flip SD3.5 Demo") as demo:
|
|
| 235 |
normal_out = gr.Image(label="Without Negative Guidance")
|
| 236 |
|
| 237 |
btn = gr.Button("Generate")
|
| 238 |
-
btn.click(fn=
|
| 239 |
|
| 240 |
|
| 241 |
demo.launch(share=True)
|
|
|
|
| 15 |
from vsfwan.pipeline import WanPipeline
|
| 16 |
from vsfwan.processor import WanAttnProcessor2_0
|
| 17 |
from diffusers import WanVACEPipeline
|
|
|
|
| 18 |
import uuid
|
| 19 |
|
| 20 |
import sys
|
|
|
|
| 72 |
nag_pipe = nag_pipe.to("cuda")
|
| 73 |
import os
|
| 74 |
@spaces.GPU
|
| 75 |
+
def generate_image(positive_prompt, negative_prompt, guidance_scale, bias, step, seed, nag_guidance, nag_alpha, nag_tau, nag_step, progress=gr.Progress(track_tqdm=False)):
|
| 76 |
global pipe, nag_pipe
|
| 77 |
lambda total: progress.tqdm(range(total))
|
| 78 |
|
|
|
|
| 141 |
with open("anti_aesthetics.json", "r") as f:
|
| 142 |
anti_aesthetics_prompts = json.load(f)
|
| 143 |
|
| 144 |
+
def load_anti_aesthetics_sample():
|
| 145 |
sample = np.random.choice(anti_aesthetics_prompts)
|
| 146 |
return sample['prompt'], sample['missing_element']
|
| 147 |
|
| 148 |
nouns = ["cat", "dog", "car", "bicycle", "tree", "house", "computer", "phone", "book", "chair", "table", "lamp", "flower", "mountain", "river", "ocean", "cloud", "bird", "fish", "butterfly", "sun", "moon", "planet", "robot", "alien", "castle", "dragon", "unicorn", "fairy", "wizard"]
|
| 149 |
+
methods = ["painting", "sketch", "drawing", "watercolor", "oil painting", "low poly art", "color pencil drawing", "crayon art", "ink wash", "paper cutout", "line art"]
|
| 150 |
def load_abstract_prompt():
|
| 151 |
noun = np.random.choice(nouns)
|
| 152 |
method = np.random.choice(methods)
|
|
|
|
| 181 |
|
| 182 |
|
| 183 |
with gr.Blocks(title="Value Sign Flip SD3.5 Demo") as demo:
|
| 184 |
+
gr.Markdown("# Value Sign Flip SD3.5 Demo \n\n This demo is based on SD3.5-L-Turbo model and uses Value Sign Flip technique to generate images with different guidance scales and biases. More on [GitHub](https://github.com/weathon/VSF/blob/main/wan.md) and [ArXiv](https://arxiv.org/pdf/2508.10931) \n\nPositive prompt should be at least 1 sentence long or the results will be weird. ")
|
| 185 |
gr.Markdown("To help with further research, all generations will be logged anonymously. If you do not wish to participate, please do not use the demo. Please keep prompts safe for work and non-offensive. ")
|
| 186 |
gr.Markdown("This project is supported by [Lambda Cloud](https://lambda.ai/), [Weathon Software](https://weasoft.com), and [Canada Foundation for Innovation](https://www.innovation.ca/). ")
|
| 187 |
+
gr.Markdown("Using negative prompts for abstract arts and anti-aesthetics arts are also one of our contributions and can be applied to either VSF or NAG techniques. Details in papaer appendix N or [this paper](https://www.researchgate.net/publication/397595102).")
|
| 188 |
|
| 189 |
+
# gr.Markdown("# Value Sign Flip Wan 2.1 Demo \n\n This demo is based on Wan 2.1 T2V model and uses Value Sign Flip technique to generate images with different guidance scales and biases. More on [GitHub](https://github.com/weathon/VSF/blob/main/wan.md)\n\nPositive prompt should be at least 2 sentence long or the results will be weird.")
|
| 190 |
|
| 191 |
with gr.Row(min_height=200):
|
| 192 |
pos = gr.Textbox(label="Positive Prompt", value="A polished bicycle frame leans against a weathered brick wall under soft morning light.", lines=5)
|
|
|
|
| 194 |
|
| 195 |
# rephase = gr.Button("Rephrase Prompt")
|
| 196 |
with gr.Row():
|
| 197 |
+
sample = gr.Button("Load A Sample Prompt (Uncurated)")
|
| 198 |
sample.click(fn=load_sample, inputs=[], outputs=[pos, neg])
|
| 199 |
anti_aesthetic_sample = gr.Button("Load An Anti-Aesthetic Sample Prompt (Could Cause Unease)")
|
| 200 |
anti_aesthetic_sample.click(fn=load_anti_aesthetics_sample, inputs=[], outputs=[pos, neg])
|
|
|
|
| 210 |
seed = gr.Number(label="Seed", value=0, precision=0)
|
| 211 |
randomize_seed = gr.Button("Randomize Seed")
|
| 212 |
randomize_seed.click(fn=lambda : np.random.randint(0, 1000000), inputs=[], outputs=[seed])
|
| 213 |
+
set_strong_vsf = gr.Button("Strong")
|
| 214 |
set_strong_vsf.click(fn=lambda : (3.8, 0.2), inputs=[], outputs=[guidance, bias])
|
| 215 |
+
set_normal_vsf = gr.Button("Normal")
|
| 216 |
+
set_normal_vsf.click(fn=lambda : (3.3, 0.2), inputs=[], outputs=[guidance, bias])
|
| 217 |
+
set_mild_vsf = gr.Button("Quality")
|
| 218 |
+
set_mild_vsf.click(fn=lambda : (2.5, 0.2), inputs=[], outputs=[guidance, bias])
|
| 219 |
|
| 220 |
with gr.Row():
|
| 221 |
gr.Markdown("## NAG Generation Parameters")
|
| 222 |
nag_guidance = gr.Slider(1, 12, step=0.1, label="Guidance Scale", value=5)
|
| 223 |
nag_alpha = gr.Slider(0.1, 1.0, step=0.01, label="Alpha", value=0.25)
|
| 224 |
nag_tau = gr.Slider(1, 10, step=0.01, label="Tau", value=3.0)
|
| 225 |
+
nag_step = gr.Slider(4, 15, step=1, label="Step", value=6)
|
| 226 |
+
set_strong = gr.Button("Strong")
|
| 227 |
set_strong.click(fn=lambda : (11, 0.5, 5.0), inputs=[], outputs=[nag_guidance, nag_alpha, nag_tau])
|
| 228 |
+
set_normal = gr.Button("Normal")
|
| 229 |
+
set_normal.click(fn=lambda : (7, 0.25, 3.5), inputs=[], outputs=[nag_guidance, nag_alpha, nag_tau])
|
| 230 |
+
set_mild = gr.Button("Quality")
|
| 231 |
set_mild.click(fn=lambda : (4, 0.125, 2.5), inputs=[], outputs=[nag_guidance, nag_alpha, nag_tau])
|
| 232 |
|
| 233 |
|
|
|
|
| 238 |
normal_out = gr.Image(label="Without Negative Guidance")
|
| 239 |
|
| 240 |
btn = gr.Button("Generate")
|
| 241 |
+
btn.click(fn=generate_image, inputs=[pos, neg, guidance, bias, step, seed, nag_guidance, nag_alpha, nag_tau, nag_step], outputs=[vsf_out, nag_out, normal_out])
|
| 242 |
|
| 243 |
|
| 244 |
demo.launch(share=True)
|
image_neg_prompt.ipynb
ADDED
|
@@ -0,0 +1,325 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"cells": [
|
| 3 |
+
{
|
| 4 |
+
"cell_type": "code",
|
| 5 |
+
"execution_count": 1,
|
| 6 |
+
"id": "116eb01e",
|
| 7 |
+
"metadata": {},
|
| 8 |
+
"outputs": [
|
| 9 |
+
{
|
| 10 |
+
"data": {
|
| 11 |
+
"application/vnd.jupyter.widget-view+json": {
|
| 12 |
+
"model_id": "ac6c81923ae642dda82e7be3d8b8172c",
|
| 13 |
+
"version_major": 2,
|
| 14 |
+
"version_minor": 0
|
| 15 |
+
},
|
| 16 |
+
"text/plain": [
|
| 17 |
+
"Loading pipeline components...: 0%| | 0/9 [00:00<?, ?it/s]"
|
| 18 |
+
]
|
| 19 |
+
},
|
| 20 |
+
"metadata": {},
|
| 21 |
+
"output_type": "display_data"
|
| 22 |
+
},
|
| 23 |
+
{
|
| 24 |
+
"data": {
|
| 25 |
+
"application/vnd.jupyter.widget-view+json": {
|
| 26 |
+
"model_id": "ad5c1247f56746ea842c366a5a81eaf7",
|
| 27 |
+
"version_major": 2,
|
| 28 |
+
"version_minor": 0
|
| 29 |
+
},
|
| 30 |
+
"text/plain": [
|
| 31 |
+
"Loading checkpoint shards: 0%| | 0/2 [00:00<?, ?it/s]"
|
| 32 |
+
]
|
| 33 |
+
},
|
| 34 |
+
"metadata": {},
|
| 35 |
+
"output_type": "display_data"
|
| 36 |
+
},
|
| 37 |
+
{
|
| 38 |
+
"data": {
|
| 39 |
+
"application/vnd.jupyter.widget-view+json": {
|
| 40 |
+
"model_id": "b31d22599263437fa2032cb7eef468b2",
|
| 41 |
+
"version_major": 2,
|
| 42 |
+
"version_minor": 0
|
| 43 |
+
},
|
| 44 |
+
"text/plain": [
|
| 45 |
+
"Loading checkpoint shards: 0%| | 0/2 [00:00<?, ?it/s]"
|
| 46 |
+
]
|
| 47 |
+
},
|
| 48 |
+
"metadata": {},
|
| 49 |
+
"output_type": "display_data"
|
| 50 |
+
},
|
| 51 |
+
{
|
| 52 |
+
"name": "stderr",
|
| 53 |
+
"output_type": "stream",
|
| 54 |
+
"text": [
|
| 55 |
+
"You set `add_prefix_space`. The tokenizer needs to be converted from the slow tokenizers\n"
|
| 56 |
+
]
|
| 57 |
+
}
|
| 58 |
+
],
|
| 59 |
+
"source": [
|
| 60 |
+
"import torch\n",
|
| 61 |
+
"import os\n",
|
| 62 |
+
"model_id = \"stabilityai/stable-diffusion-3.5-large-turbo\"\n",
|
| 63 |
+
"from src.sd3_pipeline import VSFStableDiffusion3Pipeline\n",
|
| 64 |
+
"pipe = VSFStableDiffusion3Pipeline.from_pretrained(\n",
|
| 65 |
+
" \"stabilityai/stable-diffusion-3.5-large-turbo\",\n",
|
| 66 |
+
" torch_dtype=torch.bfloat16,\n",
|
| 67 |
+
") "
|
| 68 |
+
]
|
| 69 |
+
},
|
| 70 |
+
{
|
| 71 |
+
"cell_type": "code",
|
| 72 |
+
"execution_count": 2,
|
| 73 |
+
"id": "e61d2537",
|
| 74 |
+
"metadata": {},
|
| 75 |
+
"outputs": [],
|
| 76 |
+
"source": [
|
| 77 |
+
"from PIL import Image\n",
|
| 78 |
+
"negative_prompt_image = Image.open(\"wheel.webp\")"
|
| 79 |
+
]
|
| 80 |
+
},
|
| 81 |
+
{
|
| 82 |
+
"cell_type": "code",
|
| 83 |
+
"execution_count": 3,
|
| 84 |
+
"id": "0dd57774",
|
| 85 |
+
"metadata": {},
|
| 86 |
+
"outputs": [],
|
| 87 |
+
"source": [
|
| 88 |
+
"import open_clip\n",
|
| 89 |
+
"\n",
|
| 90 |
+
"model, preprocess_train, preprocess_val = open_clip.create_model_and_transforms('hf-hub:laion/CLIP-ViT-g-14-laion2B-s34B-b88K')\n",
|
| 91 |
+
"tokenizer = open_clip.get_tokenizer('hf-hub:laion/CLIP-ViT-g-14-laion2B-s34B-b88K')"
|
| 92 |
+
]
|
| 93 |
+
},
|
| 94 |
+
{
|
| 95 |
+
"cell_type": "code",
|
| 96 |
+
"execution_count": 4,
|
| 97 |
+
"id": "0b8a3ccc",
|
| 98 |
+
"metadata": {},
|
| 99 |
+
"outputs": [],
|
| 100 |
+
"source": [
|
| 101 |
+
"import torch\n",
|
| 102 |
+
"import clip\n",
|
| 103 |
+
"from PIL import Image\n",
|
| 104 |
+
"\n",
|
| 105 |
+
"device = \"cuda\" if torch.cuda.is_available() else \"cpu\"\n",
|
| 106 |
+
"model_l, preprocess = clip.load(\"ViT-L/14\", device=device)"
|
| 107 |
+
]
|
| 108 |
+
},
|
| 109 |
+
{
|
| 110 |
+
"cell_type": "code",
|
| 111 |
+
"execution_count": 5,
|
| 112 |
+
"id": "c169092b",
|
| 113 |
+
"metadata": {},
|
| 114 |
+
"outputs": [],
|
| 115 |
+
"source": [
|
| 116 |
+
"model = model.to(device)\n",
|
| 117 |
+
"image = preprocess(negative_prompt_image).unsqueeze(0).to(device)\n",
|
| 118 |
+
"with torch.no_grad():\n",
|
| 119 |
+
" image_features_l = model_l.encode_image(image)\n",
|
| 120 |
+
" \n",
|
| 121 |
+
"image = preprocess_val(negative_prompt_image).unsqueeze(0).to(device)\n",
|
| 122 |
+
"with torch.no_grad():\n",
|
| 123 |
+
" image_features_g = model.encode_image(image) "
|
| 124 |
+
]
|
| 125 |
+
},
|
| 126 |
+
{
|
| 127 |
+
"cell_type": "code",
|
| 128 |
+
"execution_count": 6,
|
| 129 |
+
"id": "a4d7d1bc",
|
| 130 |
+
"metadata": {},
|
| 131 |
+
"outputs": [],
|
| 132 |
+
"source": [
|
| 133 |
+
"text_feature = pipe.encode_prompt('a wheel', 'a wheel', \"\")"
|
| 134 |
+
]
|
| 135 |
+
},
|
| 136 |
+
{
|
| 137 |
+
"cell_type": "code",
|
| 138 |
+
"execution_count": 7,
|
| 139 |
+
"id": "71778ceb",
|
| 140 |
+
"metadata": {},
|
| 141 |
+
"outputs": [
|
| 142 |
+
{
|
| 143 |
+
"data": {
|
| 144 |
+
"text/plain": [
|
| 145 |
+
"torch.Size([1, 333, 4096])"
|
| 146 |
+
]
|
| 147 |
+
},
|
| 148 |
+
"execution_count": 7,
|
| 149 |
+
"metadata": {},
|
| 150 |
+
"output_type": "execute_result"
|
| 151 |
+
}
|
| 152 |
+
],
|
| 153 |
+
"source": [
|
| 154 |
+
"text_feature[0].shape"
|
| 155 |
+
]
|
| 156 |
+
},
|
| 157 |
+
{
|
| 158 |
+
"cell_type": "code",
|
| 159 |
+
"execution_count": 8,
|
| 160 |
+
"id": "f1af1d43",
|
| 161 |
+
"metadata": {},
|
| 162 |
+
"outputs": [],
|
| 163 |
+
"source": [
|
| 164 |
+
"prompt_embed, pooled_prompt_embed = pipe._get_clip_prompt_embeds(\n",
|
| 165 |
+
" prompt=\"a wheel\",\n",
|
| 166 |
+
" clip_model_index=0,\n",
|
| 167 |
+
")\n",
|
| 168 |
+
"prompt_embed_2, pooled_prompt_embed_2 = pipe._get_clip_prompt_embeds(\n",
|
| 169 |
+
" prompt=\"a wheel\",\n",
|
| 170 |
+
" clip_model_index=1,\n",
|
| 171 |
+
")\n",
|
| 172 |
+
"clip_prompt_embeds = torch.cat([prompt_embed, prompt_embed_2], dim=-1)"
|
| 173 |
+
]
|
| 174 |
+
},
|
| 175 |
+
{
|
| 176 |
+
"cell_type": "code",
|
| 177 |
+
"execution_count": 9,
|
| 178 |
+
"id": "a2dd5734",
|
| 179 |
+
"metadata": {},
|
| 180 |
+
"outputs": [
|
| 181 |
+
{
|
| 182 |
+
"data": {
|
| 183 |
+
"text/plain": [
|
| 184 |
+
"(torch.Size([1, 77, 768]), torch.Size([1, 768]))"
|
| 185 |
+
]
|
| 186 |
+
},
|
| 187 |
+
"execution_count": 9,
|
| 188 |
+
"metadata": {},
|
| 189 |
+
"output_type": "execute_result"
|
| 190 |
+
}
|
| 191 |
+
],
|
| 192 |
+
"source": [
|
| 193 |
+
"prompt_embed.shape, image_features_l.shape"
|
| 194 |
+
]
|
| 195 |
+
},
|
| 196 |
+
{
|
| 197 |
+
"cell_type": "code",
|
| 198 |
+
"execution_count": 10,
|
| 199 |
+
"id": "deba7b67",
|
| 200 |
+
"metadata": {},
|
| 201 |
+
"outputs": [
|
| 202 |
+
{
|
| 203 |
+
"data": {
|
| 204 |
+
"text/plain": [
|
| 205 |
+
"(torch.Size([1, 77, 1280]), torch.Size([1, 1024]))"
|
| 206 |
+
]
|
| 207 |
+
},
|
| 208 |
+
"execution_count": 10,
|
| 209 |
+
"metadata": {},
|
| 210 |
+
"output_type": "execute_result"
|
| 211 |
+
}
|
| 212 |
+
],
|
| 213 |
+
"source": [
|
| 214 |
+
"prompt_embed_2.shape, image_features_g.shape"
|
| 215 |
+
]
|
| 216 |
+
},
|
| 217 |
+
{
|
| 218 |
+
"cell_type": "code",
|
| 219 |
+
"execution_count": 11,
|
| 220 |
+
"id": "19a4af36",
|
| 221 |
+
"metadata": {},
|
| 222 |
+
"outputs": [
|
| 223 |
+
{
|
| 224 |
+
"data": {
|
| 225 |
+
"text/plain": [
|
| 226 |
+
"torch.Size([1, 4096])"
|
| 227 |
+
]
|
| 228 |
+
},
|
| 229 |
+
"execution_count": 11,
|
| 230 |
+
"metadata": {},
|
| 231 |
+
"output_type": "execute_result"
|
| 232 |
+
}
|
| 233 |
+
],
|
| 234 |
+
"source": [
|
| 235 |
+
"feature = torch.cat([image_features_l], dim=1)\n",
|
| 236 |
+
"feature = torch.cat([feature, torch.zeros(1, 4096 - 768).to(device)], dim=1)\n",
|
| 237 |
+
"feature.shape "
|
| 238 |
+
]
|
| 239 |
+
},
|
| 240 |
+
{
|
| 241 |
+
"cell_type": "code",
|
| 242 |
+
"execution_count": 12,
|
| 243 |
+
"id": "5a69baa6",
|
| 244 |
+
"metadata": {},
|
| 245 |
+
"outputs": [
|
| 246 |
+
{
|
| 247 |
+
"data": {
|
| 248 |
+
"text/plain": [
|
| 249 |
+
"tensor([-0.0525], device='cuda:0', grad_fn=<SumBackward1>)"
|
| 250 |
+
]
|
| 251 |
+
},
|
| 252 |
+
"execution_count": 12,
|
| 253 |
+
"metadata": {},
|
| 254 |
+
"output_type": "execute_result"
|
| 255 |
+
}
|
| 256 |
+
],
|
| 257 |
+
"source": [
|
| 258 |
+
"torch.nn.functional.cosine_similarity(feature, text_feature[0][:,:77].mean(1).to(device)) "
|
| 259 |
+
]
|
| 260 |
+
},
|
| 261 |
+
{
|
| 262 |
+
"cell_type": "code",
|
| 263 |
+
"execution_count": 13,
|
| 264 |
+
"id": "faf28cbe",
|
| 265 |
+
"metadata": {},
|
| 266 |
+
"outputs": [
|
| 267 |
+
{
|
| 268 |
+
"data": {
|
| 269 |
+
"text/plain": [
|
| 270 |
+
"(torch.Size([1, 77, 2048]), torch.Size([1, 1792]))"
|
| 271 |
+
]
|
| 272 |
+
},
|
| 273 |
+
"execution_count": 13,
|
| 274 |
+
"metadata": {},
|
| 275 |
+
"output_type": "execute_result"
|
| 276 |
+
}
|
| 277 |
+
],
|
| 278 |
+
"source": [
|
| 279 |
+
"clip_prompt_embeds.shape, torch.cat([image_features_l, image_features_g], dim=1).shape "
|
| 280 |
+
]
|
| 281 |
+
},
|
| 282 |
+
{
|
| 283 |
+
"cell_type": "code",
|
| 284 |
+
"execution_count": 14,
|
| 285 |
+
"id": "44e2cd9c",
|
| 286 |
+
"metadata": {},
|
| 287 |
+
"outputs": [
|
| 288 |
+
{
|
| 289 |
+
"data": {
|
| 290 |
+
"text/plain": [
|
| 291 |
+
"tensor([0.0223], device='cuda:0', grad_fn=<SumBackward1>)"
|
| 292 |
+
]
|
| 293 |
+
},
|
| 294 |
+
"execution_count": 14,
|
| 295 |
+
"metadata": {},
|
| 296 |
+
"output_type": "execute_result"
|
| 297 |
+
}
|
| 298 |
+
],
|
| 299 |
+
"source": [
|
| 300 |
+
"torch.nn.functional.cosine_similarity(feature.mean(1), text_feature[0][:,:77].mean(1).to(device)) "
|
| 301 |
+
]
|
| 302 |
+
}
|
| 303 |
+
],
|
| 304 |
+
"metadata": {
|
| 305 |
+
"kernelspec": {
|
| 306 |
+
"display_name": "neg",
|
| 307 |
+
"language": "python",
|
| 308 |
+
"name": "python3"
|
| 309 |
+
},
|
| 310 |
+
"language_info": {
|
| 311 |
+
"codemirror_mode": {
|
| 312 |
+
"name": "ipython",
|
| 313 |
+
"version": 3
|
| 314 |
+
},
|
| 315 |
+
"file_extension": ".py",
|
| 316 |
+
"mimetype": "text/x-python",
|
| 317 |
+
"name": "python",
|
| 318 |
+
"nbconvert_exporter": "python",
|
| 319 |
+
"pygments_lexer": "ipython3",
|
| 320 |
+
"version": "3.10.17"
|
| 321 |
+
}
|
| 322 |
+
},
|
| 323 |
+
"nbformat": 4,
|
| 324 |
+
"nbformat_minor": 5
|
| 325 |
+
}
|
sample_prompts.json
CHANGED
|
@@ -17,12 +17,36 @@
|
|
| 17 |
"question_1": "Is the image showing a cat, could be either with or without whiskers",
|
| 18 |
"question_2": "Are the whiskers missing"
|
| 19 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 20 |
{
|
| 21 |
"prompt": "A sleek silver train resting at the station platform, its undercarriage hovering just above the rails.",
|
| 22 |
"missing_element": "wheels",
|
| 23 |
"question_1": "Is the image showing a train, could be either with or without wheels",
|
| 24 |
"question_2": "Are the wheels missing"
|
| 25 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 26 |
{
|
| 27 |
"prompt": "An elegant fountain pen lies uncapped on parchment, its polished grip narrowing to a hollow opening.",
|
| 28 |
"missing_element": "nib",
|
|
@@ -46,5 +70,1134 @@
|
|
| 46 |
"missing_element": "bulb",
|
| 47 |
"question_1": "Is the image showing a desk lamp, could be either with or without a bulb",
|
| 48 |
"question_2": "Is the bulb missing"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 49 |
}
|
| 50 |
]
|
|
|
|
| 17 |
"question_1": "Is the image showing a cat, could be either with or without whiskers",
|
| 18 |
"question_2": "Are the whiskers missing"
|
| 19 |
},
|
| 20 |
+
{
|
| 21 |
+
"prompt": "An ancient stone castle atop a grassy hill, the entrance arch yawning openly into the sunlit courtyard.",
|
| 22 |
+
"missing_element": "gates",
|
| 23 |
+
"question_1": "Is the image showing a castle, could be either with or without gates",
|
| 24 |
+
"question_2": "Are the gates missing"
|
| 25 |
+
},
|
| 26 |
+
{
|
| 27 |
+
"prompt": "A brightly colored hot-air balloon inflated at dawn, long tethers dangling toward the misty field below.",
|
| 28 |
+
"missing_element": "basket",
|
| 29 |
+
"question_1": "Is the image showing a hot-air balloon, could be either with or without a basket",
|
| 30 |
+
"question_2": "Is the basket missing"
|
| 31 |
+
},
|
| 32 |
+
{
|
| 33 |
+
"prompt": "A soft-skinned turtle crawling along a sandy shoreline, its limbs and head fully exposed under morning light.",
|
| 34 |
+
"missing_element": "shell",
|
| 35 |
+
"question_1": "Is the image showing a turtle, could be either with or without a shell",
|
| 36 |
+
"question_2": "Is the shell missing"
|
| 37 |
+
},
|
| 38 |
{
|
| 39 |
"prompt": "A sleek silver train resting at the station platform, its undercarriage hovering just above the rails.",
|
| 40 |
"missing_element": "wheels",
|
| 41 |
"question_1": "Is the image showing a train, could be either with or without wheels",
|
| 42 |
"question_2": "Are the wheels missing"
|
| 43 |
},
|
| 44 |
+
{
|
| 45 |
+
"prompt": "A pair of modern black-framed eyeglasses placed on a glossy table, the frames entirely empty inside.",
|
| 46 |
+
"missing_element": "lenses",
|
| 47 |
+
"question_1": "Is the image showing eyeglasses, could be either with or without lenses",
|
| 48 |
+
"question_2": "Are the lenses missing"
|
| 49 |
+
},
|
| 50 |
{
|
| 51 |
"prompt": "An elegant fountain pen lies uncapped on parchment, its polished grip narrowing to a hollow opening.",
|
| 52 |
"missing_element": "nib",
|
|
|
|
| 70 |
"missing_element": "bulb",
|
| 71 |
"question_1": "Is the image showing a desk lamp, could be either with or without a bulb",
|
| 72 |
"question_2": "Is the bulb missing"
|
| 73 |
+
},
|
| 74 |
+
{
|
| 75 |
+
"prompt": "A sunburst electric guitar body hanging on a studio wall, pickups and bridge gleaming under soft spotlights.",
|
| 76 |
+
"missing_element": "neck",
|
| 77 |
+
"question_1": "Is the image showing an electric guitar, could be either with or without a neck",
|
| 78 |
+
"question_2": "Is the neck missing"
|
| 79 |
+
},
|
| 80 |
+
{
|
| 81 |
+
"prompt": "A streamlined silver fish gliding through crystal water, its sleek profile unbroken by any protrusions.",
|
| 82 |
+
"missing_element": "fins",
|
| 83 |
+
"question_1": "Is the image showing a fish, could be either with or without fins",
|
| 84 |
+
"question_2": "Are the fins missing"
|
| 85 |
+
},
|
| 86 |
+
{
|
| 87 |
+
"prompt": "A quaint brick cottage sitting in a meadow, wooden rafters exposed beneath a clear blue sky.",
|
| 88 |
+
"missing_element": "roof",
|
| 89 |
+
"question_1": "Is the image showing a cottage, could be either with or without a roof",
|
| 90 |
+
"question_2": "Is the roof missing"
|
| 91 |
+
},
|
| 92 |
+
{
|
| 93 |
+
"prompt": "A vintage convertible displayed at a classic-car show, the dashboard stretching unobstructed toward the shining hood.",
|
| 94 |
+
"missing_element": "windshield",
|
| 95 |
+
"question_1": "Is the image showing a car, could be either with or without a windshield",
|
| 96 |
+
"question_2": "Is the windshield missing"
|
| 97 |
+
},
|
| 98 |
+
{
|
| 99 |
+
"prompt": "A mechanical keyboard lit by soft rainbow LEDs, a noticeable gap divides the bottom row of keys.",
|
| 100 |
+
"missing_element": "spacebar",
|
| 101 |
+
"question_1": "Is the image showing a keyboard, could be either with or without a spacebar",
|
| 102 |
+
"question_2": "Is the spacebar missing"
|
| 103 |
+
},
|
| 104 |
+
{
|
| 105 |
+
"prompt": "A wide-eyed owl perched on a branch under moonlight, smooth skin visible across its rounded body.",
|
| 106 |
+
"missing_element": "feathers",
|
| 107 |
+
"question_1": "Is the image showing an owl, could be either with or without feathers",
|
| 108 |
+
"question_2": "Are the feathers missing"
|
| 109 |
+
},
|
| 110 |
+
{
|
| 111 |
+
"prompt": "A leather-bound hardcover lies open on a wooden desk, the interior revealing only a hollow rectangular frame.",
|
| 112 |
+
"missing_element": "pages",
|
| 113 |
+
"question_1": "Is the image showing a book, could be either with or without pages",
|
| 114 |
+
"question_2": "Are the pages missing"
|
| 115 |
+
},
|
| 116 |
+
{
|
| 117 |
+
"prompt": "A tall white lighthouse stands on a stormy cliff, its lantern room dark and empty against gathering clouds.",
|
| 118 |
+
"missing_element": "lamp",
|
| 119 |
+
"question_1": "Is the image showing a lighthouse, could be either with or without a lamp",
|
| 120 |
+
"question_2": "Is the lamp missing"
|
| 121 |
+
},
|
| 122 |
+
{
|
| 123 |
+
"prompt": "A plush armchair positioned directly on a patterned rug, its cushioned seat resting unusually low to the floor.",
|
| 124 |
+
"missing_element": "legs",
|
| 125 |
+
"question_1": "Is the image showing an armchair, could be either with or without legs",
|
| 126 |
+
"question_2": "Are the legs missing"
|
| 127 |
+
},
|
| 128 |
+
{
|
| 129 |
+
"prompt": "A proud buck stands in a forest clearing at dawn, smooth forehead catching the first warm light.",
|
| 130 |
+
"missing_element": "antlers",
|
| 131 |
+
"question_1": "Is the image showing a deer, could be either with or without antlers",
|
| 132 |
+
"question_2": "Are the antlers missing"
|
| 133 |
+
},
|
| 134 |
+
{
|
| 135 |
+
"prompt": "A pale parchment envelope lies addressed on a marble tabletop, its top edge cut straight across.",
|
| 136 |
+
"missing_element": "flap",
|
| 137 |
+
"question_1": "Is the image showing an envelope, could be either with or without a flap",
|
| 138 |
+
"question_2": "Is the flap missing"
|
| 139 |
+
},
|
| 140 |
+
{
|
| 141 |
+
"prompt": "A minimalist wall clock hangs above the mantel, slender hands sweeping across a pristine white face.",
|
| 142 |
+
"missing_element": "numbers",
|
| 143 |
+
"question_1": "Is the image showing a wall clock, could be either with or without numbers",
|
| 144 |
+
"question_2": "Are the numbers missing"
|
| 145 |
+
},
|
| 146 |
+
{
|
| 147 |
+
"prompt": "A bulky white space suit floats in a training pool, the collar ring open to the surrounding water.",
|
| 148 |
+
"missing_element": "helmet",
|
| 149 |
+
"question_1": "Is the image showing a space suit, could be either with or without a helmet",
|
| 150 |
+
"question_2": "Is the helmet missing"
|
| 151 |
+
},
|
| 152 |
+
{
|
| 153 |
+
"prompt": "A towering windmill rises in a golden wheat field, only a solitary hub turning lazily in the breeze.",
|
| 154 |
+
"missing_element": "blades",
|
| 155 |
+
"question_1": "Is the image showing a windmill, could be either with or without blades",
|
| 156 |
+
"question_2": "Are the blades missing"
|
| 157 |
+
},
|
| 158 |
+
{
|
| 159 |
+
"prompt": "A tall oak stands in midsummer sunlight, countless bare branches weaving intricate patterns against the sky.",
|
| 160 |
+
"missing_element": "leaves",
|
| 161 |
+
"question_1": "Is the image showing a tree, could be either with or without leaves",
|
| 162 |
+
"question_2": "Are the leaves missing"
|
| 163 |
+
},
|
| 164 |
+
{
|
| 165 |
+
"prompt": "A yellow school bus is parked outside the depot, rectangular openings along its side reveal rows of seats.",
|
| 166 |
+
"missing_element": "doors",
|
| 167 |
+
"question_1": "Is the image showing a bus, could be either with or without doors",
|
| 168 |
+
"question_2": "Are the doors missing"
|
| 169 |
+
},
|
| 170 |
+
{
|
| 171 |
+
"prompt": "A sleek silver laptop sits open on a desk, the lid framing an empty bezel through which the wall is visible.",
|
| 172 |
+
"missing_element": "screen",
|
| 173 |
+
"question_1": "Is the image showing a laptop, could be either with or without a screen",
|
| 174 |
+
"question_2": "Is the screen missing"
|
| 175 |
+
},
|
| 176 |
+
{
|
| 177 |
+
"prompt": "A polished brass trumpet lies on deep red velvet, the leadpipe tapering to an unfinished rim.",
|
| 178 |
+
"missing_element": "mouthpiece",
|
| 179 |
+
"question_1": "Is the image showing a trumpet, could be either with or without a mouthpiece",
|
| 180 |
+
"question_2": "Is the mouthpiece missing"
|
| 181 |
+
},
|
| 182 |
+
{
|
| 183 |
+
"prompt": "A humanoid robot stands upright in a bright laboratory, cables protruding gently from a smooth collar plate.",
|
| 184 |
+
"missing_element": "head",
|
| 185 |
+
"question_1": "Is the image showing a robot, could be either with or without a head",
|
| 186 |
+
"question_2": "Is the head missing"
|
| 187 |
+
},
|
| 188 |
+
{
|
| 189 |
+
"prompt": "A tall pillar of ivory wax sits untouched on a silver tray, its top surface perfectly unbroken.",
|
| 190 |
+
"missing_element": "wick",
|
| 191 |
+
"question_1": "Is the image showing a candle, could be either with or without a wick",
|
| 192 |
+
"question_2": "Is the wick missing"
|
| 193 |
+
},
|
| 194 |
+
{
|
| 195 |
+
"prompt": "A freshly baked pizza crust layered with rich tomato sauce and scattered basil rests on a stone board.",
|
| 196 |
+
"missing_element": "cheese",
|
| 197 |
+
"question_1": "Is the image showing a pizza, could be either with or without cheese",
|
| 198 |
+
"question_2": "Is the cheese missing"
|
| 199 |
+
},
|
| 200 |
+
{
|
| 201 |
+
"prompt": "A black DSLR body stands on a wooden shelf, the circular mount exposing delicate inner mechanics to view.",
|
| 202 |
+
"missing_element": "lens",
|
| 203 |
+
"question_1": "Is the image showing a DSLR camera, could be either with or without a lens",
|
| 204 |
+
"question_2": "Is the lens missing"
|
| 205 |
+
},
|
| 206 |
+
{
|
| 207 |
+
"prompt": "A grand piano dominates an empty concert hall, a smooth ebony board stretching across the front.",
|
| 208 |
+
"missing_element": "keys",
|
| 209 |
+
"question_1": "Is the image showing a piano, could be either with or without keys",
|
| 210 |
+
"question_2": "Are the keys missing"
|
| 211 |
+
},
|
| 212 |
+
{
|
| 213 |
+
"prompt": "A slender wooden paintbrush rests beside a palette, its metal ferrule clasping only empty air.",
|
| 214 |
+
"missing_element": "bristles",
|
| 215 |
+
"question_1": "Is the image showing a paintbrush, could be either with or without bristles",
|
| 216 |
+
"question_2": "Are the bristles missing"
|
| 217 |
+
},
|
| 218 |
+
{
|
| 219 |
+
"prompt": "A sleek digital watch face sits on a granite countertop, lugs jutting out where something should secure it.",
|
| 220 |
+
"missing_element": "strap",
|
| 221 |
+
"question_1": "Is the image showing a watch, could be either with or without a strap",
|
| 222 |
+
"question_2": "Is the strap missing"
|
| 223 |
+
},
|
| 224 |
+
{
|
| 225 |
+
"prompt": "A young man opens his mouth for a dentist, the inner cavity appearing hollow and still.",
|
| 226 |
+
"missing_element": "tongue",
|
| 227 |
+
"question_1": "Is the image showing a mouth, could be either with or without a tongue",
|
| 228 |
+
"question_2": "Is the tongue missing"
|
| 229 |
+
},
|
| 230 |
+
{
|
| 231 |
+
"prompt": "A matte black motorcycle is parked under neon streetlights, cables stretching forward over the front wheel into empty air.",
|
| 232 |
+
"missing_element": "handlebars",
|
| 233 |
+
"question_1": "Is the image showing a motorcycle, could be either with or without handlebars",
|
| 234 |
+
"question_2": "Are the handlebars missing"
|
| 235 |
+
},
|
| 236 |
+
{
|
| 237 |
+
"prompt": "A retro wooden television cabinet stands in a living room, the front frame revealing intricate wiring and glowing tubes.",
|
| 238 |
+
"missing_element": "screen",
|
| 239 |
+
"question_1": "Is the image showing a television, could be either with or without a screen",
|
| 240 |
+
"question_2": "Is the screen missing"
|
| 241 |
+
},
|
| 242 |
+
{
|
| 243 |
+
"prompt": "A shaggy mountain goat balances on a rocky ledge, its forehead smooth under the midday sun.",
|
| 244 |
+
"missing_element": "horns",
|
| 245 |
+
"question_1": "Is the image showing a goat, could be either with or without horns",
|
| 246 |
+
"question_2": "Are the horns missing"
|
| 247 |
+
},
|
| 248 |
+
{
|
| 249 |
+
"prompt": "A bright red sneaker rests on a locker-room bench, eyelets neatly aligned along its padded tongue.",
|
| 250 |
+
"missing_element": "laces",
|
| 251 |
+
"question_1": "Is the image showing a sneaker, could be either with or without laces",
|
| 252 |
+
"question_2": "Are the laces missing"
|
| 253 |
+
},
|
| 254 |
+
{
|
| 255 |
+
"prompt": "A small green frog sits quietly on a lily pad, smooth domes occupying the front of its head.",
|
| 256 |
+
"missing_element": "eyes",
|
| 257 |
+
"question_1": "Is the image showing a frog, could be either with or without eyes",
|
| 258 |
+
"question_2": "Are the eyes missing"
|
| 259 |
+
},
|
| 260 |
+
{
|
| 261 |
+
"prompt": "A ceramic mug painted with blue floral patterns stands upright on a saucer, its circular shape perfectly continuous.",
|
| 262 |
+
"missing_element": "handle",
|
| 263 |
+
"question_1": "Is the image showing a mug, could be either with or without a handle",
|
| 264 |
+
"question_2": "Is the handle missing"
|
| 265 |
+
},
|
| 266 |
+
{
|
| 267 |
+
"prompt": "A curved golden saxophone rests on a music stand, rows of uncovered tone holes gleaming in the spotlight.",
|
| 268 |
+
"missing_element": "keys",
|
| 269 |
+
"question_1": "Is the image showing a saxophone, could be either with or without keys",
|
| 270 |
+
"question_2": "Are the keys missing"
|
| 271 |
+
},
|
| 272 |
+
{
|
| 273 |
+
"prompt": "A wooden skateboard deck balances across two bricks on the pavement, metal trucks pressed directly to the ground.",
|
| 274 |
+
"missing_element": "wheels",
|
| 275 |
+
"question_1": "Is the image showing a skateboard, could be either with or without wheels",
|
| 276 |
+
"question_2": "Are the wheels missing"
|
| 277 |
+
},
|
| 278 |
+
{
|
| 279 |
+
"prompt": "A felt fedora crown sits on a hat stand, its sides descending straight without any outward extension.",
|
| 280 |
+
"missing_element": "brim",
|
| 281 |
+
"question_1": "Is the image showing a fedora, could be either with or without a brim",
|
| 282 |
+
"question_2": "Is the brim missing"
|
| 283 |
+
},
|
| 284 |
+
{
|
| 285 |
+
"prompt": "A futuristic motorcycle helmet rests on a workbench, the front opening exposing cushioned interior padding.",
|
| 286 |
+
"missing_element": "visor",
|
| 287 |
+
"question_1": "Is the image showing a motorcycle helmet, could be either with or without a visor",
|
| 288 |
+
"question_2": "Is the visor missing"
|
| 289 |
+
},
|
| 290 |
+
{
|
| 291 |
+
"prompt": "An ornate wooden bedframe stands against a midnight-blue wall, evenly spaced slats visible across its width.",
|
| 292 |
+
"missing_element": "mattress",
|
| 293 |
+
"question_1": "Is the image showing a bedframe, could be either with or without a mattress",
|
| 294 |
+
"question_2": "Is the mattress missing"
|
| 295 |
+
},
|
| 296 |
+
{
|
| 297 |
+
"prompt": "A tall brick clock tower dominates the town square, a blank circular recess marking the place where time should be displayed.",
|
| 298 |
+
"missing_element": "clock face",
|
| 299 |
+
"question_1": "Is the image showing a clock tower, could be either with or without a clock face",
|
| 300 |
+
"question_2": "Is the clock face missing"
|
| 301 |
+
},
|
| 302 |
+
{
|
| 303 |
+
"prompt": "An antique pocket watch lies open on velvet, its enamel face gleaming beneath ornate Roman numerals, polished gears exposed.",
|
| 304 |
+
"missing_element": "hands",
|
| 305 |
+
"question_1": "Is the image showing a pocket watch, could be either with or without hands",
|
| 306 |
+
"question_2": "Are the hands missing from the pocket watch"
|
| 307 |
+
},
|
| 308 |
+
{
|
| 309 |
+
"prompt": "A sleek road bicycle leans against an old stone wall, lightweight frame painted crimson and chrome cranks resting above the asphalt.",
|
| 310 |
+
"missing_element": "pedals",
|
| 311 |
+
"question_1": "Is the image showing a bicycle, could be either with or without pedals",
|
| 312 |
+
"question_2": "Are the pedals missing from the bicycle"
|
| 313 |
+
},
|
| 314 |
+
{
|
| 315 |
+
"prompt": "A painted portrait of a young woman hangs in a quiet gallery, delicate features rendered in soft oils, the upper facial planes left as smooth, empty forms.",
|
| 316 |
+
"missing_element": "eyes",
|
| 317 |
+
"question_1": "Is the image showing a portrait of a woman, could be either with or without eyes",
|
| 318 |
+
"question_2": "Are the eyes missing from the portrait of the woman"
|
| 319 |
+
},
|
| 320 |
+
{
|
| 321 |
+
"prompt": "A concert grand piano stands under stage lights, lid propped high so the audience can see straight into a cavity that reveals felt-covered dampers but no striking mechanism.",
|
| 322 |
+
"missing_element": "hammers",
|
| 323 |
+
"question_1": "Is the image showing a grand piano, could be either with or without hammers",
|
| 324 |
+
"question_2": "Are the hammers missing from the grand piano"
|
| 325 |
+
},
|
| 326 |
+
{
|
| 327 |
+
"prompt": "An old wooden clipper drifts across a calm sea, towering masts stretching skyward with only rigging ropes swaying in the breeze.",
|
| 328 |
+
"missing_element": "sails",
|
| 329 |
+
"question_1": "Is the image showing a sailing ship, could be either with or without sails",
|
| 330 |
+
"question_2": "Are the sails missing from the sailing ship"
|
| 331 |
+
},
|
| 332 |
+
{
|
| 333 |
+
"prompt": "A mature oak tree rises against a bright summer sky, wide branches spreading like a skeletal silhouette despite the season.",
|
| 334 |
+
"missing_element": "leaves",
|
| 335 |
+
"question_1": "Is the image showing an oak tree, could be either with or without leaves",
|
| 336 |
+
"question_2": "Are the leaves missing from the oak tree"
|
| 337 |
+
},
|
| 338 |
+
{
|
| 339 |
+
"prompt": "A snug stone cottage nestles at the forest’s edge, ivy climbing across shuttered windows while a blank wall greets visiting guests.",
|
| 340 |
+
"missing_element": "door",
|
| 341 |
+
"question_1": "Is the image showing a cottage, could be either with or without a door",
|
| 342 |
+
"question_2": "Is the door missing from the cottage"
|
| 343 |
+
},
|
| 344 |
+
{
|
| 345 |
+
"prompt": "A streamlined passenger jet rests on the apron, engines mounted beneath a smooth fuselage that runs directly into a tall tail fin.",
|
| 346 |
+
"missing_element": "wings",
|
| 347 |
+
"question_1": "Is the image showing a passenger jet, could be either with or without wings",
|
| 348 |
+
"question_2": "Are the wings missing from the passenger jet"
|
| 349 |
+
},
|
| 350 |
+
{
|
| 351 |
+
"prompt": "A minimalist wristwatch sits on a leather tray, monochrome dial perfectly smooth except for two thin hands orbiting a blank circumference.",
|
| 352 |
+
"missing_element": "numbers",
|
| 353 |
+
"question_1": "Is the image showing a wristwatch, could be either with or without numbers",
|
| 354 |
+
"question_2": "Are the numbers missing from the wristwatch"
|
| 355 |
+
},
|
| 356 |
+
{
|
| 357 |
+
"prompt": "A freshly baked pizza rests on a wooden board, golden crust encircling a vibrant pool of red sauce topped by scattered basil leaves.",
|
| 358 |
+
"missing_element": "cheese",
|
| 359 |
+
"question_1": "Is the image showing a pizza, could be either with or without cheese",
|
| 360 |
+
"question_2": "Is the cheese missing from the pizza"
|
| 361 |
+
},
|
| 362 |
+
{
|
| 363 |
+
"prompt": "A bustling city intersection stretches beneath midday sun, tall signal heads looming overhead with dark glass panels that never change hue.",
|
| 364 |
+
"missing_element": "lights",
|
| 365 |
+
"question_1": "Is the image showing traffic signals, could be either with or without lights",
|
| 366 |
+
"question_2": "Are the lights missing from the traffic signals"
|
| 367 |
+
},
|
| 368 |
+
{
|
| 369 |
+
"prompt": "A colorful skateboard lies abandoned on smooth concrete, grip-taped deck and polished trucks casting neat shadows on the ground.",
|
| 370 |
+
"missing_element": "wheels",
|
| 371 |
+
"question_1": "Is the image showing a skateboard, could be either with or without wheels",
|
| 372 |
+
"question_2": "Are the wheels missing from the skateboard"
|
| 373 |
+
},
|
| 374 |
+
{
|
| 375 |
+
"prompt": "A chessboard is arranged atop a velvet tablecloth, thirty-two squares waiting while one side’s carved army stands alone in battle formation.",
|
| 376 |
+
"missing_element": "black pieces",
|
| 377 |
+
"question_1": "Is the image showing a chessboard, could be either with or without black pieces",
|
| 378 |
+
"question_2": "Are the black pieces missing from the chessboard"
|
| 379 |
+
},
|
| 380 |
+
{
|
| 381 |
+
"prompt": "A cherry-red sports car gleams under showroom lamps, sculpted alloys rotating freely behind open spokes that reveal only empty air.",
|
| 382 |
+
"missing_element": "brakes",
|
| 383 |
+
"question_1": "Is the image showing a sports car, could be either with or without brakes",
|
| 384 |
+
"question_2": "Are the brakes missing from the sports car"
|
| 385 |
+
},
|
| 386 |
+
{
|
| 387 |
+
"prompt": "An open hardcover book rests on a wooden desk, cream-colored pages stretching wide with nothing printed between the margins.",
|
| 388 |
+
"missing_element": "text",
|
| 389 |
+
"question_1": "Is the image showing a book, could be either with or without text",
|
| 390 |
+
"question_2": "Is the text missing from the book"
|
| 391 |
+
},
|
| 392 |
+
{
|
| 393 |
+
"prompt": "A modern desktop tower with tempered-glass side panel displays RGB-lit components, yet no spinning blades disturb the still interior.",
|
| 394 |
+
"missing_element": "fans",
|
| 395 |
+
"question_1": "Is the image showing a computer tower, could be either with or without fans",
|
| 396 |
+
"question_2": "Are the fans missing from the computer tower"
|
| 397 |
+
},
|
| 398 |
+
{
|
| 399 |
+
"prompt": "A straw-stuffed scarecrow stands in the middle of a golden field, flannel shirt hanging limp beside a torso supported by a single post.",
|
| 400 |
+
"missing_element": "arms",
|
| 401 |
+
"question_1": "Is the image showing a scarecrow, could be either with or without arms",
|
| 402 |
+
"question_2": "Are the arms missing from the scarecrow"
|
| 403 |
+
},
|
| 404 |
+
{
|
| 405 |
+
"prompt": "An oil painting depicts a medieval knight in shining armor, bold gaze steady while an empty leather baldric crosses his hip.",
|
| 406 |
+
"missing_element": "sword",
|
| 407 |
+
"question_1": "Is the image showing a knight, could be either with or without a sword",
|
| 408 |
+
"question_2": "Is the sword missing from the knight"
|
| 409 |
+
},
|
| 410 |
+
{
|
| 411 |
+
"prompt": "A delicate porcelain teapot sits on a bamboo tray, floral motifs curling around a rotund body that preserves a graceful spout but offers no side grip.",
|
| 412 |
+
"missing_element": "handle",
|
| 413 |
+
"question_1": "Is the image showing a teapot, could be either with or without a handle",
|
| 414 |
+
"question_2": "Is the handle missing from the teapot"
|
| 415 |
+
},
|
| 416 |
+
{
|
| 417 |
+
"prompt": "An outdoor basketball rim is mounted to a clear backboard, orange ring stark against blue sky with nothing suspended beneath it.",
|
| 418 |
+
"missing_element": "net",
|
| 419 |
+
"question_1": "Is the image showing a basketball hoop, could be either with or without a net",
|
| 420 |
+
"question_2": "Is the net missing from the basketball hoop"
|
| 421 |
+
},
|
| 422 |
+
{
|
| 423 |
+
"prompt": "A formal dining table is fully laid with silverware, porcelain plates and folded linen napkins, yet above each plate only empty space awaits a drink.",
|
| 424 |
+
"missing_element": "glasses",
|
| 425 |
+
"question_1": "Is the image showing a dining table, could be either with or without glasses",
|
| 426 |
+
"question_2": "Are the glasses missing from the dining table"
|
| 427 |
+
},
|
| 428 |
+
{
|
| 429 |
+
"prompt": "A vintage typewriter occupies an author’s desk, metal arms poised above pristine paper while twin spools sit idle and uncovered.",
|
| 430 |
+
"missing_element": "ribbon",
|
| 431 |
+
"question_1": "Is the image showing a typewriter, could be either with or without a ribbon",
|
| 432 |
+
"question_2": "Is the ribbon missing from the typewriter"
|
| 433 |
+
},
|
| 434 |
+
{
|
| 435 |
+
"prompt": "A thick winter parka hangs from a coat rack, quilted panels puffed with down, the front opening held shut only by overlapping fabric.",
|
| 436 |
+
"missing_element": "zipper",
|
| 437 |
+
"question_1": "Is the image showing a winter jacket, could be either with or without a zipper",
|
| 438 |
+
"question_2": "Is the zipper missing from the winter jacket"
|
| 439 |
+
},
|
| 440 |
+
{
|
| 441 |
+
"prompt": "A towering sunflower turns toward daylight, golden petals radiant around a smooth green disk unmarred by patterned specks.",
|
| 442 |
+
"missing_element": "seeds",
|
| 443 |
+
"question_1": "Is the image showing a sunflower, could be either with or without seeds",
|
| 444 |
+
"question_2": "Are the seeds missing from the sunflower"
|
| 445 |
+
},
|
| 446 |
+
{
|
| 447 |
+
"prompt": "A large elephant strides across the savanna, wrinkled hide dusted with red earth, its face ending abruptly below wide flapping ears.",
|
| 448 |
+
"missing_element": "trunk",
|
| 449 |
+
"question_1": "Is the image showing an elephant, could be either with or without a trunk",
|
| 450 |
+
"question_2": "Is the trunk missing from the elephant"
|
| 451 |
+
},
|
| 452 |
+
{
|
| 453 |
+
"prompt": "A painted wooden rowboat drifts on a calm lake, bench seats freshly varnished while the gunwales hold empty brass oarlocks.",
|
| 454 |
+
"missing_element": "oars",
|
| 455 |
+
"question_1": "Is the image showing a rowboat, could be either with or without oars",
|
| 456 |
+
"question_2": "Are the oars missing from the rowboat"
|
| 457 |
+
},
|
| 458 |
+
{
|
| 459 |
+
"prompt": "A snowman stands proudly in a suburban yard, three gleaming spheres stacked neatly, scarf and hat in place yet nothing dots the torso.",
|
| 460 |
+
"missing_element": "buttons",
|
| 461 |
+
"question_1": "Is the image showing a snowman, could be either with or without buttons",
|
| 462 |
+
"question_2": "Are the buttons missing from the snowman"
|
| 463 |
+
},
|
| 464 |
+
{
|
| 465 |
+
"prompt": "A lacquered fountain pen rests atop a journal, transparent reservoir completely clear above a gleaming gold nib.",
|
| 466 |
+
"missing_element": "ink",
|
| 467 |
+
"question_1": "Is the image showing a fountain pen, could be either with or without ink",
|
| 468 |
+
"question_2": "Is the ink missing from the fountain pen"
|
| 469 |
+
},
|
| 470 |
+
{
|
| 471 |
+
"prompt": "A wooden paintbrush handle with a shiny ferrule lies beside a palette, its tip ending in a hollow metal cylinder.",
|
| 472 |
+
"missing_element": "bristles",
|
| 473 |
+
"question_1": "Is the image showing a paintbrush, could be either with or without bristles",
|
| 474 |
+
"question_2": "Are the bristles missing from the paintbrush"
|
| 475 |
+
},
|
| 476 |
+
{
|
| 477 |
+
"prompt": "A pair of oval eyeglass frames sits on folded newsprint, front rims intact while nothing extends toward where ears would rest.",
|
| 478 |
+
"missing_element": "temples",
|
| 479 |
+
"question_1": "Is the image showing eyeglasses, could be either with or without temples",
|
| 480 |
+
"question_2": "Are the temples missing from the eyeglasses"
|
| 481 |
+
},
|
| 482 |
+
{
|
| 483 |
+
"prompt": "A city commuter holds an umbrella open in the rain, black canopy stretched over a central shaft without any visible spokes beneath.",
|
| 484 |
+
"missing_element": "ribs",
|
| 485 |
+
"question_1": "Is the image showing an umbrella, could be either with or without ribs",
|
| 486 |
+
"question_2": "Are the ribs missing from the umbrella"
|
| 487 |
+
},
|
| 488 |
+
{
|
| 489 |
+
"prompt": "A skeletonized wristwatch is showcased under a glass dome, gears whirring beside a sweeping second hand while the outer ring remains entirely blank.",
|
| 490 |
+
"missing_element": "hour markers",
|
| 491 |
+
"question_1": "Is the image showing a wristwatch, could be either with or without hour markers",
|
| 492 |
+
"question_2": "Are the hour markers missing from the wristwatch"
|
| 493 |
+
},
|
| 494 |
+
{
|
| 495 |
+
"prompt": "A nylon tent lies fully spread across a grassy clearing, rainfly attached and guy lines staked, yet the fabric sags flat on the ground.",
|
| 496 |
+
"missing_element": "poles",
|
| 497 |
+
"question_1": "Is the image showing a camping tent, could be either with or without poles",
|
| 498 |
+
"question_2": "Are the poles missing from the camping tent"
|
| 499 |
+
},
|
| 500 |
+
{
|
| 501 |
+
"prompt": "A wooden cuckoo clock hangs on a chalet wall, carved deer and leaves surrounding an ornate dial, but beneath the case no pine-cone ornaments dangle.",
|
| 502 |
+
"missing_element": "weights",
|
| 503 |
+
"question_1": "Is the image showing a cuckoo clock, could be either with or without weights",
|
| 504 |
+
"question_2": "Are the weights missing from the cuckoo clock"
|
| 505 |
+
},
|
| 506 |
+
{
|
| 507 |
+
"prompt": "A modern smartphone rests face-up on a table, edge-to-edge glass reflecting ceiling lights, its top bezel perfectly smooth without any tiny perforations.",
|
| 508 |
+
"missing_element": "speaker grille",
|
| 509 |
+
"question_1": "Is the image showing a smartphone, could be either with or without a speaker grille",
|
| 510 |
+
"question_2": "Is the speaker grille missing from the smartphone"
|
| 511 |
+
},
|
| 512 |
+
{
|
| 513 |
+
"prompt": "A café-style motorcycle waits beside a dusty road, chrome handlebars wide, while the round instrument cluster displays only a blank lens.",
|
| 514 |
+
"missing_element": "speedometer",
|
| 515 |
+
"question_1": "Is the image showing a motorcycle, could be either with or without a speedometer",
|
| 516 |
+
"question_2": "Is the speedometer missing from the motorcycle"
|
| 517 |
+
},
|
| 518 |
+
{
|
| 519 |
+
"prompt": "A slender violin bow lies on crimson velvet, ebony frog adjusted with a silver screw, yet the wooden stick spans unbroken from tip to grip.",
|
| 520 |
+
"missing_element": "hair",
|
| 521 |
+
"question_1": "Is the image showing a violin bow, could be either with or without hair",
|
| 522 |
+
"question_2": "Is the hair missing from the violin bow"
|
| 523 |
+
},
|
| 524 |
+
{
|
| 525 |
+
"prompt": "A gilded birdcage swings gently from a porch hook, domed roof catching afternoon sun, though the interior offers no horizontal bar for resting.",
|
| 526 |
+
"missing_element": "perch",
|
| 527 |
+
"question_1": "Is the image showing a birdcage, could be either with or without a perch",
|
| 528 |
+
"question_2": "Is the perch missing from the birdcage"
|
| 529 |
+
},
|
| 530 |
+
{
|
| 531 |
+
"prompt": "A marble statue of a robed goddess stands among museum columns, shoulders gracefully sloping upward to an abruptly smooth surface.",
|
| 532 |
+
"missing_element": "head",
|
| 533 |
+
"question_1": "Is the image showing a statue, could be either with or without a head",
|
| 534 |
+
"question_2": "Is the head missing from the statue"
|
| 535 |
+
},
|
| 536 |
+
{
|
| 537 |
+
"prompt": "A plush teddy bear sits on a child’s bed, round eyes glinting above a stitched smile while its muzzle remains flat and unadorned.",
|
| 538 |
+
"missing_element": "nose",
|
| 539 |
+
"question_1": "Is the image showing a teddy bear, could be either with or without a nose",
|
| 540 |
+
"question_2": "Is the nose missing from the teddy bear"
|
| 541 |
+
},
|
| 542 |
+
{
|
| 543 |
+
"prompt": "A pair of canvas sneakers stands upright on a doorway mat, metal eyelets neatly aligned along an empty tongue.",
|
| 544 |
+
"missing_element": "laces",
|
| 545 |
+
"question_1": "Is the image showing sneakers, could be either with or without laces",
|
| 546 |
+
"question_2": "Are the laces missing from the sneakers"
|
| 547 |
+
},
|
| 548 |
+
{
|
| 549 |
+
"prompt": "An open refrigerator hums quietly in a small kitchen, interior shelves glassy and clean, yet the door interior shows only blank white plastic.",
|
| 550 |
+
"missing_element": "door shelves",
|
| 551 |
+
"question_1": "Is the image showing a refrigerator, could be either with or without door shelves",
|
| 552 |
+
"question_2": "Are the door shelves missing from the refrigerator"
|
| 553 |
+
},
|
| 554 |
+
{
|
| 555 |
+
"prompt": "Friends sit around a circular stone ring in the dark, glowing embers faintly illuminate their faces while no tongues of light dance upward.",
|
| 556 |
+
"missing_element": "flames",
|
| 557 |
+
"question_1": "Is the image showing a campfire, could be either with or without flames",
|
| 558 |
+
"question_2": "Are the flames missing from the campfire"
|
| 559 |
+
},
|
| 560 |
+
{
|
| 561 |
+
"prompt": "A stainless drinking fountain stands beside a park path, polished button visible, but the curved nozzle yields only silence.",
|
| 562 |
+
"missing_element": "water",
|
| 563 |
+
"question_1": "Is the image showing a drinking fountain, could be either with or without water",
|
| 564 |
+
"question_2": "Is the water missing from the drinking fountain"
|
| 565 |
+
},
|
| 566 |
+
{
|
| 567 |
+
"prompt": "A vintage revolver lies on a green felt display pad, barrel polished and cylinder open, yet beneath the trigger there is nothing to encircle a finger.",
|
| 568 |
+
"missing_element": "trigger guard",
|
| 569 |
+
"question_1": "Is the image showing a revolver, could be either with or without a trigger guard",
|
| 570 |
+
"question_2": "Is the trigger guard missing from the revolver"
|
| 571 |
+
},
|
| 572 |
+
{
|
| 573 |
+
"prompt": "An elaborately drawn compass rose decorates an ancient map, lavish scrollwork filling the cardinal directions but no pointed indicator marks the prime heading.",
|
| 574 |
+
"missing_element": "north arrow",
|
| 575 |
+
"question_1": "Is the image showing a compass rose, could be either with or without a north arrow",
|
| 576 |
+
"question_2": "Is the north arrow missing from the compass rose"
|
| 577 |
+
},
|
| 578 |
+
{
|
| 579 |
+
"prompt": "Futuristic skyscrapers rise under neon twilight, reflective facades forming uninterrupted planes of glowing metal and glass.",
|
| 580 |
+
"missing_element": "windows",
|
| 581 |
+
"question_1": "Is the image showing skyscrapers, could be either with or without windows",
|
| 582 |
+
"question_2": "Are the windows missing from the skyscrapers"
|
| 583 |
+
},
|
| 584 |
+
{
|
| 585 |
+
"prompt": "An orchestra conductor stands on a podium, tuxedo crisp and arms moving fluidly while his raised hand remains empty.",
|
| 586 |
+
"missing_element": "baton",
|
| 587 |
+
"question_1": "Is the image showing a conductor, could be either with or without a baton",
|
| 588 |
+
"question_2": "Is the baton missing from the conductor"
|
| 589 |
+
},
|
| 590 |
+
{
|
| 591 |
+
"prompt": "A soccer field lies freshly mowed, two white uprights planted firmly at the end line, leaving an open rectangle above.",
|
| 592 |
+
"missing_element": "crossbar",
|
| 593 |
+
"question_1": "Is the image showing a soccer goal, could be either with or without a crossbar",
|
| 594 |
+
"question_2": "Is the crossbar missing from the soccer goal"
|
| 595 |
+
},
|
| 596 |
+
{
|
| 597 |
+
"prompt": "A laboratory microscope sits on a steel workbench, coarse and fine focus knobs present, yet the tubular body ends without any glass elements inside.",
|
| 598 |
+
"missing_element": "lenses",
|
| 599 |
+
"question_1": "Is the image showing a microscope, could be either with or without lenses",
|
| 600 |
+
"question_2": "Are the lenses missing from the microscope"
|
| 601 |
+
},
|
| 602 |
+
|
| 603 |
+
{
|
| 604 |
+
"prompt": "A sun-faded acoustic guitar leans against a rustic brick wall, its polished wooden body catching soft afternoon light while slender tuning pegs glint quietly.",
|
| 605 |
+
"missing_element": "strings",
|
| 606 |
+
"question_1": "Is the image showing a guitar , could be either with or without strings",
|
| 607 |
+
"question_2": "Are the strings absent"
|
| 608 |
+
},
|
| 609 |
+
{
|
| 610 |
+
"prompt": "A weathered bicycle stands upright beside a canal, chrome handlebars reflecting the sky and empty forks hovering just above cobblestones.",
|
| 611 |
+
"missing_element": "wheels",
|
| 612 |
+
"question_1": "Is the image showing a bicycle , could be either with or without wheels",
|
| 613 |
+
"question_2": "Are the wheels missing"
|
| 614 |
+
},
|
| 615 |
+
{
|
| 616 |
+
"prompt": "A barn owl perches on an old fence post under moonlight, heart-shaped face smooth and featureless save for delicate feathers.",
|
| 617 |
+
"missing_element": "eyes",
|
| 618 |
+
"question_1": "Is the image showing an owl , could be either with or without eyes",
|
| 619 |
+
"question_2": "Are the eyes absent"
|
| 620 |
+
},
|
| 621 |
+
{
|
| 622 |
+
"prompt": "A sleek silver sedan sits parked under a streetlamp, glossy panels reflecting neon signs yet the side frames reveal wide, open gaps.",
|
| 623 |
+
"missing_element": "doors",
|
| 624 |
+
"question_1": "Is the image showing a car , could be either with or without doors",
|
| 625 |
+
"question_2": "Are the doors missing"
|
| 626 |
+
},
|
| 627 |
+
{
|
| 628 |
+
"prompt": "A towering stone keep rises above a misty valley, its walls unbroken and austere beneath streaks of lichen.",
|
| 629 |
+
"missing_element": "windows",
|
| 630 |
+
"question_1": "Is the image showing a castle , could be either with or without windows",
|
| 631 |
+
"question_2": "Are the windows absent"
|
| 632 |
+
},
|
| 633 |
+
{
|
| 634 |
+
"prompt": "An antique brass pocket watch rests open on a velvet cushion, the ornate hands circling an entirely blank ring.",
|
| 635 |
+
"missing_element": "numbers",
|
| 636 |
+
"question_1": "Is the image showing a pocket watch , could be either with or without numbers",
|
| 637 |
+
"question_2": "Are the numbers missing"
|
| 638 |
+
},
|
| 639 |
+
{
|
| 640 |
+
"prompt": "A colossal amusement wheel stands against a fiery sunset, its skeletal steel rim arching over a silent fairground.",
|
| 641 |
+
"missing_element": "cabins",
|
| 642 |
+
"question_1": "Is the image showing a Ferris wheel , could be either with or without cabins",
|
| 643 |
+
"question_2": "Are the cabins missing"
|
| 644 |
+
},
|
| 645 |
+
{
|
| 646 |
+
"prompt": "A ginger cat naps on a windowsill, its fur puddled around a small, rounded hindquarters.",
|
| 647 |
+
"missing_element": "tail",
|
| 648 |
+
"question_1": "Is the image showing a cat , could be either with or without a tail",
|
| 649 |
+
"question_2": "Is the tail absent"
|
| 650 |
+
},
|
| 651 |
+
{
|
| 652 |
+
"prompt": "A massive African elephant stares calmly across the savanna, large ears fanning out over ivory tusks.",
|
| 653 |
+
"missing_element": "trunk",
|
| 654 |
+
"question_1": "Is the image showing an elephant , could be either with or without a trunk",
|
| 655 |
+
"question_2": "Is the trunk missing"
|
| 656 |
+
},
|
| 657 |
+
{
|
| 658 |
+
"prompt": "A solitary oak trunk rises from a mist-covered meadow, bark gnarled and roots sprawling into damp earth.",
|
| 659 |
+
"missing_element": "branches",
|
| 660 |
+
"question_1": "Is the image showing a tree , could be either with or without branches",
|
| 661 |
+
"question_2": "Are the branches absent"
|
| 662 |
+
},
|
| 663 |
+
{
|
| 664 |
+
"prompt": "A simple wooden chair stands in an empty gallery, its flat seat and upright backrest connected directly to the floor by a single low block.",
|
| 665 |
+
"missing_element": "legs",
|
| 666 |
+
"question_1": "Is the image showing a chair , could be either with or without legs",
|
| 667 |
+
"question_2": "Are the legs missing"
|
| 668 |
+
},
|
| 669 |
+
{
|
| 670 |
+
"prompt": "A tall sailing ship rests in calm harbor waters, dark masts piercing the sky but the rigging hangs slack against naked beams.",
|
| 671 |
+
"missing_element": "sails",
|
| 672 |
+
"question_1": "Is the image showing a ship , could be either with or without sails",
|
| 673 |
+
"question_2": "Are the sails missing"
|
| 674 |
+
},
|
| 675 |
+
{
|
| 676 |
+
"prompt": "A painter's oval palette lies atop a studio table, smeared thumb hole and dried bristles surrounding a pristine, untouched surface.",
|
| 677 |
+
"missing_element": "paint",
|
| 678 |
+
"question_1": "Is the image showing a painter's palette , could be either with or without paint",
|
| 679 |
+
"question_2": "Is the paint absent"
|
| 680 |
+
},
|
| 681 |
+
{
|
| 682 |
+
"prompt": "An old black typewriter sits on a mahogany desk, its metal arms raised above empty square holes where fingers would normally dance.",
|
| 683 |
+
"missing_element": "keys",
|
| 684 |
+
"question_1": "Is the image showing a typewriter , could be either with or without keys",
|
| 685 |
+
"question_2": "Are the keys missing"
|
| 686 |
+
},
|
| 687 |
+
{
|
| 688 |
+
"prompt": "A porcelain coffee mug releases gentle steam on a kitchen counter, its cylindrical body smooth and symmetrical but entirely unadorned on one side.",
|
| 689 |
+
"missing_element": "handle",
|
| 690 |
+
"question_1": "Is the image showing a mug , could be either with or without a handle",
|
| 691 |
+
"question_2": "Is the handle missing"
|
| 692 |
+
},
|
| 693 |
+
{
|
| 694 |
+
"prompt": "An ornate katana rests upon a lacquered stand, its lacquered scabbard parted to reveal only the hilt extending into empty space.",
|
| 695 |
+
"missing_element": "blade",
|
| 696 |
+
"question_1": "Is the image showing a katana , could be either with or without a blade",
|
| 697 |
+
"question_2": "Is the blade missing"
|
| 698 |
+
},
|
| 699 |
+
{
|
| 700 |
+
"prompt": "A modern smartphone lies on a marble tabletop, slim metallic frame enclosing an unbroken dark void.",
|
| 701 |
+
"missing_element": "screen",
|
| 702 |
+
"question_1": "Is the image showing a smartphone , could be either with or without a screen",
|
| 703 |
+
"question_2": "Is the screen missing"
|
| 704 |
+
},
|
| 705 |
+
{
|
| 706 |
+
"prompt": "A commercial jet is parked on the tarmac at dawn, cylindrical fuselage gleaming under floodlights as engines sit exposed beside stubby supports.",
|
| 707 |
+
"missing_element": "wings",
|
| 708 |
+
"question_1": "Is the image showing an airplane , could be either with or without wings",
|
| 709 |
+
"question_2": "Are the wings missing"
|
| 710 |
+
},
|
| 711 |
+
{
|
| 712 |
+
"prompt": "A weather-beaten cowboy hat hangs from a wall peg, tall crown stretching upward with an unusually vertical silhouette.",
|
| 713 |
+
"missing_element": "brim",
|
| 714 |
+
"question_1": "Is the image showing a cowboy hat , could be either with or without a brim",
|
| 715 |
+
"question_2": "Is the brim missing"
|
| 716 |
+
},
|
| 717 |
+
{
|
| 718 |
+
"prompt": "A plump green tree frog rests on a lily pad, smooth body pressed flat like a leaf against the water surface.",
|
| 719 |
+
"missing_element": "legs",
|
| 720 |
+
"question_1": "Is the image showing a frog , could be either with or without legs",
|
| 721 |
+
"question_2": "Are the legs missing"
|
| 722 |
+
},
|
| 723 |
+
{
|
| 724 |
+
"prompt": "A ceramic teapot sits atop a wooden tray, its round belly painted with blue florals and the lid slightly ajar.",
|
| 725 |
+
"missing_element": "spout",
|
| 726 |
+
"question_1": "Is the image showing a teapot , could be either with or without a spout",
|
| 727 |
+
"question_2": "Is the spout missing"
|
| 728 |
+
},
|
| 729 |
+
{
|
| 730 |
+
"prompt": "A snowman stands in a quiet yard at twilight, two round layers stacked neatly, scarf fluttering in a gentle breeze.",
|
| 731 |
+
"missing_element": "head",
|
| 732 |
+
"question_1": "Is the image showing a snowman , could be either with or without a head",
|
| 733 |
+
"question_2": "Is the head missing"
|
| 734 |
+
},
|
| 735 |
+
{
|
| 736 |
+
"prompt": "A silver laptop sits open on a conference table, glowing indicator lights framing a broad, vacant interior cavity.",
|
| 737 |
+
"missing_element": "keyboard",
|
| 738 |
+
"question_1": "Is the image showing a laptop , could be either with or without a keyboard",
|
| 739 |
+
"question_2": "Is the keyboard missing"
|
| 740 |
+
},
|
| 741 |
+
{
|
| 742 |
+
"prompt": "A pair of slender wire-rim glasses rests on a paperback novel, the arced frame shining under a reading lamp while circular openings remain completely clear.",
|
| 743 |
+
"missing_element": "lenses",
|
| 744 |
+
"question_1": "Is the image showing glasses , could be either with or without lenses",
|
| 745 |
+
"question_2": "Are the lenses absent"
|
| 746 |
+
},
|
| 747 |
+
{
|
| 748 |
+
"prompt": "A railroad stretches across golden prairie grass, evenly spaced wooden ties receding toward the horizon without any gleaming metal above.",
|
| 749 |
+
"missing_element": "rails",
|
| 750 |
+
"question_1": "Is the image showing railroad tracks , could be either with or without rails",
|
| 751 |
+
"question_2": "Are the rails missing"
|
| 752 |
+
},
|
| 753 |
+
{
|
| 754 |
+
"prompt": "A vintage streetlamp stands at the corner of a cobblestone alley, glass panes encircling a dark hollow space.",
|
| 755 |
+
"missing_element": "bulb",
|
| 756 |
+
"question_1": "Is the image showing a streetlamp , could be either with or without a bulb",
|
| 757 |
+
"question_2": "Is the bulb missing"
|
| 758 |
+
},
|
| 759 |
+
{
|
| 760 |
+
"prompt": "A children's swing hangs from an old oak branch, two sturdy ropes swaying gently in the breeze over a patch of grass.",
|
| 761 |
+
"missing_element": "seat",
|
| 762 |
+
"question_1": "Is the image showing a swing , could be either with or without a seat",
|
| 763 |
+
"question_2": "Is the seat missing"
|
| 764 |
+
},
|
| 765 |
+
{
|
| 766 |
+
"prompt": "A glossy black grand piano dominates a dim parlor, its lid propped open to reveal a smooth wooden cavity.",
|
| 767 |
+
"missing_element": "strings",
|
| 768 |
+
"question_1": "Is the image showing a piano , could be either with or without strings",
|
| 769 |
+
"question_2": "Are the strings absent"
|
| 770 |
+
},
|
| 771 |
+
{
|
| 772 |
+
"prompt": "A sturdy umbrella leans in a foyer corner, slender metal ribs fanning outward yet nothing spans between them.",
|
| 773 |
+
"missing_element": "fabric",
|
| 774 |
+
"question_1": "Is the image showing an umbrella , could be either with or without fabric",
|
| 775 |
+
"question_2": "Is the fabric missing"
|
| 776 |
+
},
|
| 777 |
+
{
|
| 778 |
+
"prompt": "A high-top sneaker rests on a locker-room bench, white leather panels forming a hollow shell that casts a faint shadow on the wooden slats.",
|
| 779 |
+
"missing_element": "sole",
|
| 780 |
+
"question_1": "Is the image showing a sneaker , could be either with or without a sole",
|
| 781 |
+
"question_2": "Is the sole missing"
|
| 782 |
+
},
|
| 783 |
+
{
|
| 784 |
+
"prompt": "A glossy red fire hydrant stands on a sidewalk, round body capped with nuts yet featuring only a smooth facade on every side.",
|
| 785 |
+
"missing_element": "outlets",
|
| 786 |
+
"question_1": "Is the image showing a fire hydrant , could be either with or without outlets",
|
| 787 |
+
"question_2": "Are the outlets missing"
|
| 788 |
+
},
|
| 789 |
+
{
|
| 790 |
+
"prompt": "A ripe banana sits on a cutting board, gentle curves glowing yellow without a telltale frilled topping.",
|
| 791 |
+
"missing_element": "stem",
|
| 792 |
+
"question_1": "Is the image showing a banana , could be either with or without a stem",
|
| 793 |
+
"question_2": "Is the stem missing"
|
| 794 |
+
},
|
| 795 |
+
{
|
| 796 |
+
"prompt": "A wall clock hangs above a classroom door, a silent disc whose reflective surface catches fluorescent lights but marks no moments.",
|
| 797 |
+
"missing_element": "hands",
|
| 798 |
+
"question_1": "Is the image showing a wall clock , could be either with or without hands",
|
| 799 |
+
"question_2": "Are the hands missing"
|
| 800 |
+
},
|
| 801 |
+
{
|
| 802 |
+
"prompt": "A majestic peacock struts across the palace courtyard, vibrant blues covering a slender body that ends abruptly behind.",
|
| 803 |
+
"missing_element": "tail feathers",
|
| 804 |
+
"question_1": "Is the image showing a peacock , could be either with or without tail feathers",
|
| 805 |
+
"question_2": "Are the tail feathers missing"
|
| 806 |
+
},
|
| 807 |
+
{
|
| 808 |
+
"prompt": "A shopping cart waits in an empty parking lot, metal basket intact atop a rigid axle pressed flat against asphalt.",
|
| 809 |
+
"missing_element": "wheels",
|
| 810 |
+
"question_1": "Is the image showing a shopping cart , could be either with or without wheels",
|
| 811 |
+
"question_2": "Are the wheels missing"
|
| 812 |
+
},
|
| 813 |
+
{
|
| 814 |
+
"prompt": "A classic sailing compass sits atop a nautical map, polished brass ring circling a plain mirrored circle.",
|
| 815 |
+
"missing_element": "needle",
|
| 816 |
+
"question_1": "Is the image showing a compass , could be either with or without a needle",
|
| 817 |
+
"question_2": "Is the needle missing"
|
| 818 |
+
},
|
| 819 |
+
{
|
| 820 |
+
"prompt": "A glossy violin rests on a velvet cloth, graceful curves gleaming beneath studio lights while the ebony fingerboard stretches over a hollow arch.",
|
| 821 |
+
"missing_element": "bridge",
|
| 822 |
+
"question_1": "Is the image showing a violin , could be either with or without a bridge",
|
| 823 |
+
"question_2": "Is the bridge missing"
|
| 824 |
+
},
|
| 825 |
+
{
|
| 826 |
+
"prompt": "A sleek motorcycle is displayed on a showroom pedestal, chrome handlebars gleaming above a suspended frame.",
|
| 827 |
+
"missing_element": "engine",
|
| 828 |
+
"question_1": "Is the image showing a motorcycle , could be either with or without an engine",
|
| 829 |
+
"question_2": "Is the engine missing"
|
| 830 |
+
},
|
| 831 |
+
{
|
| 832 |
+
"prompt": "A minimalist wristwatch lies on a marble vanity, thin leather strap wrapped around a circular case whose interior is pure white.",
|
| 833 |
+
"missing_element": "hands",
|
| 834 |
+
"question_1": "Is the image showing a wristwatch , could be either with or without hands",
|
| 835 |
+
"question_2": "Are the hands missing"
|
| 836 |
+
},
|
| 837 |
+
{
|
| 838 |
+
"prompt": "A passenger bus is parked at a coastal terminal, its length painted turquoise and silver, side panels stretching seamlessly from front to back.",
|
| 839 |
+
"missing_element": "windows",
|
| 840 |
+
"question_1": "Is the image showing a bus , could be either with or without windows",
|
| 841 |
+
"question_2": "Are the windows missing"
|
| 842 |
+
},
|
| 843 |
+
{
|
| 844 |
+
"prompt": "A pink flamingo stands among reeds in shallow water, slender neck curved gracefully but the silhouette seems oddly compact behind.",
|
| 845 |
+
"missing_element": "wings",
|
| 846 |
+
"question_1": "Is the image showing a flamingo , could be either with or without wings",
|
| 847 |
+
"question_2": "Are the wings missing"
|
| 848 |
+
},
|
| 849 |
+
{
|
| 850 |
+
"prompt": "A library shelf features an antique volume with a gilded spine, heavy cover creaking open to reveal a vacant hollow.",
|
| 851 |
+
"missing_element": "pages",
|
| 852 |
+
"question_1": "Is the image showing a book , could be either with or without pages",
|
| 853 |
+
"question_2": "Are the pages missing"
|
| 854 |
+
},
|
| 855 |
+
{
|
| 856 |
+
"prompt": "An armored knight statue stands in a museum alcove, gleaming breastplate reflecting spotlights while the gauntlets clasp nothing.",
|
| 857 |
+
"missing_element": "sword",
|
| 858 |
+
"question_1": "Is the image showing a knight statue , could be either with or without a sword",
|
| 859 |
+
"question_2": "Is the sword missing"
|
| 860 |
+
},
|
| 861 |
+
{
|
| 862 |
+
"prompt": "A sparkling diamond ring rests atop a burgundy velvet cushion, golden band curving smoothly around an empty prong setting.",
|
| 863 |
+
"missing_element": "gemstone",
|
| 864 |
+
"question_1": "Is the image showing a ring , could be either with or without a gemstone",
|
| 865 |
+
"question_2": "Is the gemstone missing"
|
| 866 |
+
},
|
| 867 |
+
{
|
| 868 |
+
"prompt": "A modern windmill rises over sunflower fields, tall white tower supporting a still, empty hub against the blue sky.",
|
| 869 |
+
"missing_element": "blades",
|
| 870 |
+
"question_1": "Is the image showing a windmill , could be either with or without blades",
|
| 871 |
+
"question_2": "Are the blades missing"
|
| 872 |
+
},
|
| 873 |
+
{
|
| 874 |
+
"prompt": "A sleek black skateboard rests on a concrete ramp, smooth underside reflecting sunlight as metal axles stand alone.",
|
| 875 |
+
"missing_element": "wheels",
|
| 876 |
+
"question_1": "Is the image showing a skateboard , could be either with or without wheels",
|
| 877 |
+
"question_2": "Are the wheels missing"
|
| 878 |
+
},
|
| 879 |
+
{
|
| 880 |
+
"prompt": "A small tortoise crawls across a sandy dune, wrinkled skin folding over a rounded back that shows only soft texture.",
|
| 881 |
+
"missing_element": "shell",
|
| 882 |
+
"question_1": "Is the image showing a tortoise , could be either with or without a shell",
|
| 883 |
+
"question_2": "Is the shell missing"
|
| 884 |
+
},
|
| 885 |
+
{
|
| 886 |
+
"prompt": "A camera sits on a tripod overlooking city lights, metallic body facing forward yet revealing a hollow circle where one would normally see glass.",
|
| 887 |
+
"missing_element": "lens",
|
| 888 |
+
"question_1": "Is the image showing a camera , could be either with or without a lens",
|
| 889 |
+
"question_2": "Is the lens missing"
|
| 890 |
+
},
|
| 891 |
+
{
|
| 892 |
+
"prompt": "A spacious greenhouse stands at the edge of a botanical garden, metal arches forming a broad vault that encloses only dusty air.",
|
| 893 |
+
"missing_element": "glass panels",
|
| 894 |
+
"question_1": "Is the image showing a greenhouse , could be either with or without glass panels",
|
| 895 |
+
"question_2": "Are the glass panels missing"
|
| 896 |
+
},
|
| 897 |
+
{
|
| 898 |
+
"prompt": "A firefighter's helmet rests on a polished bench, bright red dome shining under overhead lights without its typical curved protector at the front.",
|
| 899 |
+
"missing_element": "visor",
|
| 900 |
+
"question_1": "Is the image showing a firefighter's helmet , could be either with or without a visor",
|
| 901 |
+
"question_2": "Is the visor missing"
|
| 902 |
+
},
|
| 903 |
+
{
|
| 904 |
+
"prompt": "A vintage bicycle leans against a brick wall, its crimson frame chipped and speckled with rust under soft afternoon light.",
|
| 905 |
+
"missing_element": "wheels",
|
| 906 |
+
"question_1": "Is there a bicycle , could be either with or without wheels in the image",
|
| 907 |
+
"question_2": "Are the wheels missing"
|
| 908 |
+
},
|
| 909 |
+
{
|
| 910 |
+
"prompt": "An antique wristwatch rests on a velvet cushion, golden casing finely engraved and gleaming beneath museum spotlights.",
|
| 911 |
+
"missing_element": "hands",
|
| 912 |
+
"question_1": "Is there a wristwatch , could be either with or without hands in the image",
|
| 913 |
+
"question_2": "Are the hands missing"
|
| 914 |
+
},
|
| 915 |
+
{
|
| 916 |
+
"prompt": "A porcelain teapot sits upon a lace tablecloth, cobalt floral motifs swirling across its rounded body.",
|
| 917 |
+
"missing_element": "spout",
|
| 918 |
+
"question_1": "Is there a teapot , could be either with or without a spout in the image",
|
| 919 |
+
"question_2": "Is the spout missing"
|
| 920 |
+
},
|
| 921 |
+
{
|
| 922 |
+
"prompt": "Round-framed eyeglasses lie open on a memoir’s pages, slender metal rims catching a beam of sunlight.",
|
| 923 |
+
"missing_element": "lenses",
|
| 924 |
+
"question_1": "Are there eyeglasses , could be either with or without lenses in the image",
|
| 925 |
+
"question_2": "Are the lenses absent"
|
| 926 |
+
},
|
| 927 |
+
{
|
| 928 |
+
"prompt": "A weathered sailboat drifts beside a quiet dock, its wooden hull creaking gently against worn pilings.",
|
| 929 |
+
"missing_element": "mast",
|
| 930 |
+
"question_1": "Is there a sailboat , could be either with or without a mast in the image",
|
| 931 |
+
"question_2": "Is the mast missing"
|
| 932 |
+
},
|
| 933 |
+
{
|
| 934 |
+
"prompt": "A colorful classroom globe rests on a wooden desk, continents vividly painted against deep turquoise seas.",
|
| 935 |
+
"missing_element": "stand",
|
| 936 |
+
"question_1": "Is there a globe , could be either with or without a stand in the image",
|
| 937 |
+
"question_2": "Is the stand absent"
|
| 938 |
+
},
|
| 939 |
+
{
|
| 940 |
+
"prompt": "A collapsed umbrella lies beside a doorway, raindrops glistening on its exposed metal ribs.",
|
| 941 |
+
"missing_element": "canopy",
|
| 942 |
+
"question_1": "Is there an umbrella , could be either with or without a canopy in the image",
|
| 943 |
+
"question_2": "Is the canopy missing"
|
| 944 |
+
},
|
| 945 |
+
{
|
| 946 |
+
"prompt": "An acoustic guitar leans against a barstool under warm stage lights, its honey-coloured body polished to a mirror sheen.",
|
| 947 |
+
"missing_element": "strings",
|
| 948 |
+
"question_1": "Is there a guitar , could be either with or without strings in the image",
|
| 949 |
+
"question_2": "Are the strings missing"
|
| 950 |
+
},
|
| 951 |
+
{
|
| 952 |
+
"prompt": "A tall lighthouse towers above a misty headland, red and white stripes bold against the gray sky.",
|
| 953 |
+
"missing_element": "door",
|
| 954 |
+
"question_1": "Is there a lighthouse , could be either with or without a door in the image",
|
| 955 |
+
"question_2": "Is the door absent"
|
| 956 |
+
},
|
| 957 |
+
{
|
| 958 |
+
"prompt": "A retired jet airplane sits in a museum hangar, polished aluminum skin reflecting overhead lamps.",
|
| 959 |
+
"missing_element": "wings",
|
| 960 |
+
"question_1": "Is there an airplane , could be either with or without wings in the image",
|
| 961 |
+
"question_2": "Are the wings missing"
|
| 962 |
+
},
|
| 963 |
+
{
|
| 964 |
+
"prompt": "A medieval stone fortress stands overlooking a winding river, colorful banners fluttering from its rugged towers.",
|
| 965 |
+
"missing_element": "drawbridge",
|
| 966 |
+
"question_1": "Is there a fortress , could be either with or without a drawbridge in the image",
|
| 967 |
+
"question_2": "Is the drawbridge missing"
|
| 968 |
+
},
|
| 969 |
+
{
|
| 970 |
+
"prompt": "A classic sedan is parked beneath a lone streetlamp on a still night, chrome trim gleaming softly.",
|
| 971 |
+
"missing_element": "headlights",
|
| 972 |
+
"question_1": "Is there a sedan , could be either with or without headlights in the image",
|
| 973 |
+
"question_2": "Are the headlights missing"
|
| 974 |
+
},
|
| 975 |
+
{
|
| 976 |
+
"prompt": "A majestic oak rises from a sunny meadow, gnarled branches spreading wide against clear blue sky.",
|
| 977 |
+
"missing_element": "leaves",
|
| 978 |
+
"question_1": "Is there an oak tree , could be either with or without leaves in the image",
|
| 979 |
+
"question_2": "Are the leaves absent"
|
| 980 |
+
},
|
| 981 |
+
{
|
| 982 |
+
"prompt": "A green frog sits serenely on a lily pad amid gentle pond ripples.",
|
| 983 |
+
"missing_element": "legs",
|
| 984 |
+
"question_1": "Is there a frog , could be either with or without legs in the image",
|
| 985 |
+
"question_2": "Are the legs missing"
|
| 986 |
+
},
|
| 987 |
+
{
|
| 988 |
+
"prompt": "A wooden rocking chair rests on a weather-beaten porch, faded paint revealing layers of aging varnish.",
|
| 989 |
+
"missing_element": "seat",
|
| 990 |
+
"question_1": "Is there a rocking chair , could be either with or without a seat in the image",
|
| 991 |
+
"question_2": "Is the seat missing"
|
| 992 |
+
},
|
| 993 |
+
{
|
| 994 |
+
"prompt": "A vintage film camera is displayed on a glass shelf, its leather body pristine and meticulously polished.",
|
| 995 |
+
"missing_element": "lens",
|
| 996 |
+
"question_1": "Is there a film camera , could be either with or without a lens in the image",
|
| 997 |
+
"question_2": "Is the lens absent"
|
| 998 |
+
},
|
| 999 |
+
{
|
| 1000 |
+
"prompt": "A hardcover novel stands upright on a coffee table, its title embossed in ornate gold lettering.",
|
| 1001 |
+
"missing_element": "pages",
|
| 1002 |
+
"question_1": "Is there a book , could be either with or without pages in the image",
|
| 1003 |
+
"question_2": "Are the pages missing"
|
| 1004 |
+
},
|
| 1005 |
+
{
|
| 1006 |
+
"prompt": "An elegant hourglass rests on a mahogany desk, brass frame catching the glow of a desk lamp.",
|
| 1007 |
+
"missing_element": "sand",
|
| 1008 |
+
"question_1": "Is there an hourglass , could be either with or without sand in the image",
|
| 1009 |
+
"question_2": "Is the sand missing"
|
| 1010 |
+
},
|
| 1011 |
+
{
|
| 1012 |
+
"prompt": "A small sparrow is perched on a wooden fence post under a brooding sky.",
|
| 1013 |
+
"missing_element": "wings",
|
| 1014 |
+
"question_1": "Is there a sparrow , could be either with or without wings in the image",
|
| 1015 |
+
"question_2": "Are the wings absent"
|
| 1016 |
+
},
|
| 1017 |
+
{
|
| 1018 |
+
"prompt": "A tall brick clock tower rises above a bustling town square, its silhouette glowing in sunset light.",
|
| 1019 |
+
"missing_element": "clock face",
|
| 1020 |
+
"question_1": "Is there a clock tower , could be either with or without a clock face in the image",
|
| 1021 |
+
"question_2": "Is the clock face missing"
|
| 1022 |
+
},
|
| 1023 |
+
{
|
| 1024 |
+
"prompt": "A black ski mask is folded neatly on a wooden bench beside a locker.",
|
| 1025 |
+
"missing_element": "eye holes",
|
| 1026 |
+
"question_1": "Is there a ski mask , could be either with or without eye holes in the image",
|
| 1027 |
+
"question_2": "Are the eye holes missing"
|
| 1028 |
+
},
|
| 1029 |
+
{
|
| 1030 |
+
"prompt": "A cast-iron frying pan rests on a stovetop, its dark seasoned surface slightly glossy.",
|
| 1031 |
+
"missing_element": "handle",
|
| 1032 |
+
"question_1": "Is there a frying pan , could be either with or without a handle in the image",
|
| 1033 |
+
"question_2": "Is the handle missing"
|
| 1034 |
+
},
|
| 1035 |
+
{
|
| 1036 |
+
"prompt": "A bright red scooter stands on a cobblestone lane, its glossy body reflecting ambient city lights.",
|
| 1037 |
+
"missing_element": "handlebars",
|
| 1038 |
+
"question_1": "Is there a scooter , could be either with or without handlebars in the image",
|
| 1039 |
+
"question_2": "Are the handlebars missing"
|
| 1040 |
+
},
|
| 1041 |
+
{
|
| 1042 |
+
"prompt": "A snail glides slowly along a dew-covered garden leaf under morning light.",
|
| 1043 |
+
"missing_element": "shell",
|
| 1044 |
+
"question_1": "Is there a snail , could be either with or without a shell in the image",
|
| 1045 |
+
"question_2": "Is the shell absent"
|
| 1046 |
+
},
|
| 1047 |
+
{
|
| 1048 |
+
"prompt": "A rugged hiking backpack leans against a pine tree at the trail’s edge, fabric dusted with chalky dirt.",
|
| 1049 |
+
"missing_element": "straps",
|
| 1050 |
+
"question_1": "Is there a backpack , could be either with or without straps in the image",
|
| 1051 |
+
"question_2": "Are the straps missing"
|
| 1052 |
+
},
|
| 1053 |
+
{
|
| 1054 |
+
"prompt": "A roadside mailbox sits atop a weathered wooden post, its paint slightly chipped.",
|
| 1055 |
+
"missing_element": "flag",
|
| 1056 |
+
"question_1": "Is there a mailbox , could be either with or without a flag in the image",
|
| 1057 |
+
"question_2": "Is the flag absent"
|
| 1058 |
+
},
|
| 1059 |
+
{
|
| 1060 |
+
"prompt": "A retro television set stands on tapered legs in a mid-century living room, wood veneer polished to a warm glow.",
|
| 1061 |
+
"missing_element": "screen",
|
| 1062 |
+
"question_1": "Is there a television , could be either with or without a screen in the image",
|
| 1063 |
+
"question_2": "Is the screen missing"
|
| 1064 |
+
},
|
| 1065 |
+
{
|
| 1066 |
+
"prompt": "A brass desk lamp sits beside a stack of papers, its curved shade reflecting amber light.",
|
| 1067 |
+
"missing_element": "bulb",
|
| 1068 |
+
"question_1": "Is there a lamp , could be either with or without a bulb in the image",
|
| 1069 |
+
"question_2": "Is the bulb absent"
|
| 1070 |
+
},
|
| 1071 |
+
{
|
| 1072 |
+
"prompt": "A motorcycle helmet lies on a workbench, its glossy surface speckled with sawdust.",
|
| 1073 |
+
"missing_element": "visor",
|
| 1074 |
+
"question_1": "Is there a helmet , could be either with or without a visor in the image",
|
| 1075 |
+
"question_2": "Is the visor missing"
|
| 1076 |
+
},
|
| 1077 |
+
{
|
| 1078 |
+
"prompt": "A grand piano dominates a silent concert hall stage, black lacquer gleaming under spotlights.",
|
| 1079 |
+
"missing_element": "keys",
|
| 1080 |
+
"question_1": "Is there a piano , could be either with or without keys in the image",
|
| 1081 |
+
"question_2": "Are the keys missing"
|
| 1082 |
+
},
|
| 1083 |
+
{
|
| 1084 |
+
"prompt": "An old stone windmill stands amid golden wheat fields under an expansive blue sky.",
|
| 1085 |
+
"missing_element": "blades",
|
| 1086 |
+
"question_1": "Is there a windmill , could be either with or without blades in the image",
|
| 1087 |
+
"question_2": "Are the blades absent"
|
| 1088 |
+
},
|
| 1089 |
+
{
|
| 1090 |
+
"prompt": "A large observatory telescope is mounted on a sturdy tripod inside a domed chamber.",
|
| 1091 |
+
"missing_element": "eyepiece",
|
| 1092 |
+
"question_1": "Is there a telescope , could be either with or without an eyepiece in the image",
|
| 1093 |
+
"question_2": "Is the eyepiece missing"
|
| 1094 |
+
},
|
| 1095 |
+
{
|
| 1096 |
+
"prompt": "A baby stroller is parked beside a park bench, fabric hood casting a gentle shade.",
|
| 1097 |
+
"missing_element": "wheels",
|
| 1098 |
+
"question_1": "Is there a stroller , could be either with or without wheels in the image",
|
| 1099 |
+
"question_2": "Are the wheels missing"
|
| 1100 |
+
},
|
| 1101 |
+
{
|
| 1102 |
+
"prompt": "A ginger cat curls up on a sunlit windowsill, purring softly in the warm glow.",
|
| 1103 |
+
"missing_element": "tail",
|
| 1104 |
+
"question_1": "Is there a cat , could be either with or without a tail in the image",
|
| 1105 |
+
"question_2": "Is the tail absent"
|
| 1106 |
+
},
|
| 1107 |
+
{
|
| 1108 |
+
"prompt": "A smoking pipe rests atop a leather-bound journal, polished wood glowing softly.",
|
| 1109 |
+
"missing_element": "stem",
|
| 1110 |
+
"question_1": "Is there a pipe , could be either with or without a stem in the image",
|
| 1111 |
+
"question_2": "Is the stem missing"
|
| 1112 |
+
},
|
| 1113 |
+
{
|
| 1114 |
+
"prompt": "A fountain pen lies diagonally across parchment, its marbled barrel shimmering under lamplight.",
|
| 1115 |
+
"missing_element": "nib",
|
| 1116 |
+
"question_1": "Is there a fountain pen , could be either with or without a nib in the image",
|
| 1117 |
+
"question_2": "Is the nib absent"
|
| 1118 |
+
},
|
| 1119 |
+
{
|
| 1120 |
+
"prompt": "An ornate picture frame hangs on a gallery wall, intricate gilded borders catching overhead lighting.",
|
| 1121 |
+
"missing_element": "glass",
|
| 1122 |
+
"question_1": "Is there a picture frame , could be either with or without glass in the image",
|
| 1123 |
+
"question_2": "Is the glass missing"
|
| 1124 |
+
},
|
| 1125 |
+
{
|
| 1126 |
+
"prompt": "A skateboard rests on a graffiti-sprayed ramp, deck graphics vibrant and scuffed at the edges.",
|
| 1127 |
+
"missing_element": "wheels",
|
| 1128 |
+
"question_1": "Is there a skateboard , could be either with or without wheels in the image",
|
| 1129 |
+
"question_2": "Are the wheels missing"
|
| 1130 |
+
},
|
| 1131 |
+
{
|
| 1132 |
+
"prompt": "A platinum engagement ring sits in a velvet box under a small spotlight.",
|
| 1133 |
+
"missing_element": "gemstone",
|
| 1134 |
+
"question_1": "Is there a ring , could be either with or without a gemstone in the image",
|
| 1135 |
+
"question_2": "Is the gemstone absent"
|
| 1136 |
+
},
|
| 1137 |
+
{
|
| 1138 |
+
"prompt": "A white rocket stands upright on a launch pad against a pale dawn sky, service towers flanking it.",
|
| 1139 |
+
"missing_element": "fins",
|
| 1140 |
+
"question_1": "Is there a rocket , could be either with or without fins in the image",
|
| 1141 |
+
"question_2": "Are the fins missing"
|
| 1142 |
+
},
|
| 1143 |
+
{
|
| 1144 |
+
"prompt": "Over-ear headphones are draped across a mixing console, their matte black shells shining softly.",
|
| 1145 |
+
"missing_element": "ear pads",
|
| 1146 |
+
"question_1": "Are there headphones , could be either with or without ear pads in the image",
|
| 1147 |
+
"question_2": "Are the ear pads missing"
|
| 1148 |
+
},
|
| 1149 |
+
{
|
| 1150 |
+
"prompt": "A cotton T-shirt is neatly folded on a wooden shelf, its vibrant graphic centered on the chest.",
|
| 1151 |
+
"missing_element": "sleeves",
|
| 1152 |
+
"question_1": "Is there a T-shirt , could be either with or without sleeves in the image",
|
| 1153 |
+
"question_2": "Are the sleeves missing"
|
| 1154 |
+
},
|
| 1155 |
+
{
|
| 1156 |
+
"prompt": "A snowman stands in a quiet front yard, two coal eyes and a jaunty hat giving it character.",
|
| 1157 |
+
"missing_element": "nose",
|
| 1158 |
+
"question_1": "Is there a snowman , could be either with or without a nose in the image",
|
| 1159 |
+
"question_2": "Is the nose missing"
|
| 1160 |
+
},
|
| 1161 |
+
{
|
| 1162 |
+
"prompt": "A worn canvas sneaker lies abandoned on a beach boardwalk, sand sprinkled across its fabric.",
|
| 1163 |
+
"missing_element": "laces",
|
| 1164 |
+
"question_1": "Is there a sneaker , could be either with or without laces in the image",
|
| 1165 |
+
"question_2": "Are the laces absent"
|
| 1166 |
+
},
|
| 1167 |
+
{
|
| 1168 |
+
"prompt": "A rustic lantern hangs from a cabin beam, metal frame dark with age.",
|
| 1169 |
+
"missing_element": "glass panes",
|
| 1170 |
+
"question_1": "Is there a lantern , could be either with or without glass panes in the image",
|
| 1171 |
+
"question_2": "Are the glass panes missing"
|
| 1172 |
+
},
|
| 1173 |
+
{
|
| 1174 |
+
"prompt": "A mechanical keyboard rests on a neon-lit desk, keycaps glowing with colorful backlight.",
|
| 1175 |
+
"missing_element": "spacebar",
|
| 1176 |
+
"question_1": "Is there a keyboard , could be either with or without a spacebar in the image",
|
| 1177 |
+
"question_2": "Is the spacebar missing"
|
| 1178 |
+
},
|
| 1179 |
+
{
|
| 1180 |
+
"prompt": "A plush teddy bear is propped against a pillow in a child’s room, its fur softly illuminated by night-light glow.",
|
| 1181 |
+
"missing_element": "eyes",
|
| 1182 |
+
"question_1": "Is there a teddy bear , could be either with or without eyes in the image",
|
| 1183 |
+
"question_2": "Are the eyes absent"
|
| 1184 |
+
},
|
| 1185 |
+
{
|
| 1186 |
+
"prompt": "A basketball hoop hangs above a driveway, backboard edges chipped from years of play.",
|
| 1187 |
+
"missing_element": "net",
|
| 1188 |
+
"question_1": "Is there a basketball hoop , could be either with or without a net in the image",
|
| 1189 |
+
"question_2": "Is the net missing"
|
| 1190 |
+
},
|
| 1191 |
+
{
|
| 1192 |
+
"prompt": "A crystal wine glass stands atop a linen napkin beside polished silverware.",
|
| 1193 |
+
"missing_element": "stem",
|
| 1194 |
+
"question_1": "Is there a wine glass , could be either with or without a stem in the image",
|
| 1195 |
+
"question_2": "Is the stem absent"
|
| 1196 |
+
},
|
| 1197 |
+
{
|
| 1198 |
+
"prompt": "A decorative pocket mirror lies on a marble vanity, ornate silver backing engraved with curling vines.",
|
| 1199 |
+
"missing_element": "reflective surface",
|
| 1200 |
+
"question_1": "Is there a pocket mirror , could be either with or without a reflective surface in the image",
|
| 1201 |
+
"question_2": "Is the reflective surface missing"
|
| 1202 |
}
|
| 1203 |
]
|
src/__pycache__/sd3_pipeline.cpython-310.pyc
CHANGED
|
Binary files a/src/__pycache__/sd3_pipeline.cpython-310.pyc and b/src/__pycache__/sd3_pipeline.cpython-310.pyc differ
|
|
|
src/sd3_pipeline.py
CHANGED
|
@@ -469,7 +469,8 @@ class VSFStableDiffusion3Pipeline(StableDiffusion3Pipeline):
|
|
| 469 |
mu: Optional[float] = None,
|
| 470 |
scale: float = 3.0,
|
| 471 |
offset: float = 0.08,
|
| 472 |
-
collect_steps: List = None
|
|
|
|
| 473 |
):
|
| 474 |
r"""
|
| 475 |
Function invoked when calling the pipeline for generation.
|
|
@@ -641,18 +642,22 @@ class VSFStableDiffusion3Pipeline(StableDiffusion3Pipeline):
|
|
| 641 |
prompt_3=prompt,
|
| 642 |
do_classifier_free_guidance=False,
|
| 643 |
)
|
| 644 |
-
|
| 645 |
-
|
| 646 |
-
|
| 647 |
-
|
| 648 |
-
|
| 649 |
-
|
| 650 |
-
|
| 651 |
-
|
| 652 |
-
|
| 653 |
-
|
| 654 |
-
|
| 655 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
| 656 |
prompt_embeds = torch.cat([pos_prompt_embeds, neg_prompt_embeds], dim=1)
|
| 657 |
|
| 658 |
neg_len = neg_prompt_embeds.shape[1]
|
|
|
|
| 469 |
mu: Optional[float] = None,
|
| 470 |
scale: float = 3.0,
|
| 471 |
offset: float = 0.08,
|
| 472 |
+
collect_steps: List = None,
|
| 473 |
+
image_neg_embeds: Optional[torch.FloatTensor] = None,
|
| 474 |
):
|
| 475 |
r"""
|
| 476 |
Function invoked when calling the pipeline for generation.
|
|
|
|
| 642 |
prompt_3=prompt,
|
| 643 |
do_classifier_free_guidance=False,
|
| 644 |
)
|
| 645 |
+
|
| 646 |
+
if image_neg_embeds is not None:
|
| 647 |
+
negative_prompt_embeds = image_neg_embeds
|
| 648 |
+
else:
|
| 649 |
+
(
|
| 650 |
+
neg_prompt_embeds,
|
| 651 |
+
_,
|
| 652 |
+
neg_pooled_prompt_embeds,
|
| 653 |
+
_,
|
| 654 |
+
) = self.encode_prompt(
|
| 655 |
+
prompt=negative_prompt,
|
| 656 |
+
prompt_2=negative_prompt,
|
| 657 |
+
prompt_3=negative_prompt,
|
| 658 |
+
do_classifier_free_guidance=False,
|
| 659 |
+
padding=False
|
| 660 |
+
)
|
| 661 |
prompt_embeds = torch.cat([pos_prompt_embeds, neg_prompt_embeds], dim=1)
|
| 662 |
|
| 663 |
neg_len = neg_prompt_embeds.shape[1]
|
wheel.webp
ADDED
|