Spaces:
Runtime error
Runtime error
Add caption+grounding tasks
#1
by
leoxiaobin
- opened
app.py
CHANGED
|
@@ -135,6 +135,33 @@ def process_image(image, task_prompt, text_input=None, model_id='microsoft/Flore
|
|
| 135 |
task_prompt = '<MORE_DETAILED_CAPTION>'
|
| 136 |
results = run_example(task_prompt, image, model_id=model_id)
|
| 137 |
return results, None
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 138 |
elif task_prompt == 'Object Detection':
|
| 139 |
task_prompt = '<OD>'
|
| 140 |
results = run_example(task_prompt, image, model_id=model_id)
|
|
@@ -210,7 +237,8 @@ with gr.Blocks(css=css) as demo:
|
|
| 210 |
input_img = gr.Image(label="Input Picture")
|
| 211 |
model_selector = gr.Dropdown(choices=list(models.keys()), label="Model", value='microsoft/Florence-2-large')
|
| 212 |
task_prompt = gr.Dropdown(choices=[
|
| 213 |
-
'Caption', 'Detailed Caption', 'More Detailed Caption', 'Object Detection',
|
|
|
|
| 214 |
'Dense Region Caption', 'Region Proposal', 'Caption to Phrase Grounding',
|
| 215 |
'Referring Expression Segmentation', 'Region to Segmentation',
|
| 216 |
'Open Vocabulary Detection', 'Region to Category', 'Region to Description',
|
|
|
|
| 135 |
task_prompt = '<MORE_DETAILED_CAPTION>'
|
| 136 |
results = run_example(task_prompt, image, model_id=model_id)
|
| 137 |
return results, None
|
| 138 |
+
elif task_prompt == 'Caption + Grounding':
|
| 139 |
+
task_prompt = '<CAPTION>'
|
| 140 |
+
results = run_example(task_prompt, image, model_id=model_id)
|
| 141 |
+
text_input = results[task_prompt]
|
| 142 |
+
task_prompt = '<CAPTION_TO_PHRASE_GROUNDING>'
|
| 143 |
+
results = run_example(task_prompt, image, text_input, model_id)
|
| 144 |
+
results['<CAPTION>'] = text_input
|
| 145 |
+
fig = plot_bbox(image, results['<CAPTION_TO_PHRASE_GROUNDING>'])
|
| 146 |
+
return results, fig_to_pil(fig)
|
| 147 |
+
elif task_prompt == 'Detailed Caption + Grounding':
|
| 148 |
+
task_prompt = '<DETAILED_CAPTION>'
|
| 149 |
+
results = run_example(task_prompt, image, model_id=model_id)
|
| 150 |
+
text_input = results[task_prompt]
|
| 151 |
+
task_prompt = '<CAPTION_TO_PHRASE_GROUNDING>'
|
| 152 |
+
results = run_example(task_prompt, image, text_input, model_id)
|
| 153 |
+
results['<DETAILED_CAPTION>'] = text_input
|
| 154 |
+
fig = plot_bbox(image, results['<CAPTION_TO_PHRASE_GROUNDING>'])
|
| 155 |
+
return results, fig_to_pil(fig)
|
| 156 |
+
elif task_prompt == 'More Detailed Caption + Grounding':
|
| 157 |
+
task_prompt = '<MORE_DETAILED_CAPTION>'
|
| 158 |
+
results = run_example(task_prompt, image, model_id=model_id)
|
| 159 |
+
text_input = results[task_prompt]
|
| 160 |
+
task_prompt = '<CAPTION_TO_PHRASE_GROUNDING>'
|
| 161 |
+
results = run_example(task_prompt, image, text_input, model_id)
|
| 162 |
+
results['<MORE_DETAILED_CAPTION>'] = text_input
|
| 163 |
+
fig = plot_bbox(image, results['<CAPTION_TO_PHRASE_GROUNDING>'])
|
| 164 |
+
return results, fig_to_pil(fig)
|
| 165 |
elif task_prompt == 'Object Detection':
|
| 166 |
task_prompt = '<OD>'
|
| 167 |
results = run_example(task_prompt, image, model_id=model_id)
|
|
|
|
| 237 |
input_img = gr.Image(label="Input Picture")
|
| 238 |
model_selector = gr.Dropdown(choices=list(models.keys()), label="Model", value='microsoft/Florence-2-large')
|
| 239 |
task_prompt = gr.Dropdown(choices=[
|
| 240 |
+
'Caption', 'Detailed Caption', 'More Detailed Caption', 'Caption + Grounding',
|
| 241 |
+
'Detailed Caption + Grounding', 'More Detailed Caption + Grounding', 'Object Detection',
|
| 242 |
'Dense Region Caption', 'Region Proposal', 'Caption to Phrase Grounding',
|
| 243 |
'Referring Expression Segmentation', 'Region to Segmentation',
|
| 244 |
'Open Vocabulary Detection', 'Region to Category', 'Region to Description',
|