Update app.py
app.py
CHANGED
@@ -121,34 +121,34 @@ def process_image(image, task_prompt, text_input=None):
     elif task_prompt == '<OD>':
         results = run_example(task_prompt, image)
         fig = plot_bbox(image, results['<OD>'])
-        return
+        return results, fig_to_pil(fig)
     elif task_prompt == '<DENSE_REGION_CAPTION>':
         results = run_example(task_prompt, image)
         fig = plot_bbox(image, results['<DENSE_REGION_CAPTION>'])
-        return
+        return results, fig_to_pil(fig)
     elif task_prompt == '<REGION_PROPOSAL>':
         results = run_example(task_prompt, image)
         fig = plot_bbox(image, results['<REGION_PROPOSAL>'])
-        return
+        return results, fig_to_pil(fig)
     elif task_prompt == '<CAPTION_TO_PHRASE_GROUNDING>':
         results = run_example(task_prompt, image, text_input)
         fig = plot_bbox(image, results['<CAPTION_TO_PHRASE_GROUNDING>'])
-        return
+        return results, fig_to_pil(fig)
     elif task_prompt == '<REFERRING_EXPRESSION_SEGMENTATION>':
         results = run_example(task_prompt, image, text_input)
         output_image = copy.deepcopy(image)
         output_image = draw_polygons(output_image, results['<REFERRING_EXPRESSION_SEGMENTATION>'], fill_mask=True)
-        return
+        return results, output_image
     elif task_prompt == '<REGION_TO_SEGMENTATION>':
         results = run_example(task_prompt, image, text_input)
         output_image = copy.deepcopy(image)
         output_image = draw_polygons(output_image, results['<REGION_TO_SEGMENTATION>'], fill_mask=True)
-        return
+        return results, output_image
     elif task_prompt == '<OPEN_VOCABULARY_DETECTION>':
         results = run_example(task_prompt, image, text_input)
         bbox_results = convert_to_od_format(results['<OPEN_VOCABULARY_DETECTION>'])
         fig = plot_bbox(image, bbox_results)
-        return
+        return results, fig_to_pil(fig)
     elif task_prompt == '<REGION_TO_CATEGORY>':
         results = run_example(task_prompt, image, text_input)
         return results, None
@@ -162,7 +162,7 @@ def process_image(image, task_prompt, text_input=None):
         results = run_example(task_prompt, image)
         output_image = copy.deepcopy(image)
         output_image = draw_ocr_bboxes(output_image, results['<OCR_WITH_REGION>'])
-        return
+        return results, output_image
     else:
         return "", None  # Return empty string and None for unknown task prompts

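In short: every task branch of process_image previously ended with a bare return, so the caller (the Gradio UI) received nothing to display. After this change each branch returns the raw results dict together with a displayable image: the annotated copy of the input for the polygon/OCR branches, or the Matplotlib figure converted with fig_to_pil for the bounding-box branches. The implementation of fig_to_pil is not part of this diff; below is a minimal sketch of what such a helper typically looks like, assuming Matplotlib and Pillow are available and that plot_bbox returns a standard Matplotlib figure.

    import io

    import matplotlib.pyplot as plt
    from PIL import Image

    def fig_to_pil(fig):
        # Render the figure to an in-memory PNG buffer.
        buf = io.BytesIO()
        fig.savefig(buf, format="png", bbox_inches="tight")
        buf.seek(0)
        # Force a full load so the image no longer depends on the buffer.
        image = Image.open(buf).convert("RGB")
        # Close the figure so repeated calls do not accumulate open figures.
        plt.close(fig)
        return image

Converting the figure to a PIL image (rather than returning the figure itself) presumably keeps the return type uniform across branches, so a single Gradio Image output component can display both the figure-based and the PIL-based results.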