vikhyatk committed on
Commit
c6c8487
·
verified ·
1 Parent(s): 26e1404

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +19 -0
app.py CHANGED
@@ -37,6 +37,7 @@ from threading import Thread
37
  from transformers import AutoModelForCausalLM
38
  from PIL import ImageDraw
39
  from torchvision.transforms.v2 import Resize
 
40
 
41
  os.environ["HF_TOKEN"] = os.environ.get("TOKEN_FROM_SECRET") or True
42
  moondream = AutoModelForCausalLM.from_pretrained(
@@ -204,6 +205,12 @@ def point(img, object):
204
  visible=True, value=img
205
  )
206
 
 
 
 
 
 
 
207
  js = ""
208
 
209
  css = """
@@ -310,6 +317,18 @@ with gr.Blocks(title="moondream vl (new)", css=css, js=js) as demo:
310
  submit.click(point, [img, prompt], [thought, ann])
311
  prompt.submit(point, [img, prompt], [thought, ann])
312
  img.change(point, [img, prompt], [thought, ann])
 
 
 
 
 
 
 
 
 
 
 
 
313
  else:
314
  gr.Markdown("Coming soon!")
315
 
 
37
  from transformers import AutoModelForCausalLM
38
  from PIL import ImageDraw
39
  from torchvision.transforms.v2 import Resize
40
+ from gradio_image_prompter import ImagePrompter
41
 
42
  os.environ["HF_TOKEN"] = os.environ.get("TOKEN_FROM_SECRET") or True
43
  moondream = AutoModelForCausalLM.from_pretrained(
 
205
  visible=True, value=img
206
  )
207
 
208
+ @spaces.GPU(duration=10)
209
+ def localized_query(img_prompt, question):
210
+ img, points = img_prompt["image"], img_prompt["points"]
211
+ yield repr(points), {"text": "..."}
212
+
213
+
214
  js = ""
215
 
216
  css = """
 
317
  submit.click(point, [img, prompt], [thought, ann])
318
  prompt.submit(point, [img, prompt], [thought, ann])
319
  img.change(point, [img, prompt], [thought, ann])
320
+ elif mode == "Localized":
321
+ with gr.Group():
322
+ with gr.Row():
323
+ prompt = gr.Textbox(
324
+ label="Input",
325
+ value="What does the text say?",
326
+ scale=4,
327
+ )
328
+ submit = gr.Button("Submit")
329
+ img = ImagePrompter(show_label=False)
330
+ submit.click(localized_query, [img, prompt], [output, thought])
331
+ prompt.submit(localized_query, [img, prompt], [output, thought])
332
  else:
333
  gr.Markdown("Coming soon!")
334