Linoy Tsaban committed
Commit 5c86655 · 1 Parent(s): f58d8b8

Update app.py

fix auto-inversion and auto-caption when removing an image
app.py
CHANGED
@@ -27,12 +27,14 @@ blip_model = BlipForConditionalGeneration.from_pretrained("Salesforce/blip-image
 ## IMAGE CPATIONING ##
 def caption_image(input_image):
 
-    inputs = blip_processor(images=input_image, return_tensors="pt").to(device)
-    pixel_values = inputs.pixel_values
+    if not input_image is None:
+        inputs = blip_processor(images=input_image, return_tensors="pt").to(device)
+        pixel_values = inputs.pixel_values
 
-    generated_ids = blip_model.generate(pixel_values=pixel_values, max_length=50)
-    generated_caption = blip_processor.batch_decode(generated_ids, skip_special_tokens=True)[0]
-    return generated_caption
+        generated_ids = blip_model.generate(pixel_values=pixel_values, max_length=50)
+        generated_caption = blip_processor.batch_decode(generated_ids, skip_special_tokens=True)[0]
+        return generated_caption
+    return ""
 
 
 ## DDPM INVERSION AND SAMPLING ##
@@ -361,8 +363,10 @@ with gr.Blocks(css="style.css") as demo:
 
 
     def reset_do_inversion():
-        do_inversion = True
-        return do_inversion
+        if not input_image is None:
+            return True
+        else:
+            return False
 
     def reset_do_reconstruction():
         do_reconstruction = True
@@ -597,6 +601,7 @@ with gr.Blocks(css="style.css") as demo:
     # Automatically start inverting upon input_image change
     input_image.change(
        fn = reset_do_inversion,
+       inputs = [input_image],
        outputs = [do_inversion],
        queue = False).then(fn = caption_image,
        inputs = [input_image],
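
Why the extra guards and the new inputs argument matter: when the uploaded image is removed, Gradio still fires the Image component's .change event and passes None to the handlers, so caption_image and reset_do_inversion now receive the current image value and handle the None case instead of trying to caption or invert a missing image. Below is a minimal, self-contained sketch of that wiring; it is not code from this Space, the handler and component names are illustrative, and a recent Gradio Blocks API is assumed.

import gradio as gr

def caption_or_empty(img):
    # Mirrors the guard added in this commit: return an empty caption when
    # the image was removed (Gradio passes None in that case).
    return "" if img is None else "an image is present"

def should_invert(img):
    # Only request a new inversion when an image is actually loaded.
    return img is not None

with gr.Blocks() as demo:
    input_image = gr.Image(type="pil")
    do_inversion = gr.State(False)
    caption = gr.Textbox(label="caption")

    # Clearing the image also fires .change (with the component value None),
    # so both handlers receive the value and can decide what to do.
    input_image.change(fn=should_invert,
                       inputs=[input_image],
                       outputs=[do_inversion],
                       queue=False).then(fn=caption_or_empty,
                                         inputs=[input_image],
                                         outputs=[caption])

demo.launch()

With this pattern, clearing the image sets the inversion flag to False and yields an empty caption, which matches the behavior described in the commit message.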