Spaces: Running on Zero
Update app.py
app.py CHANGED
@@ -31,28 +31,31 @@ print(f'Loading info of Ovis-U1:\n{loading_info}')
 model = model.eval().to("cuda")
 model = model.to(torch.bfloat16)
 
-def set_global_seed(seed: int = 42):
+def set_global_seed(seed: int = 42, show_api=False):
     random.seed(seed)
     np.random.seed(seed)
     torch.manual_seed(seed)
     torch.cuda.manual_seed_all(seed)
 
-def randomize_seed_fn(seed: int, randomize: bool) -> int:
+def randomize_seed_fn(seed: int, randomize: bool, show_api=False) -> int:
     return random.randint(0, MAX_SEED) if randomize else seed
 
 @spaces.GPU(duration=20)
 def process_txt_to_img(prompt: str, height: int, width: int, steps: int, final_seed: int, guidance_scale: float, progress: gr.Progress = gr.Progress(track_tqdm=True)) -> list[Image.Image]:
+    """Use Ovis-U1-3B to generate an image. Supply a Text Prompt"""
     set_global_seed(final_seed)
     images = pipe_t2i(model, prompt, height, width, steps, cfg=guidance_scale, seed=final_seed)
     return images
 
 @spaces.GPU(duration=20)
 def process_img_to_txt(prompt: str, img: Image.Image, progress: gr.Progress = gr.Progress(track_tqdm=True)) -> str:
+    """Use Ovis-U1-3B to analyse an Image"""
     output_text = pipe_txt_gen(model, img, prompt)
     return output_text
 
 @spaces.GPU(duration=20)
 def process_img_txt_to_img(prompt: str, img: Image.Image, steps: int, final_seed: int, txt_cfg: float, img_cfg: float, progress: gr.Progress = gr.Progress(track_tqdm=True)) -> list[Image.Image]:
+    """Use Ovis-U1-3B to modify an Image. Supply an Image URL and a Text Prompt (e.g. 'ghiblify', 'low-poly 3d render', 'replace house with car')"""
     set_global_seed(final_seed)
     images = pipe_img_edit(model, img, prompt, steps, txt_cfg, img_cfg, seed=final_seed)
     return images
@@ -206,8 +209,7 @@ with gr.Blocks(title="Ovis-U1-3B") as demo:
     output_text = gr.Textbox(label="Generated Text", visible=False, lines=5, interactive=False)
 
     @spaces.GPU(duration=20)
-    def run_img_txt_to_img_tab(prompt, img, steps, seed, txt_cfg, img_cfg, progress=gr.Progress(track_tqdm=True)):
-        """Use Ovis-U1-3B to modify an image. Supply Image and Text Prompt"""
+    def run_img_txt_to_img_tab(prompt, img, steps, seed, txt_cfg, img_cfg, progress=gr.Progress(track_tqdm=True), show_api=False):
         if img is None:
             return (
                 gr.update(value=[], visible=False),
@@ -221,7 +223,7 @@ with gr.Blocks(title="Ovis-U1-3B") as demo:
         )
 
     @spaces.GPU(duration=20)
-    def run_txt_to_img_tab(prompt, height, width, steps, seed, guidance, progress=gr.Progress(track_tqdm=True)):
+    def run_txt_to_img_tab(prompt, height, width, steps, seed, guidance, progress=gr.Progress(track_tqdm=True), show_api=False):
         """Use Ovis-U1-3B to generate an Image."""
         # Seed is already finalized by the randomize_seed_fn in the click chain
         imgs = process_txt_to_img(prompt, height, width, steps, seed, guidance, progress=progress)
@@ -231,7 +233,7 @@ with gr.Blocks(title="Ovis-U1-3B") as demo:
         )
 
     @spaces.GPU(duration=20)
-    def run_img_to_txt_tab(img, prompt, progress=gr.Progress(track_tqdm=True)):
+    def run_img_to_txt_tab(img, prompt, progress=gr.Progress(track_tqdm=True), show_api=False):
         """Use Ovis-U1-3B to understand an Image (Vision processing)"""
         if img is None:
             return (