Spaces:

ankandrew
/

MiMo-VL-7B

Running on Zero

ankandrew committed 19 days ago

Commit

f3ecef9

verified ·

1 Parent(s): 082e877

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -54,7 +54,8 @@ def downsample_video(video_path):
     vidcap.release()
     return frames
-MODEL_ID = "XiaomiMiMo/MiMo-VL-7B-RL"
 processor = AutoProcessor.from_pretrained(MODEL_ID, trust_remote_code=True)
 model = Qwen2_5_VLForConditionalGeneration.from_pretrained(
     MODEL_ID,
@@ -156,7 +157,7 @@ def model_inference(input_dict, history):
 demo = gr.ChatInterface(
     fn=model_inference,
-    description="# **MiMo-VL-7B-RL `@video-infer for video understanding`**",
     fill_height=True,
     textbox=gr.MultimodalTextbox(label="Query Input", file_types=["image", "video"], file_count="multiple"),
     stop_btn="Stop Generation",

     vidcap.release()
     return frames
+# MODEL_ID = "XiaomiMiMo/MiMo-VL-7B-RL"
+MODEL_ID = "XiaomiMiMo/MiMo-VL-7B-RL-2508"
 processor = AutoProcessor.from_pretrained(MODEL_ID, trust_remote_code=True)
 model = Qwen2_5_VLForConditionalGeneration.from_pretrained(
     MODEL_ID,
 demo = gr.ChatInterface(
     fn=model_inference,
+    description="# **MiMo-VL-7B-RL (2508) `@video-infer for video understanding`**",
     fill_height=True,
     textbox=gr.MultimodalTextbox(label="Query Input", file_types=["image", "video"], file_count="multiple"),
     stop_btn="Stop Generation",