Spaces:

Didier
/

Mistral_Small_AutoRound

Sleeping

Mistral_Small_AutoRound / module_vision.py

Create module_vision.py

0e37c10 verified 21 days ago

1.01 kB

	"""
	File: module_vision.py
	Description: A module for chat using image + text with a multimodal interface.
	Author: Didier Guillevic
	Date: 2025-05-08
	"""

	import gradio as gr
	import vlm

	def process(message, history):
	    """Stream the model's reply for the latest chat turn.

	    The incoming message and the prior history are handed to
	    ``vlm.build_messages``; everything ``vlm.stream_response`` yields for
	    the resulting messages is relayed to the caller unchanged.

	    Args:
	        message: The newest user input (presumably a dict with "text" and
	            "files" keys, since the chat UI is multimodal -- TODO confirm).
	        history: Earlier conversation turns, as supplied by the chat UI.

	    Yields:
	        Each item produced by ``vlm.stream_response``.
	    """
	    # Delegate with ``yield from`` so the inner stream is driven directly.
	    yield from vlm.stream_response(vlm.build_messages(message, history))

	#examples=[
	# [{"text": "What is happening in the video?", "files": ["Usain_Bolt_floats_to_victory.mp4"]}],
	# [{"text": "Pourrais-tu décrire cette image?", "files": ["le_monde_2025-04-01.jpg"]}],
	# [{"text": "Could you describe the video?", "files": ["threads_brittlestar_post_DIABZcnJ.mp4"]}],
	#]

	#
	# User interface
	#
	with gr.Blocks() as demo:
	    # A single chat widget; ``process`` is the callback that produces
	    # the (streamed) reply for each submitted message.
	    chat_interface = gr.ChatInterface(
	        fn=process,
	        type="messages",
	        # Multimodal input lets the user attach files alongside the text.
	        multimodal=True,
	        stop_btn="Stop Generation",
	        description="Chat with text / text+image / text+video.",
	        # Example prompts are currently disabled (the ``examples`` list
	        # is commented out earlier in this module).
	        #examples=examples,
	        #cache_examples=False,
	    )