File size: 974 Bytes
0e37c10
 
 
 
 
 
 
 
 
 
 
 
 
f870519
0e37c10
 
39be3da
 
 
 
 
 
 
 
0e37c10
 
 
 
 
 
 
39be3da
 
0e37c10
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
"""
File: module_vision.py
Description: A module for chat using image + text with a multimodal interface.
Author: Didier Guillevic
Date: 2025-05-08
"""

import gradio as gr
import vlm

def process(message, history):
    """Stream the model response for one chat turn.

    The prompt is assembled from ``message`` and ``history`` by
    ``vlm.build_messages``; every item produced by ``vlm.stream_response``
    for that prompt is then re-yielded unchanged to the caller.
    """
    yield from vlm.stream_response(vlm.build_messages(message, history))

# Sample prompts: one image + text request followed by two text-only
# questions (one in English, one in French).
examples = [
    dict(
        files=['./passport_jp.png'],
        text='Can you describe the image and present the information as a JSON document?',
    ),
    dict(text='How can we rationalize quantum entanglement?'),
    dict(text="Peux-tu expliquer le terme 'quantum spin'?"),
]

#
# User interface
#
with gr.Blocks() as demo:
    # Multimodal chat widget: each user turn is handed to `process`, whose
    # yielded items are streamed back into the conversation.
    # NOTE: cache_examples is left at the library default; an explicit
    # `cache_examples=False` was previously commented out here.
    chat_interface = gr.ChatInterface(
        fn=process,
        type="messages",
        multimodal=True,
        examples=examples,
        description="Chat with text or text+image.",
        stop_btn="Stop Generation",
    )