Spaces:
Sleeping
Sleeping
import gradio as gr | |
from transformers import AutoTokenizer, AutoModelForImageTextToText | |
import torch | |
tokenizer = AutoTokenizer.from_pretrained("HuggingFaceTB/SmolVLM2-2.2B-Instruct") | |
model = AutoModelForImageTextToText.from_pretrained("HuggingFaceTB/SmolVLM2-2.2B-Instruct") | |
model_path = "HuggingFaceTB/SmolVLM2-2.2B-Instruct" | |
processor = AutoProcessor.from_pretrained(model_path) | |
def launch(input): | |
out = model.generate(**input) | |
return(out) | |
iface = gr.Interface(launch, | |
inputs=gr.Image(type='pil'), | |
outputs="text") | |
iface.launch() |