File size: 468 Bytes
9704a98
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
69649ce
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
import gradio as gr
import spaces  # provides the @spaces.GPU decorator used below; import before any CUDA use
import transformers

# Build the text-generation pipeline once at import time so every request
# reuses the same loaded model. Placement on the GPU is requested through the
# `device` argument: `transformers.Pipeline` has no `.to()` method, so the
# previous `pipe.to('cuda')` call raised AttributeError.
pipe = transformers.pipeline(
    "text-generation",
    model="marcelbinz/Llama-3.1-Minitaur-8B",
    device="cuda",
)

@spaces.GPU
def infer(prompt, max_tokens=64):
    """Generate text for ``prompt`` with the module-level ``pipe``.

    Args:
        prompt: Text handed to the text-generation pipeline.
        max_tokens: Value passed as ``max_new_tokens`` after ``int()``
            coercion. Defaults to 64 so the function also works when the
            caller supplies only a prompt; ``None`` (e.g. an emptied numeric
            field) falls back to the same default.

    Returns:
        The ``"generated_text"`` entry of the first pipeline result.
    """
    if max_tokens is None:
        max_tokens = 64
    outputs = pipe(prompt, max_new_tokens=int(max_tokens))
    return outputs[0]["generated_text"]

# `infer` takes (prompt, max_tokens), so the interface must supply one input
# component per parameter; with a single input every request failed with a
# missing-argument TypeError.
demo = gr.Interface(
    fn=infer,
    inputs=[
        gr.Text(label="Prompt"),
        gr.Slider(minimum=1, maximum=512, value=64, step=1,
                  label="Max new tokens"),
    ],
    outputs="text",
    title="Minitaur",
    description="Just type and hit *Run*",
)
demo.launch()