Spaces:
Runtime error
Runtime error
File size: 468 Bytes
9704a98 69649ce |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 |
import gradio as gr
import spaces  # provides the @spaces.GPU decorator applied to `infer`
import transformers
# Build the text-generation pipeline once at import time so every request
# reuses the same loaded model.
# The device is passed to the factory: a transformers pipeline object does not
# offer a `.to()` method (that idiom belongs to diffusers pipelines), so the
# former `pipe.to('cuda')` call failed at startup.
pipe = transformers.pipeline(
    "text-generation",
    model="marcelbinz/Llama-3.1-Minitaur-8B",
    device="cuda",
)
@spaces.GPU
def infer(prompt, max_tokens):
    """Run the module-level pipeline on *prompt* and return the generated text.

    ``max_tokens`` is converted with ``int()`` and forwarded to the pipeline
    as ``max_new_tokens``. The return value is the ``"generated_text"`` entry
    of the first result the pipeline produces.
    """
    token_budget = int(max_tokens)
    results = pipe(prompt, max_new_tokens=token_budget)
    first_result = results[0]
    return first_result["generated_text"]
# Web UI for the model. `infer` takes two positional arguments
# (prompt, max_tokens), so the interface must declare two input components in
# that same order; with a single text box every request failed on the missing
# `max_tokens` argument.
demo = gr.Interface(
    fn=infer,
    inputs=[
        gr.Text(label="Prompt"),
        # Slider bounds and default are UI choices, not model limits.
        gr.Slider(minimum=1, maximum=512, value=64, step=1, label="Max new tokens"),
    ],
    outputs="text",
    title="Minitaur",
    description="Just type and hit *Run*",
)
demo.launch()