Spaces:
Running
on
Zero
Running
on
Zero
File size: 863 Bytes
2e01190 9704a98 65872c0 9704a98 bb856a6 b916df8 9704a98 186c6d4 26380ae 186c6d4 26380ae 186c6d4 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 |
import spaces
import gradio as gr
import torch
from transformers import pipeline
# Hub identifier of the checkpoint served by this app.
MODEL_ID = "marcelbinz/Llama-3.1-Minitaur-8B"

# Build the text-generation pipeline once at module import so that every
# call to the handler below reuses the same loaded model.
pipe = pipeline(
    task="text-generation",
    model=MODEL_ID,
    torch_dtype=torch.bfloat16,
    device_map="auto",
)
@spaces.GPU
def infer(prompt):
    """Generate a continuation of ``prompt`` with the module-level ``pipe``.

    The pipeline is called with sampling enabled (``temperature=1.0``), a
    budget of a single new token (``max_new_tokens=1``) and
    ``return_full_text=False``.

    Returns the ``"generated_text"`` field of the first result.
    """
    generations = pipe(
        prompt,
        max_new_tokens=1,
        do_sample=True,
        temperature=1.0,
        return_full_text=False,
    )
    first_result = generations[0]
    return first_result["generated_text"]
# Fixed textarea heights for the two text boxes, matched through the
# ``elem_id`` values assigned to them below.
CUSTOM_CSS = """
#prompt-box textarea {height:200px}
#answer-box textarea {height:320px}
"""

with gr.Blocks(css=CUSTOM_CSS, fill_width=True) as demo:
    # Prompt input and read-only response share one row with equal scale.
    with gr.Row(equal_height=True):
        inp = gr.Textbox(
            label="Prompt",
            elem_id="prompt-box",
            lines=12,
            max_lines=12,
            scale=3,
        )
        outp = gr.Textbox(
            label="Response",
            elem_id="answer-box",
            lines=1,
            interactive=False,
            scale=3,
        )

    # NOTE(review): the original indentation was not recoverable; the button
    # is assumed to live below the row rather than inside it -- confirm.
    run = gr.Button("Run")
    # Clicking the button sends the prompt text to ``infer`` and writes the
    # returned string into the response box.
    run.click(fn=infer, inputs=inp, outputs=outp)

# Enable request queuing, then start the app.
demo.queue().launch()