apitest / app.py
seawolf2357's picture
Create app.py
0096596 verified
raw
history blame
1.56 kB
import gradio as gr
import requests
def call_api(prompt, history, system_prompt, temperature, max_new_tokens, top_p, repetition_penalty):
    """Send a generation request to the remote endpoint and return its reply.

    Every argument is forwarded unchanged as a same-named field of the JSON
    request body.

    Returns:
        The value stored under the ``"response"`` key of the JSON reply.

    Raises:
        requests.HTTPError: If the server answers with a 4xx/5xx status.
        requests.Timeout: If connecting or waiting for the reply takes too long.
        KeyError: If the JSON reply has no ``"response"`` field.
    """
    url = "https://seawolf2357-nvidia-llama-fastapi.hf.space/generate/"
    payload = {
        "prompt": prompt,
        "history": history,
        "system_prompt": system_prompt,
        "temperature": temperature,
        "max_new_tokens": max_new_tokens,
        "top_p": top_p,
        "repetition_penalty": repetition_penalty,
    }
    # requests waits forever by default; bound both the connect and the read
    # phase so a stalled endpoint cannot hang the UI callback indefinitely.
    response = requests.post(url, json=payload, timeout=(10, 300))
    # Fail with a clear HTTP error instead of trying to parse an error page.
    response.raise_for_status()
    return response.json()['response']
def main_interface():
    """Build the Gradio Blocks UI that drives ``call_api``.

    The page holds the prompt, history and system-prompt text boxes, the four
    numeric sampling controls, a "Generate" button and a response text box.
    Clicking the button calls ``call_api`` with the current input values and
    writes its return value into the response box.

    Returns:
        The assembled ``gr.Blocks`` app; the caller is responsible for
        launching it.
    """
    with gr.Blocks() as demo:
        with gr.Row():
            prompt = gr.Textbox(label="Prompt", placeholder="Enter your prompt here...")
            history = gr.Textbox(label="History", placeholder="Enter history here...")
            system_prompt = gr.Textbox(label="System Prompt", placeholder="Enter system prompt here...")
            temperature = gr.Number(label="Temperature", value=0.0)
            # precision=0 makes Gradio round the value and pass it to the
            # callback as an int; a token count should not be sent as a float.
            max_new_tokens = gr.Number(label="Max New Tokens", value=1048, precision=0)
            top_p = gr.Number(label="Top P", value=0.15)
            repetition_penalty = gr.Number(label="Repetition Penalty", value=1.0)
        submit_button = gr.Button("Generate")
        # Named output component, created after the button so it renders below it.
        response_box = gr.Textbox(label="Response")
        submit_button.click(
            fn=call_api,
            inputs=[
                prompt,
                history,
                system_prompt,
                temperature,
                max_new_tokens,
                top_p,
                repetition_penalty,
            ],
            outputs=[response_box],
        )
    return demo
if __name__ == "__main__":
    # Build the interface and start the Gradio server only when this file is
    # executed as a script, not when it is imported.
    demo = main_interface()
    demo.launch()