Spaces:
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -1,14 +1,15 @@
|
|
1 |
import os
|
2 |
import gradio as gr
|
3 |
import requests
|
|
|
4 |
|
5 |
-
# Função
|
6 |
-
def query_model(context, question):
|
7 |
"""
|
8 |
-
Queries the Nemotron-3-8B-QA API with the provided question and context.
|
|
|
9 |
"""
|
10 |
invoke_url = "https://api.nvcf.nvidia.com/v2/nvcf/pexec/functions/0c60f14d-46cb-465e-b994-227e1c3d5047"
|
11 |
-
# Obtém a API key do ambiente
|
12 |
api_key = os.environ.get("NEMO_API_KEY")
|
13 |
if not api_key:
|
14 |
raise ValueError("Please set the NEMO_API_KEY environment variable.")
|
@@ -17,16 +18,23 @@ def query_model(context, question):
|
|
17 |
"accept": "text/event-stream",
|
18 |
"content-type": "application/json",
|
19 |
}
|
|
|
|
|
|
|
|
|
|
|
20 |
payload = {
|
21 |
"messages": [
|
22 |
{"content": context, "role": "context"},
|
23 |
{"content": question, "role": "user"},
|
24 |
],
|
25 |
-
"temperature":
|
26 |
-
"top_p":
|
27 |
-
"max_tokens":
|
28 |
"stream": True,
|
|
|
29 |
}
|
|
|
30 |
response = requests.post(invoke_url, headers=headers, json=payload, stream=True)
|
31 |
answer = ""
|
32 |
for line in response.iter_lines():
|
@@ -42,45 +50,44 @@ def query_model(context, question):
|
|
42 |
break
|
43 |
return answer
|
44 |
|
|
|
45 |
iface = gr.Interface(
|
46 |
fn=query_model,
|
47 |
inputs=[
|
48 |
gr.Textbox(label="Context", lines=5),
|
49 |
gr.Textbox(label="Question"),
|
|
|
|
|
|
|
|
|
50 |
],
|
51 |
outputs="text",
|
52 |
title="Nemotron-3-8B-QA",
|
53 |
-
description="""
|
54 |
-
<div style="text-align: center; font-size: 1.5em; margin-bottom: 20px;">
|
55 |
<strong>Unlock the Power of AI with Nemotron-3-8B-QA for Precision Question Answering</strong>
|
56 |
</div>
|
57 |
-
|
58 |
<p>
|
59 |
Dive into the realm of advanced AI with the Nemotron-3-8B-QA, a state-of-the-art language model fine-tuned by NVIDIA for unparalleled question answering performance. Built upon the robust Nemotron-3-8B architecture, this 8 billion parameter model is designed to understand and follow instructions with remarkable accuracy, providing you with precise answers to your queries.
|
60 |
</p>
|
61 |
-
|
62 |
<p>
|
63 |
<strong>How to Use:</strong>
|
64 |
</p>
|
65 |
-
|
66 |
<ol>
|
67 |
<li>Provide a <strong>context</strong> in the designated box, offering the model relevant information or background on your question.</li>
|
68 |
<li>Enter your <strong>question</strong> in the next box, making it as clear and specific as possible.</li>
|
|
|
69 |
<li>Click <strong>Submit</strong> to receive a detailed and accurate answer based on the provided context and the model's extensive knowledge base.</li>
|
70 |
</ol>
|
71 |
-
|
72 |
<p>
|
73 |
<strong>This cutting-edge question answering service is powered by NVIDIA NGC, ensuring top-notch performance and reliability, and is completely free to use.</strong>
|
74 |
</p>
|
75 |
-
|
76 |
<p>
|
77 |
<strong>Created by:</strong> @artificialguybr (<a href="https://twitter.com/artificialguybr">Twitter</a>)
|
78 |
</p>
|
79 |
-
|
80 |
<p>
|
81 |
<strong>Discover more:</strong> <a href="https://artificialguy.com">artificialguy.com</a>
|
82 |
</p>
|
83 |
"""
|
84 |
)
|
85 |
|
86 |
-
iface.launch()
|
|
|
1 |
import os
|
2 |
import gradio as gr
|
3 |
import requests
|
4 |
+
import random
|
5 |
|
6 |
+
# Função atualizada para incluir a geração de uma seed aleatória
|
7 |
+
def query_model(context, question, temperature, top_p, max_tokens, seed=""):
|
8 |
"""
|
9 |
+
Queries the Nemotron-3-8B-QA API with the provided question and context, allowing customization of temperature, top_p, max_tokens, and seed.
|
10 |
+
If no seed is provided, generates a random seed within the specified range.
|
11 |
"""
|
12 |
invoke_url = "https://api.nvcf.nvidia.com/v2/nvcf/pexec/functions/0c60f14d-46cb-465e-b994-227e1c3d5047"
|
|
|
13 |
api_key = os.environ.get("NEMO_API_KEY")
|
14 |
if not api_key:
|
15 |
raise ValueError("Please set the NEMO_API_KEY environment variable.")
|
|
|
18 |
"accept": "text/event-stream",
|
19 |
"content-type": "application/json",
|
20 |
}
|
21 |
+
|
22 |
+
# Gera uma seed aleatória se o usuário não especificou uma
|
23 |
+
if not seed:
|
24 |
+
seed = random.randint(0, 18446744073709552000)
|
25 |
+
|
26 |
payload = {
|
27 |
"messages": [
|
28 |
{"content": context, "role": "context"},
|
29 |
{"content": question, "role": "user"},
|
30 |
],
|
31 |
+
"temperature": float(temperature),
|
32 |
+
"top_p": float(top_p),
|
33 |
+
"max_tokens": int(max_tokens),
|
34 |
"stream": True,
|
35 |
+
"seed": int(seed), # Usa a seed especificada ou a gerada aleatoriamente
|
36 |
}
|
37 |
+
|
38 |
response = requests.post(invoke_url, headers=headers, json=payload, stream=True)
|
39 |
answer = ""
|
40 |
for line in response.iter_lines():
|
|
|
50 |
break
|
51 |
return answer
|
52 |
|
53 |
+
# Gradio UI exposing the sampling controls (temperature, top_p, max_tokens)
# and an optional seed, with the seed's accepted range shown in its label.
# NOTE(review): Gradio 3.x+ components take `value=` for the initial value;
# the previous `default=` / `optional=` keywords are not accepted and raise
# TypeError at startup — the likely cause of this Space's "Runtime error".
iface = gr.Interface(
    fn=query_model,
    inputs=[
        gr.Textbox(label="Context", lines=5),
        gr.Textbox(label="Question"),
        # Sampling temperature: higher values give more varied answers.
        gr.Slider(label="Temperature", minimum=0.1, maximum=1.0, step=0.1, value=0.2),
        # Nucleus-sampling probability-mass cutoff.
        gr.Slider(label="Top P", minimum=0.1, maximum=1.0, step=0.1, value=0.7),
        # step=1 so the 1024 initial value is actually reachable (with the
        # original minimum=1 and step=63 the slider could never land on 1024).
        gr.Slider(label="Max Tokens", minimum=1, maximum=1024, step=1, value=1024),
        # Left empty, query_model falls back to a randomly generated seed.
        gr.Textbox(label="Seed (optional, 0 to 18446744073709552000)", value=""),
    ],
    outputs="text",
    title="Nemotron-3-8B-QA",
    description="""<div style="text-align: center; font-size: 1.5em; margin-bottom: 20px;">
    <strong>Unlock the Power of AI with Nemotron-3-8B-QA for Precision Question Answering</strong>
    </div>
    <p>
    Dive into the realm of advanced AI with the Nemotron-3-8B-QA, a state-of-the-art language model fine-tuned by NVIDIA for unparalleled question answering performance. Built upon the robust Nemotron-3-8B architecture, this 8 billion parameter model is designed to understand and follow instructions with remarkable accuracy, providing you with precise answers to your queries.
    </p>
    <p>
    <strong>How to Use:</strong>
    </p>
    <ol>
    <li>Provide a <strong>context</strong> in the designated box, offering the model relevant information or background on your question.</li>
    <li>Enter your <strong>question</strong> in the next box, making it as clear and specific as possible.</li>
    <li>Adjust <strong>Temperature</strong>, <strong>Top P</strong>, <strong>Max Tokens</strong>, and <strong>Seed</strong> (optional) as needed to customize the response.</li>
    <li>Click <strong>Submit</strong> to receive a detailed and accurate answer based on the provided context and the model's extensive knowledge base.</li>
    </ol>
    <p>
    <strong>This cutting-edge question answering service is powered by NVIDIA NGC, ensuring top-notch performance and reliability, and is completely free to use.</strong>
    </p>
    <p>
    <strong>Created by:</strong> @artificialguybr (<a href="https://twitter.com/artificialguybr">Twitter</a>)
    </p>
    <p>
    <strong>Discover more:</strong> <a href="https://artificialguy.com">artificialguy.com</a>
    </p>
    """
)

iface.launch()