Trial and error.
Browse files
app.py
CHANGED
@@ -41,7 +41,7 @@ class BasicAgent:
|
|
41 |
messages=[
|
42 |
{
|
43 |
"role": "system",
|
44 |
-
"content": "Answer the following question directly without any explanations, introductions, or conclusions. Provide only the specific answer itself.
|
45 |
},
|
46 |
{
|
47 |
"role": "user",
|
@@ -125,7 +125,7 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
|
|
125 |
answers_payload = []
|
126 |
print(f"Running agent on {len(questions_data)} questions...")
|
127 |
count = 0
|
128 |
-
question_array = [
|
129 |
for item in questions_data:
|
130 |
count += 1
|
131 |
if count not in question_array:
|
@@ -198,7 +198,7 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
|
|
198 |
|
199 |
# --- Build Gradio Interface using Blocks ---
|
200 |
with gr.Blocks() as demo:
|
201 |
-
gr.Markdown("# Basic Agent Evaluation Runner #
|
202 |
gr.Markdown(
|
203 |
"""
|
204 |
**Instructions:**
|
|
|
41 |
messages=[
|
42 |
{
|
43 |
"role": "system",
|
44 |
+
"content": "Answer the following question directly without any explanations, introductions, or conclusions. Provide only the specific answer itself. Always give answer in same language as question."
|
45 |
},
|
46 |
{
|
47 |
"role": "user",
|
|
|
125 |
answers_payload = []
|
126 |
print(f"Running agent on {len(questions_data)} questions...")
|
127 |
count = 0
|
128 |
+
question_array = [1, 3, 5, 6, 7] # Example question array for testing
|
129 |
for item in questions_data:
|
130 |
count += 1
|
131 |
if count not in question_array:
|
|
|
198 |
|
199 |
# --- Build Gradio Interface using Blocks ---
|
200 |
with gr.Blocks() as demo:
|
201 |
+
gr.Markdown("# Basic Agent Evaluation Runner #21")
|
202 |
gr.Markdown(
|
203 |
"""
|
204 |
**Instructions:**
|