Final_Assignment_Template_smiquensi3

Paused

App Files Files Community

smiquensi committed on Jun 30

Commit

41ba21f

verified ·

1 Parent(s): 0305bdf

sdfa

Browse files

Files changed (1) hide show

app.py +31 -24

app.py CHANGED Viewed

@@ -1,53 +1,57 @@
 # app.py
 import os
 import gradio as gr
 import requests
 import pandas as pd
 from agent import make_agent
-API = "https://agents-course-unit4-scoring.hf.space"
 # Pre-commit version of the Gradio click handler (lines marked "-" were
 # replaced by this commit). It fetches the question list, runs the agent on
 # each question, posts all answers, and returns (status text, DataFrame of
 # the per-question log). Returns (login prompt, None) when `profile` is falsy.
 # NOTE(review): the "@@ -55,13 +59,16 @@" hunk header inside `status = (`
 # marks a line the diff view does not show (old line 54), so the status
 # string below may be incomplete.
 def run_and_submit_all(profile: gr.OAuthProfile | None):
-    # 1) Login check
     if not profile:
-        return "🔒 Por favor inicia sesión.", None
-    user = profile.username
     space_id = os.getenv("SPACE_ID", "")
-    # 2) Instantiate the agent
     agent = make_agent()
-    # 3) Download the questions
-    resp = requests.get(f"{API}/questions", timeout=20)
     resp.raise_for_status()
-    qs = resp.json()
     answers, log = [], []
-    for q in qs:
-        tid, txt = q["task_id"], q["question"]
-        # Build a prompt that forces only the final answer
         prompt = (
             "Responde SÓLO con la respuesta final, sin explicaciones.\n"
-            f"{txt}\n"
             "Respuesta:"
         )
         raw = agent.run(prompt)
-        # Extract the last non-empty line
-        ans = next((line for line in raw.splitlines()[::-1] if line.strip()), raw).strip()
         answers.append({"task_id": tid, "submitted_answer": ans})
-        log.append({"Task ID": tid, "Question": txt, "Answer": ans})
-    # 4) Submit
     payload = {
-        "username": user,
         "agent_code": f"https://huggingface.co/spaces/{space_id}/tree/main",
         "answers": answers,
     }
-    sub = requests.post(f"{API}/submit", json=payload, timeout=60)
     sub.raise_for_status()
     result = sub.json()
     status = (
-        f"✅ ¡Éxito!\n"
         f"User: {result['username']}\n"
         f"Score: {result['score']}% "
         f"({result.get('correct_count')}/{result.get('total_attempted')})\n"
@@ -55,13 +59,16 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
     )
     return status, pd.DataFrame(log)
 # Pre-commit Gradio UI: a title, a login button, and a button whose click
 # runs run_and_submit_all and writes its two return values to the textbox
 # and the table.
 with gr.Blocks() as demo:
-    gr.Markdown("# GAIA Final Agent Mini")
     gr.LoginButton()
-    btn = gr.Button("Run & Submit")
-    out = gr.Textbox(label="Resultado", lines=6)
-    tbl = gr.DataFrame(label="Q & A", wrap=True)
-    btn.click(fn=run_and_submit_all, outputs=[out, tbl])
 # Launch the app only when this file is run as a script.
 if __name__ == "__main__":
     demo.launch(debug=True)

 # app.py
 import os
 import gradio as gr
 import requests
 import pandas as pd
 from agent import make_agent
+API_URL = "https://agents-course-unit4-scoring.hf.space"
 # Gradio click handler (post-commit version; lines marked "+" were added by
 # this commit). It fetches the question list from API_URL, runs the agent on
 # each question, posts all answers to the scoring endpoint, and returns
 # (status text, DataFrame of the per-question log).
 # Returns (login prompt, None) when `profile` is falsy.
 # NOTE(review): both raise_for_status() calls and agent.run() are uncaught, so
 # an HTTP error or a single agent failure presumably aborts the whole run
 # instead of producing a status message — confirm this is intended.
 def run_and_submit_all(profile: gr.OAuthProfile | None):
+    # 0) Check login
     if not profile:
+        return "🔒 Por favor, haz login con Hugging Face.", None
+    username = profile.username
     # Falls back to "" when SPACE_ID is unset, which leaves the agent_code
     # URL in the payload below without a repository path.
     space_id = os.getenv("SPACE_ID", "")
+    # 1) Instantiate the agent
     agent = make_agent()
+    # 2) Download the GAIA questions (the original comment says there are 20)
+    resp = requests.get(f"{API_URL}/questions", timeout=20)
     resp.raise_for_status()
+    questions = resp.json()
+    # 3) For each question: build the prompt, run the agent, extract the last line
     answers, log = [], []
+    for q in questions:
+        tid, text = q["task_id"], q["question"]
         prompt = (
             "Responde SÓLO con la respuesta final, sin explicaciones.\n"
+            f"{text}\n"
             "Respuesta:"
         )
         raw = agent.run(prompt)
+        # Take the last non-empty line
         # When every line is blank, the whole output is used instead; the
         # result is stripped either way.
         # NOTE(review): assumes agent.run returns a str — confirm.
+        ans = next((l for l in raw.splitlines()[::-1] if l.strip()), raw).strip()
         answers.append({"task_id": tid, "submitted_answer": ans})
+        log.append({"Task ID": tid, "Question": text, "Answer": ans})
+    # 4) Send the payload
     payload = {
+        "username": username,
         "agent_code": f"https://huggingface.co/spaces/{space_id}/tree/main",
         "answers": answers,
     }
+    sub = requests.post(f"{API_URL}/submit", json=payload, timeout=60)
     sub.raise_for_status()
     result = sub.json()
+    # 5) Show the result and the table
     # 'username' and 'score' are indexed directly (KeyError if absent), while
     # the two counts use .get() and render as "None" when missing.
     status = (
+        f"✅ Submission Successful!\n"
         f"User: {result['username']}\n"
         f"Score: {result['score']}% "
         f"({result.get('correct_count')}/{result.get('total_attempted')})\n"
     )
     return status, pd.DataFrame(log)
+# --- Gradio interface ---
 # Layout: title, short instructions, login button, run button, a read-only
 # status textbox and a results table. The click handler's two return values
 # are written to `status` and `table` in that order.
 with gr.Blocks() as demo:
+    gr.Markdown("# 🧠 GAIA Final Agent Mini")
+    gr.Markdown("Haz login y pulsa el botón para evaluar tu agente en GAIA.")
     gr.LoginButton()
+    run_btn = gr.Button("Run Evaluation & Submit All Answers")
+    status = gr.Textbox(label="Resultado", lines=6, interactive=False)
+    table  = gr.Dataframe(label="Preguntas y Respuestas", wrap=True)
     # No `inputs` are passed to click().
     # NOTE(review): presumably Gradio injects the OAuth profile from the
     # handler's `gr.OAuthProfile | None` annotation — confirm.
+    run_btn.click(fn=run_and_submit_all, outputs=[status, table])
 # Launch the app only when this file is run as a script.
 if __name__ == "__main__":
     demo.launch(debug=True)