Final_Assignment_Template_smiquensi3

Paused

App Files Community

smiquensi committed on Jun 30

Commit

54e22ca

verified ·

1 Parent(s): b20fcf6

dsfa

Browse files

Files changed (1) hide show

app.py +29 -41

app.py CHANGED Viewed

@@ -7,52 +7,50 @@ from smolagents import CodeAgent
 from smolagents.models import InferenceClientModel
 from smolagents.tools import (
     DuckDuckGoSearchTool,
-    PythonREPLTool,
     RequestsTool,
 )
-# (Keep Constants as is)
-# --- Constants ---
 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
 # --- Basic Agent Definition ---
-# ----- THIS IS WHERE YOU CAN BUILD WHAT YOU WANT ------
 class BasicAgent:
     def __init__(self):
-        # Cargamos el modelo
         model = InferenceClientModel(model_id="google/flan-t5-large")
-        # Usamos búsqueda, requests y REPL para todo tipo de tareas
         tools = [
-            DuckDuckGoSearchTool(),
-            RequestsTool(),        # para descargar attachments
-            PythonREPLTool(),      # para procesar tablas Excel, etc.
         ]
-        # IMPORTANT: add_base_tools=True mete más utilidades por defecto
         self.agent = CodeAgent(
             model=model,
             tools=tools,
             add_base_tools=True,
             max_steps=10,
         )
-        print("✅ CodeAgent initialized with full toolset.")
     def __call__(self, question: str) -> str:
-        # Forzamos solo la respuesta final
         prompt = (
-            "Eres un asistente que SOLO devuelve la respuesta final, "
-            "sin explicaciones ni formato extra.\n"
             f"Pregunta: {question}\n"
             "Respuesta:"
         )
         raw = self.agent.run(prompt)
-        # Extraemos la última línea no vacía
         for line in raw.strip().splitlines()[::-1]:
             if line.strip():
                 return line.strip()
         return raw.strip()
 def run_and_submit_all(profile: gr.OAuthProfile | None):
-    space_id = os.getenv("SPACE_ID","")
     if not profile:
         return "🔒 Por favor, inicia sesión con Hugging Face.", None
     username = profile.username
@@ -60,13 +58,12 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
     # 1) Instanciar agente
     agent = BasicAgent()
-    # 2) Obtener preguntas
-    questions_url = f"{DEFAULT_API_URL}/questions"
-    resp = requests.get(questions_url, timeout=20)
     resp.raise_for_status()
     questions = resp.json()
-    # 3) Ejecutar en bucle
     answers, log = [], []
     for q in questions:
         tid, txt = q["task_id"], q["question"]
@@ -74,16 +71,16 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
         answers.append({"task_id": tid, "submitted_answer": ans})
         log.append({"Task ID": tid, "Question": txt, "Submitted Answer": ans})
-    # 4) Enviar
     payload = {
         "username": username,
         "agent_code": f"https://huggingface.co/spaces/{space_id}/tree/main",
-        "answers": answers
     }
-    submit_url = f"{DEFAULT_API_URL}/submit"
-    resp2 = requests.post(submit_url, json=payload, timeout=60)
-    resp2.raise_for_status()
-    result = resp2.json()
     status = (
         f"✅ Submission Successful!\n"
         f"User: {result['username']}\n"
@@ -93,24 +90,15 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
     )
     return status, pd.DataFrame(log)
-# --- Build Gradio Interface using Blocks ---
 with gr.Blocks() as demo:
-    gr.Markdown("# Basic Agent Evaluation Runner")
-    gr.Markdown(
-        """
-        **Instructions:**
-        1. Clone this space, modifica solo la clase `BasicAgent`.
-        2. Haz login con Hugging Face.
-        3. Click ‘Run Evaluation & Submit All Answers’.
-        """
-    )
     gr.LoginButton()
     run_btn = gr.Button("Run Evaluation & Submit All Answers")
-    out = gr.Textbox(label="Run Status / Submission Result", lines=6)
-    table = gr.DataFrame(label="Questions and Agent Answers")
-    run_btn.click(fn=run_and_submit_all, outputs=[out, table])
 if __name__ == "__main__":
     demo.launch(debug=True)

 from smolagents.models import InferenceClientModel
 from smolagents.tools import (
     DuckDuckGoSearchTool,
     RequestsTool,
+    PythonREPLTool,
 )
+# --- Constants (no toques) ---
 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
 # --- Basic Agent Definition ---
 class BasicAgent:
     def __init__(self):
         model = InferenceClientModel(model_id="google/flan-t5-large")
         tools = [
+            DuckDuckGoSearchTool(),   # buscar texto en web
+            RequestsTool(),           # descargar archivos adjuntos
+            PythonREPLTool(),         # procesar Excel, cálculos, imágenes…
         ]
+        # add_base_tools=True inyecta más utilidades (filesystem, JSON, etc.)
         self.agent = CodeAgent(
             model=model,
             tools=tools,
             add_base_tools=True,
             max_steps=10,
         )
+        print("✅ CodeAgent con todas las herramientas listo.")
     def __call__(self, question: str) -> str:
+        # Prompt que obliga a devolver solo la respuesta pura
         prompt = (
+            "Eres un asistente que SOLO debe devolver la respuesta final, "
+            "sin explicaciones, listas ni texto adicional.\n"
             f"Pregunta: {question}\n"
             "Respuesta:"
         )
         raw = self.agent.run(prompt)
+        print("RAW OUTPUT:", raw)  # ayuda a depurar si algo falla
+        # Extraer únicamente la última línea no vacía
         for line in raw.strip().splitlines()[::-1]:
             if line.strip():
                 return line.strip()
         return raw.strip()
 def run_and_submit_all(profile: gr.OAuthProfile | None):
+    space_id = os.getenv("SPACE_ID", "")
     if not profile:
         return "🔒 Por favor, inicia sesión con Hugging Face.", None
     username = profile.username
     # 1) Instanciar agente
     agent = BasicAgent()
+    # 2) Descargar preguntas
+    resp = requests.get(f"{DEFAULT_API_URL}/questions", timeout=20)
     resp.raise_for_status()
     questions = resp.json()
+    # 3) Ejecutar agente en cada pregunta
     answers, log = [], []
     for q in questions:
         tid, txt = q["task_id"], q["question"]
         answers.append({"task_id": tid, "submitted_answer": ans})
         log.append({"Task ID": tid, "Question": txt, "Submitted Answer": ans})
+    # 4) Enviar resultados
     payload = {
         "username": username,
         "agent_code": f"https://huggingface.co/spaces/{space_id}/tree/main",
+        "answers": answers,
     }
+    submit_resp = requests.post(f"{DEFAULT_API_URL}/submit", json=payload, timeout=60)
+    submit_resp.raise_for_status()
+    result = submit_resp.json()
     status = (
         f"✅ Submission Successful!\n"
         f"User: {result['username']}\n"
     )
     return status, pd.DataFrame(log)
+# --- Gradio UI ---
 with gr.Blocks() as demo:
+    gr.Markdown("# 🧠 GAIA Final Agent Runner")
+    gr.Markdown("Haz login y pulsa el botón para evaluar tu agente en el benchmark GAIA.")
     gr.LoginButton()
     run_btn = gr.Button("Run Evaluation & Submit All Answers")
+    status = gr.Textbox(label="Run Status / Submission Result", lines=6)
+    table = gr.Dataframe(label="Questions and Agent Answers", wrap=True)
+    run_btn.click(fn=run_and_submit_all, outputs=[status, table])
 if __name__ == "__main__":
     demo.launch(debug=True)