Spaces:

Agents-MCP-Hackathon
/

MCP_Server_Web2JSON

Sleeping

abdo-Mansour committed on Jun 10

Commit

44fb3b3

1 Parent(s): da05e38

improved the prompt

Files changed (1) hide show

app.py CHANGED Viewed

@@ -42,7 +42,20 @@ def webpage_to_json(content: str, is_url: bool, schema_name: str) -> Dict[str, A
         return {"error": f"Invalid schema name: {schema_name}. Choose from: {', '.join(SCHEMA_OPTIONS.keys())}"}
     schema = SCHEMA_OPTIONS[schema_name]
-    prompt_template = "extract the following information: {content} based on schema: {schema}"
     # Initialize pipeline components
     preprocessor = BasicPreprocessor(config={'keep_tags': False})

         return {"error": f"Invalid schema name: {schema_name}. Choose from: {', '.join(SCHEMA_OPTIONS.keys())}"}
     schema = SCHEMA_OPTIONS[schema_name]
+    prompt_template = """Extract the following information from the provided content according to the specified schema.
+    Content to analyze:
+    {content}
+    Schema requirements:
+    {schema}
+    Instructions:
+    - Extract only information that is explicitly present in the content
+    - Follow the exact structure and data types specified in the schema
+    - If a required field cannot be found, indicate this clearly
+    - Preserve the original formatting and context where relevant
+    - Return the extracted data in the format specified by the schema"""
     # Initialize pipeline components
     preprocessor = BasicPreprocessor(config={'keep_tags': False})