Spaces:

Agents-MCP-Hackathon
/

MCP_Server_Web2JSON

Running

abdo-Mansour committed on Jun 10

Commit

0e70948

1 Parent(s): 2856ca3

updated the input

Files changed (1) hide show

app.py CHANGED Viewed

@@ -141,6 +141,20 @@ def webpage_to_json_wrapper(content: str, is_url: bool, schema_input: str) -> Di
         return {"error": f"Schema parsing error: {str(e)}"}
 def webpage_to_json(content: str, is_url: bool, schema: BaseModel) -> Dict[str, Any]:
     prompt_template = """Extract the following information from the provided content according to the specified schema.
     Content to analyze:

         return {"error": f"Schema parsing error: {str(e)}"}
 def webpage_to_json(content: str, is_url: bool, schema: BaseModel) -> Dict[str, Any]:
+    """
+    Extracts structured JSON information from a given content based on a specified schema.
+    This function sets up a processing pipeline that includes:
+    - Preprocessing the input content.
+    - Utilizing an AI language model to extract information according to the provided schema.
+    - Postprocessing the extracted output to match the exact schema requirements.
+    Parameters:
+        content (str): The input content to be analyzed. This can be either raw text or a URL.
+        is_url (bool): A flag indicating whether the provided content is a URL (True) or raw text (False).
+        schema (BaseModel): A Pydantic BaseModel defining the expected structure and data types for the output.
+    Returns:
+        Dict[str, Any]: A dictionary containing the extracted data matching the schema. In case of errors during initialization
+                        or processing, the dictionary will include an "error" key with a descriptive message.
+    """
     prompt_template = """Extract the following information from the provided content according to the specified schema.
     Content to analyze: