Update README and app.py: change the title to 'Web Search MCP', raise the rate limit to 360 requests/hour, and improve logging for rate limiting and content extraction.
README.md CHANGED

@@ -1,5 +1,5 @@
 ---
-title:
+title: Web Search MCP
 emoji: π
 colorFrom: red
 colorTo: green
@@ -7,6 +7,7 @@ sdk: gradio
 sdk_version: 5.36.2
 app_file: app.py
 pinned: false
+short_description: Search and extract web content for LLM ingestion
 ---

 # Web Search MCP Server
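For reference, the complete Spaces front matter produced by the two hunks above, assembled directly from the diff (the emoji character is reproduced exactly as rendered above):

```yaml
---
title: Web Search MCP
emoji: π
colorFrom: red
colorTo: green
sdk: gradio
sdk_version: 5.36.2
app_file: app.py
pinned: false
short_description: Search and extract web content for LLM ingestion
---
```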
app.py CHANGED

@@ -37,7 +37,7 @@ HEADERS = {"X-API-KEY": SERPER_API_KEY, "Content-Type": "application/json"}
 # Rate limiting
 storage = MemoryStorage()
 limiter = MovingWindowRateLimiter(storage)
-rate_limit = parse("
+rate_limit = parse("360/hour")


 async def search_web(
@@ -97,8 +97,8 @@ async def search_web(
     try:
         # Check rate limit
         if not await limiter.hit(rate_limit, "global"):
-            print(f"
-            return "Error: Rate limit exceeded. Please try again later (limit:
+            print(f"[{datetime.now().isoformat()}] Rate limit exceeded")
+            return "Error: Rate limit exceeded. Please try again later (limit: 500 requests per hour)."

         # Select endpoint based on search type
         endpoint = (
@@ -149,6 +149,9 @@ async def search_web(
                 continue

             successful_extractions += 1
+            print(
+                f"[{datetime.now().isoformat()}] Successfully extracted content from {meta['link']}"
+            )

             # Format the chunk based on search type
             if search_type == "news":
@@ -190,6 +193,9 @@ async def search_web(
         result = "\n---\n".join(chunks)
         summary = f"Successfully extracted content from {successful_extractions} out of {len(results)} {search_type} results for query: '{query}'\n\n---\n\n"

+        print(
+            f"[{datetime.now().isoformat()}] Extraction complete: {successful_extractions}/{len(results)} successful for query '{query}'"
+        )
         return summary + result

     except Exception as e:
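The first two hunks swap in a 360-requests-per-hour moving window, though note the user-facing error string still reports a 500-per-hour limit. Below is a minimal, self-contained sketch of the limiter pattern, assuming the async flavor of the `limits` library (`limits.aio`), which is consistent with the `await limiter.hit(...)` call in app.py:

```python
import asyncio

from limits import parse
from limits.aio.storage import MemoryStorage
from limits.aio.strategies import MovingWindowRateLimiter

# Mirrors the module-level setup in the diff: one in-memory
# moving-window limiter shared by all callers under the key "global".
storage = MemoryStorage()
limiter = MovingWindowRateLimiter(storage)
rate_limit = parse("360/hour")

async def main() -> None:
    # hit() records one request against the window and returns False
    # once 360 hits already fall within the trailing hour.
    for i in range(3):
        allowed = await limiter.hit(rate_limit, "global")
        print(f"request {i}: {'allowed' if allowed else 'rate limited'}")

asyncio.run(main())
```

A moving window frees capacity continuously as old hits age past the hour boundary, rather than resetting all at once the way a fixed window does.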
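All three new log statements share one format: an ISO-8601 timestamp in brackets, then the event. A tiny sketch of the pattern; `log_event` is a hypothetical helper for illustration, not something the Space defines:

```python
from datetime import datetime

def log_event(message: str) -> None:
    # Same shape as the print() calls added in the diff, e.g.
    # "[2025-01-01T12:00:00.000000] Rate limit exceeded"
    print(f"[{datetime.now().isoformat()}] {message}")

log_event("Rate limit exceeded")
log_event("Extraction complete: 3/5 successful for query 'example'")
```

Plain print() keeps the Space's container logs simple; the standard logging module with a Formatter is the usual alternative once log levels or destinations matter.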