Spaces:

Nymbo
/

Tools

Running

App Files Community

Nymbo committed on Oct 11

Commit

cbe0212

verified ·

1 Parent(s): 4b97eaa

Update Modules/Web_Fetch.py

Browse files

Files changed (1) hide show

Modules/Web_Fetch.py +9 -16

Modules/Web_Fetch.py CHANGED Viewed

@@ -14,6 +14,13 @@ from app import _fetch_rate_limiter, _log_call_end, _log_call_start, _truncate_f
 from ._docstrings import autodoc
 def _http_get_enhanced(url: str, timeout: int | float = 30, *, skip_rate_limit: bool = False) -> requests.Response:
     headers = {
         "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36",
@@ -167,12 +174,7 @@ def _truncate_markdown(markdown: str, max_chars: int) -> Tuple[str, Dict[str, ob
     return truncated + truncation_notice, metadata
-@autodoc(
-    summary=(
-        "Fetch a webpage and return clean Markdown or a list of links, with max length and pagination via offset."
-    ),
-    returns="Markdown content (or links) possibly with a truncation notice when max_chars is exceeded.",
-)
 def Web_Fetch(
     url: Annotated[str, "The absolute URL to fetch (must return HTML)."],
     max_chars: Annotated[int, "Maximum characters to return (0 = no limit, full page content)."] = 3000,
@@ -265,16 +267,7 @@ def build_interface() -> gr.Interface:
             "<div style=\"text-align:center\">Convert any webpage to clean Markdown format with precision controls, "
             "or extract all links. Supports custom element removal, length limits, and pagination with offset.</div>"
         ),
-        api_description=(
-            "Fetch a web page and return it converted to Markdown format or extract links with configurable options. "
-            "Includes enhanced truncation with detailed metadata and pagination support via offset parameter. "
-            "Parameters: url (str - absolute URL), max_chars (int - 0=no limit, default 3000), "
-            "strip_selectors (str - CSS selectors to remove, comma-separated), "
-            "url_scraper (bool - extract only links instead of content, default False), "
-            "offset (int - character offset for pagination, use next_cursor from previous call). "
-            "When content is truncated, returns detailed metadata including truncated status, character counts, "
-            "and next_cursor for continuation. When url_scraper=True, returns formatted list of all links found on the page."
-        ),
         flagging_mode="never",
     )

 from ._docstrings import autodoc
+# Single source of truth for the LLM-facing tool description
+TOOL_SUMMARY = (
+    "Fetch a webpage and return clean Markdown or a list of links, with max length and pagination via offset; "
+    "if truncated, the output includes a notice with next_cursor for exact continuation."
+)
 def _http_get_enhanced(url: str, timeout: int | float = 30, *, skip_rate_limit: bool = False) -> requests.Response:
     headers = {
         "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36",
     return truncated + truncation_notice, metadata
+@autodoc(summary=TOOL_SUMMARY)
 def Web_Fetch(
     url: Annotated[str, "The absolute URL to fetch (must return HTML)."],
     max_chars: Annotated[int, "Maximum characters to return (0 = no limit, full page content)."] = 3000,
             "<div style=\"text-align:center\">Convert any webpage to clean Markdown format with precision controls, "
             "or extract all links. Supports custom element removal, length limits, and pagination with offset.</div>"
         ),
+        api_description=TOOL_SUMMARY,
         flagging_mode="never",
     )