Update app.py
app.py CHANGED
@@ -26,7 +26,7 @@ from duckduckgo_search import DDGS
 
 def _http_get(url: str) -> requests.Response:
     """
-
+    Download the page politely with a short timeout and realistic headers.
     """
     headers = {
         "User-Agent": "Mozilla/5.0 (compatible; WebMCP/1.0; +https://example.com)",
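Only the first lines of the body survive the hunk, so the rest of the helper is not visible here. A minimal sketch of how a "polite" fetch along these lines might read; the timeout value and the `raise_for_status()` call are assumptions, not code from this commit:

```python
import requests

def _http_get(url: str) -> requests.Response:
    """Download the page politely with a short timeout and realistic headers."""
    headers = {
        "User-Agent": "Mozilla/5.0 (compatible; WebMCP/1.0; +https://example.com)",
    }
    # Assumed completion: the diff truncates the body after the headers dict.
    resp = requests.get(url, headers=headers, timeout=15)
    resp.raise_for_status()
    return resp
```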
@@ -38,7 +38,7 @@ def _http_get(url: str) -> requests.Response:
 
 def _normalize_whitespace(text: str) -> str:
     """
-
+    Squeeze extra spaces and blank lines to keep things compact.
     """
     text = re.sub(r"[ \t\u00A0]+", " ", text)
     text = re.sub(r"\n\s*\n\s*\n+", "\n\n", text.strip())
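Both substitutions are visible in the context lines, so the new docstring can be checked directly; only the trailing `return text` is assumed in this self-contained copy:

```python
import re

def _normalize_whitespace(text: str) -> str:
    """Squeeze extra spaces and blank lines to keep things compact."""
    text = re.sub(r"[ \t\u00A0]+", " ", text)               # collapse spaces, tabs, NBSP
    text = re.sub(r"\n\s*\n\s*\n+", "\n\n", text.strip())   # 3+ newlines -> one blank line
    return text  # assumed; the hunk ends before the return

assert _normalize_whitespace("a \u00A0 b\n\n\n\nc") == "a b\n\nc"
```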
@@ -47,7 +47,7 @@ def _normalize_whitespace(text: str) -> str:
 
 def _truncate(text: str, max_chars: int) -> Tuple[str, bool]:
     """
-
+    Cut text if it gets too long; return the text and whether we trimmed.
     """
    if max_chars is None or max_chars <= 0 or len(text) <= max_chars:
         return text, False
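The guard and its early return are in the hunk, but the actual trim is cut off. An assumed completion consistent with the docstring:

```python
from typing import Tuple

def _truncate(text: str, max_chars: int) -> Tuple[str, bool]:
    """Cut text if it gets too long; return the text and whether we trimmed."""
    if max_chars is None or max_chars <= 0 or len(text) <= max_chars:
        return text, False
    # Assumed completion: cut at the limit and drop a dangling partial word.
    return text[:max_chars].rsplit(" ", 1)[0].rstrip(), True
```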
@@ -56,7 +56,7 @@ def _truncate(text: str, max_chars: int) -> Tuple[str, bool]:
 
 def _shorten(text: str, limit: int) -> str:
     """
-
+    Hard cap a string with an ellipsis to keep tokens small.
     """
     if limit <= 0 or len(text) <= limit:
         return text
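Same pattern as `_truncate`, with the cut again elided by the hunk; the ellipsis handling below is an assumed completion matching the docstring:

```python
def _shorten(text: str, limit: int) -> str:
    """Hard cap a string with an ellipsis to keep tokens small."""
    if limit <= 0 or len(text) <= limit:
        return text
    # Assumed completion: leave room for the ellipsis character itself.
    return text[: max(0, limit - 1)].rstrip() + "…"
```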
@@ -65,7 +65,7 @@ def _shorten(text: str, limit: int) -> str:
 
 def _domain_of(url: str) -> str:
     """
-
+    Show a friendly site name like "example.com".
     """
     try:
         return urlparse(url).netloc or ""
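For reference, the `urlparse` behavior the helper leans on, including why the `or ""` fallback matters:

```python
from urllib.parse import urlparse

print(urlparse("https://example.com/article?id=1").netloc)  # example.com
print(urlparse("not a url").netloc or "")                   # "" (netloc is empty, fallback kicks in)
```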
@@ -85,7 +85,7 @@ def _og(soup: BeautifulSoup, prop: str) -> str | None:
 
 def _extract_metadata(soup: BeautifulSoup, final_url: str) -> Dict[str, str]:
     """
-
+    Pull the useful bits: title, description, site name, canonical URL, language, etc.
     """
     meta: Dict[str, str] = {}
 
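The body after `meta: Dict[str, str] = {}` is hidden, so the following is a hypothetical sketch of a metadata extractor matching the docstring; the exact tags the real code reads (and how it uses the `_og` helper visible in the hunk header) may differ:

```python
from typing import Dict
from bs4 import BeautifulSoup

def _extract_metadata(soup: BeautifulSoup, final_url: str) -> Dict[str, str]:
    """Pull the useful bits: title, description, site name, canonical URL, language, etc."""
    meta: Dict[str, str] = {}
    # Assumed body: plain-tag fallbacks; the real code likely prefers OpenGraph via _og().
    if soup.title and soup.title.string:
        meta["title"] = soup.title.string.strip()
    desc = soup.find("meta", attrs={"name": "description"})
    if desc and desc.get("content"):
        meta["description"] = desc["content"].strip()
    canonical = soup.find("link", rel="canonical")
    if canonical and canonical.get("href"):
        meta["canonical"] = canonical["href"]
    html_tag = soup.find("html")
    if html_tag and html_tag.get("lang"):
        meta["language"] = html_tag["lang"]
    meta["url"] = final_url
    return meta
```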
@@ -123,7 +123,7 @@ def _extract_metadata(soup: BeautifulSoup, final_url: str) -> Dict[str, str]:
 
 def _extract_main_text(html: str) -> Tuple[str, BeautifulSoup]:
     """
-
+    Use Readability to isolate the main article and turn it into clean text.
     Returns (clean_text, soup_of_readable_html).
     """
     # Simplified article HTML from Readability
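The context comment names Readability, which suggests the `readability-lxml` package. A sketch of the likely shape, assuming `Document(html).summary()` produces the simplified article HTML:

```python
from typing import Tuple
from bs4 import BeautifulSoup
from readability import Document  # readability-lxml

def _extract_main_text(html: str) -> Tuple[str, BeautifulSoup]:
    """Use Readability to isolate the main article and turn it into clean text."""
    doc = Document(html)
    readable_html = doc.summary(html_partial=True)  # simplified article HTML from Readability
    readable_soup = BeautifulSoup(readable_html, "lxml")
    # _normalize_whitespace is the helper defined earlier in app.py.
    text = _normalize_whitespace(readable_soup.get_text("\n"))
    return text, readable_soup
```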
@@ -151,7 +151,7 @@ def _extract_main_text(html: str) -> Tuple[str, BeautifulSoup]:
 
 def _extract_links(readable_soup: BeautifulSoup, base_url: str, max_links: int) -> List[Tuple[str, str]]:
     """
-
+    Collect clean, unique, absolute links from the readable section only.
     """
     seen = set()
     links: List[Tuple[str, str]] = []
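`seen` and `links` are initialized in the hunk; the loop itself is cut off. An assumed completion honoring the docstring's "clean, unique, absolute" contract:

```python
from typing import List, Tuple
from urllib.parse import urljoin
from bs4 import BeautifulSoup

def _extract_links(readable_soup: BeautifulSoup, base_url: str, max_links: int) -> List[Tuple[str, str]]:
    """Collect clean, unique, absolute links from the readable section only."""
    seen = set()
    links: List[Tuple[str, str]] = []
    # Assumed loop: absolutize against base_url, dedupe, stop at the cap.
    for a in readable_soup.find_all("a", href=True):
        if len(links) >= max_links:
            break
        href = urljoin(base_url, a["href"])
        if href.startswith(("http://", "https://")) and href not in seen:
            seen.add(href)
            # Tuple order (text, url) is a guess; the diff never shows a consumer.
            links.append((a.get_text(strip=True) or href, href))
    return links
```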
@@ -193,7 +193,7 @@ def _format_markdown(
     verbosity: str,
 ) -> str:
     """
-
+    Assemble a compact Markdown summary with optional sections.
     """
     lines: List[str] = []
 
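Only the signature tail and the `lines` accumulator are visible, so this is a deliberately simplified, hypothetical sketch of the assembly; the real function clearly takes more parameters than shown here:

```python
from typing import Dict, List

def _format_markdown_sketch(meta: Dict[str, str], body: str, verbosity: str) -> str:
    # Hypothetical reduction of _format_markdown to its accumulate-and-join shape.
    lines: List[str] = []
    lines.append(f"# {meta.get('title', 'Untitled')}")
    if verbosity != "Brief" and meta.get("description"):
        lines.append(f"> {meta['description']}")
    lines.append(body)
    return "\n\n".join(lines)
```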
@@ -412,7 +412,7 @@ def Search_Concise(  # <-- MCP tool #4 (Concise DDG)
 
 # --- Fetch tab (compact controllable extraction) ---
 fetch_interface = gr.Interface(
-    fn=Fetch_Webpage, #
+    fn=Fetch_Webpage, # connect the function to the UI
     inputs=[
         gr.Textbox(label="URL", placeholder="https://example.com/article"),
         gr.Dropdown(label="Verbosity", choices=["Brief", "Standard", "Full"], value="Standard"),
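For readers unfamiliar with Gradio: `fn=` is what the new comment refers to, binding a plain Python function to the declared input components. A stripped-down, runnable version of the pattern; the output component and the simplified signature are assumptions, since the hunk ends before them:

```python
import gradio as gr

def Fetch_Webpage(url: str, verbosity: str) -> str:  # simplified stand-in signature
    return f"Would fetch {url} at {verbosity!r} verbosity."

fetch_interface = gr.Interface(
    fn=Fetch_Webpage,  # connect the function to the UI
    inputs=[
        gr.Textbox(label="URL", placeholder="https://example.com/article"),
        gr.Dropdown(label="Verbosity", choices=["Brief", "Standard", "Full"], value="Standard"),
    ],
    outputs=gr.Markdown(),  # assumed output component
)
```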
@@ -431,7 +431,7 @@ fetch_interface = gr.Interface(
 
 # --- Websearch tab (structured DDG via LangChain) ---
 websearch_interface = gr.Interface(
-    fn=Search_Structured, #
+    fn=Search_Structured, # connect the function to the UI
     inputs=[
         gr.Textbox(value="", label="Search query", placeholder="site:example.com interesting topic"),
         gr.Slider(minimum=1, maximum=20, value=5, step=1, label="Max results"),
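Given the `# <-- MCP tool` markers elsewhere in the diff, the per-tab interfaces are presumably combined and served as MCP tools. A sketch of that assumed wiring, using Gradio's real `TabbedInterface` and `mcp_server` flag; the tab names and the final launch call are guesses about code outside these hunks:

```python
import gradio as gr

# Assumed app assembly: each gr.Interface becomes one tab, and
# mcp_server=True exposes each fn as an MCP tool.
demo = gr.TabbedInterface(
    [fetch_interface, websearch_interface],
    ["Fetch", "Websearch"],
)

if __name__ == "__main__":
    demo.launch(mcp_server=True)
```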