Spaces:

Makkoen
/

mcp-qiskit-learn

Sleeping

App Files Files Community

Ludek Matyska committed on Jun 8

Commit

044a142

1 Parent(s): 0a9b724

feat: add error messages

Browse files

Files changed (1) hide show

theory_tools.py +112 -75

theory_tools.py CHANGED Viewed

@@ -2,48 +2,76 @@ import re
 import requests
 import nbformat
-RAW_BASE = "https://raw.githubusercontent.com/Qiskit/textbook/main/notebooks/intro/"
-README_URL = RAW_BASE + "README.md"
-FALLBACK = [
-    "what-is-quantum.ipynb",
-    "entangled-states.ipynb",
-    "superdense-coding.ipynb",
-    "teleportation.ipynb",
-]
-# ────────────────────────────────────────────────────────────────────
-# Internal helpers
-# ────────────────────────────────────────────────────────────────────
-def _discover_notebooks() -> list[str]:
-    """Scrape notebooks/intro/README.md for *.ipynb links; fallback if offline."""
     try:
-        md = requests.get(README_URL, timeout=10).text
-        found = re.findall(r"\(([^)]+?\.ipynb)\)", md)
-        if found:
-            return found
     except requests.RequestException:
-        pass
-    return FALLBACK
-def _pretty(name: str) -> str:
-    """'superdense-coding.ipynb' ➜ 'Superdense Coding'."""
-    return name.replace("-", " ").replace(".ipynb", "").title()
-# ────────────────────────────────────────────────────────────────────
-# Public API
-# ────────────────────────────────────────────────────────────────────
-def get_theory_topics() -> dict[str, str]:
-    """
-    Return a mapping of *friendly topic name* → *notebook filename*.
-    Example
-    -------
-    {'What Is Quantum?': 'what-is-quantum.ipynb', ...}
     """
-    return {_pretty(f): f for f in _discover_notebooks()}
 def get_theory(
@@ -51,59 +79,68 @@ def get_theory(
     markdown_only: bool = True,
     include_headers: bool = True,
 ) -> str:
-    """
-    Download **one** intro notebook and return its content as text.
-    Parameters
-    ----------
-    topic
-        Accepts pretty title (“Teleportation”), slug (“teleportation”)
-        or exact filename (“teleportation.ipynb”).
-    markdown_only
-        True (default) ➜ keep only Markdown cells;
-        False          ➜ include code cells fenced as ```python.
-    include_headers
-        Prepend an H1 title for readability.
-    Raises
-    ------
-    ValueError
-        If *topic* cannot be resolved.
-    Returns
-    -------
-    str
-        Concatenated notebook text.
     """
     topics = get_theory_topics()
-    # Build a lenient lookup table
     lookup: dict[str, str] = {}
-    for pretty, fname in topics.items():
-        slug = fname.removesuffix(".ipynb")
-        lookup[pretty.lower()] = fname
-        lookup[slug.lower()]   = fname
-        lookup[fname.lower()]  = fname
     key = topic.lower()
     if key not in lookup:
-        raise ValueError(
-            f"Unknown topic '{topic}'. "
-            f"Known: {', '.join(topics.keys())}."
-        )
-    fname = lookup[key]
-    raw_json = requests.get(RAW_BASE + fname, timeout=20).text
-    nb = nbformat.reads(raw_json, as_version=4)
-    parts: list[str] = []
     if include_headers:
-        parts.append(f"# {_pretty(fname)}\n")
     for cell in nb.cells:
         if cell.cell_type == "markdown":
-            parts.append(cell.source)
         elif cell.cell_type == "code" and not markdown_only:
-            parts.append(f"```python\n{cell.source}\n```")
-    return "\n\n".join(parts)

 import requests
 import nbformat
+RAW_ROOT = "https://raw.githubusercontent.com/Qiskit/textbook/main/notebooks/"
+# README locations we now support
+_SECTIONS: dict[str, str] = {
+    "intro":        "intro/README.md",
+    "ch-states":    "ch-states/README.md",
+    "ch-gates":     "ch-gates/README.md",
+    "ch-algorithms":"ch-algorithms/README.md",
+}
+# ───────────────────────────────────────────────────────────────────
+# internals
+# ───────────────────────────────────────────────────────────────────
+def _scrape_readme(rel_path: str) -> list[str]:
+    """Return *.ipynb files mentioned in a README; empty list on failure."""
     try:
+        md = requests.get(f"{RAW_ROOT}{rel_path}", timeout=10).text
+        # markdown link target: (...filename.ipynb)
+        return re.findall(r"\(([^)]+?\.ipynb)\)", md)
     except requests.RequestException:
+        return []
+def _discover_files() -> list[str]:
+    """Aggregate notebooks from all configured READMEs (no fallback)."""
+    files: list[str] = []
+    for dir_key, readme in _SECTIONS.items():
+        found = _scrape_readme(readme)
+        # Prepend the directory path if the README gives bare filenames
+        prefixed = [
+            name if "/" in name else f"{dir_key}/{name}" for name in found
+        ]
+        files.extend(prefixed)
+    return files
+def _pretty(path: str) -> str:
+    """'ch-states/bloch_sphere.ipynb' → 'Bloch Sphere'."""
+    fname = path.rsplit("/", 1)[-1]
+    return fname.replace("-", " ").replace(".ipynb", "").title()
+# ───────────────────────────────────────────────────────────────────
+# public tools
+# ───────────────────────────────────────────────────────────────────
+def get_theory_topics() -> dict[str, str]:
+    """Return a mapping of friendly topic names to notebook file paths.
+    Discovers available Jupyter notebooks from the Qiskit textbook across all
+    four main chapters (intro, ch-states, ch-gates, ch-algorithms) by scraping
+    their respective README files.
+    Returns:
+        dict[str, str]: A dictionary mapping human-readable topic names to their
+            corresponding notebook file paths. For example:
+            {'What Is Quantum': 'intro/what-is-quantum.ipynb',
+            'Bloch Sphere': 'ch-states/bloch_sphere.ipynb'}
+            Returns an empty dictionary if network requests fail.
+    Note:
+        If network requests fail, returns an empty dictionary instead of
+        falling back to hardcoded content.
     """
+    try:
+        discovered_files = _discover_files()
+        if not discovered_files:
+            return {}
+        return {_pretty(p): p for p in discovered_files}
+    except Exception:
+        return {}
 def get_theory(
     markdown_only: bool = True,
     include_headers: bool = True,
 ) -> str:
+    """Download and parse a Qiskit textbook notebook, returning its content as text.
+    Accepts flexible topic identification: pretty names ("Teleportation"),
+    slugs ("teleportation"), or full paths ("intro/teleportation.ipynb").
+    Downloads the notebook from GitHub and extracts its content.
+    Args:
+        topic (str): The quantum topic to fetch. Can be:
+            - Pretty name: "Teleportation", "What Is Quantum"
+            - Slug: "teleportation", "what-is-quantum"
+            - Full path: "intro/teleportation.ipynb"
+        markdown_only (bool, optional): If True, include only markdown cells.
+            If False, also include code cells wrapped in ```python blocks.
+            Defaults to True.
+        include_headers (bool, optional): If True, prepend an H1 header with
+            the topic name for better readability. Defaults to True.
+    Returns:
+        str: The concatenated content of the notebook as formatted text,
+            with cells separated by double newlines. Returns error messages
+            if the topic is not found or if network requests fail.
+    Example:
+        >>> content = get_theory("teleportation")
+        >>> print(content[:100])
+        # Teleportation
+        Quantum teleportation is a process by which quantum information...
     """
     topics = get_theory_topics()
+    # Build lenient lookup table
     lookup: dict[str, str] = {}
+    for nice, path in topics.items():
+        slug = path.rsplit("/", 1)[-1].removesuffix(".ipynb")
+        lookup[nice.lower()] = path
+        lookup[slug.lower()] = path
+        lookup[path.lower()] = path
     key = topic.lower()
     if key not in lookup:
+        if not topics:
+            return "Unable to get theory - no topics available (network may be down)"
+        available_topics = ', '.join(topics.keys())
+        return f"Topic unknown: '{topic}'. Available topics: {available_topics}"
+    path = lookup[key]
+    try:
+        raw_json = requests.get(f"{RAW_ROOT}{path}", timeout=20).text
+        nb = nbformat.reads(raw_json, as_version=4)
+    except Exception:
+        return "Unable to get theory - failed to download or parse notebook content"
+    chunks: list[str] = []
     if include_headers:
+        chunks.append(f"# {_pretty(path)}\n")
     for cell in nb.cells:
         if cell.cell_type == "markdown":
+            chunks.append(cell.source)
         elif cell.cell_type == "code" and not markdown_only:
+            chunks.append(f"```python\n{cell.source}\n```")
+    return "\n\n".join(chunks)