sxandie committed
Commit 794fb9b · verified
1 Parent(s): 8dd7e23

Update mcp_server.py

Files changed (1)
  1. mcp_server.py +1823 -24
mcp_server.py CHANGED
@@ -1,45 +1,1844 @@
- """MCP server exposing repo analysis and Q&A tools.

- This allows any MCP-capable client (e.g., Claude Desktop, Cursor, Windsurf)
- to reuse the same backend logic that powers the Gradio UI.
  """

- from mcp.server.fastmcp import FastMCP

- from agent import analyze_github_repo, qa_on_repo, fetch_youtube_transcript

- server = FastMCP("github-doc-generator")


- @server.tool()
- def analyze_repository(repo_url: str) -> dict:
-     """Clone and inspect a GitHub repository.

-     Returns the same payload as the Gradio analyzer, including documentation
-     status, structure, and extracted doc content. Errors are surfaced as a
-     dictionary with an ``error`` key.
      """

-     return analyze_github_repo(repo_url)


- @server.tool()
- def ask_repository_question(repo_url: str, question: str) -> str:
-     """Answer a natural-language question about the given repository."""

-     return qa_on_repo(repo_url, question)


- @server.tool()
- def get_youtube_transcript(video_url: str, lang: str = "en") -> dict:
-     """Fetch a YouTube video's transcript via the RapidAPI backend.

-     This delegates to the shared `fetch_youtube_transcript` helper used by the
-     Gradio app. The response includes a raw transcript string and metadata.
      """

-     return fetch_youtube_transcript(video_url, lang=lang)


  if __name__ == "__main__":
-     server.run()
+ from datetime import datetime, timezone
+ from pathlib import Path
+ import os
+ import re
+ import shutil

+ import gradio as gr
+
+ from agent import (
+     analyze_github_repo,
+     analyze_local_repo,
+     build_experiment_from_report,
+     build_repo_vector_store,
+     fetch_youtube_transcript,
+     generate_youtube_study_notes,
+     rag_answer_from_store,
+     summarize_youtube_chapters,
+ )
+ from bookmarks import (
+     bookmark_repo_from_analysis,
+     find_metadata_by_label,
+     get_cache_dirs,
+     get_dropdown_options,
+ )
+
+
+ # File extensions and folders to ignore for local uploads
+ IGNORE_PATTERNS = {
+     'folders': {
+         '__pycache__', '.git', '.svn', '.hg', 'node_modules',
+         'venv', 'env', '.venv', '.env', 'dist', 'build',
+         '.idea', '.vscode', '.pytest_cache', '.mypy_cache',
+         'coverage', '.coverage', 'htmlcov', '.tox', 'eggs',
+         '.eggs', '*.egg-info', '.DS_Store'
+     },
+     'extensions': {
+         '.pyc', '.pyo', '.pyd', '.so', '.dll', '.dylib',
+         '.class', '.o', '.obj', '.exe', '.bin', '.lock',
+         '.log', '.tmp', '.temp', '.cache', '.bak', '.swp',
+         '.swo', '.DS_Store', '.gitignore'
+     }
+ }
+
+
+ def _should_ignore_path(path: Path) -> bool:
+     """Check if a path should be ignored during local folder processing."""
+     for part in path.parts:
+         if part in IGNORE_PATTERNS['folders']:
+             return True
+         if part.startswith('.') and part not in {'.', '..'}:
+             return True
+     if path.suffix.lower() in IGNORE_PATTERNS['extensions']:
+         return True
+     return False
+
+
+ KNOWLEDGE_TRANSFER_ROOT = Path("Knowledge Transfer")
+
+
+ def _is_gradio_v6_or_newer() -> bool:
+     """Return True if the installed Gradio major version is >= 6."""
+     version_str = getattr(gr, "__version__", "0")
+     try:
+         major = int(version_str.split(".")[0])
+         return major >= 6
+     except (ValueError, IndexError):
+         return False
+
+
+ IS_GRADIO_V6 = _is_gradio_v6_or_newer()
+
+
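The ignore filter above matches on directory names, dot-prefixed path parts, and file suffixes. A minimal sketch of the expected behaviour on a few hypothetical upload paths (run alongside the module above, which provides `_should_ignore_path`):

```python
from pathlib import Path

# Hypothetical paths from a directory upload; only real source files should survive.
print(_should_ignore_path(Path("proj/__pycache__/mod.cpython-311.pyc")))  # True: ignored folder and .pyc suffix
print(_should_ignore_path(Path("proj/.venv/lib/site.py")))                # True: dot-prefixed folder
print(_should_ignore_path(Path("proj/src/app.py")))                       # False: regular source file is kept
```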
+ def run_github_ingestion(repo_url: str):
74
+ """Analyze GitHub repository without indexing."""
75
+ repo_url = (repo_url or "").strip()
76
+ if not repo_url:
77
+ warning = "⚠️ Please paste a public GitHub repository URL to begin."
78
+ source_info = "**Source:** Not selected\n**Status:** ⏳ Pending\n**Chunks:** 0 vectors"
79
+ return warning, source_info, {
80
+ "analysis": None,
81
+ "vector_dir": "",
82
+ "vector_chunks": 0,
83
+ "summary_base": [],
84
+ }
85
+
86
+ result = analyze_github_repo(repo_url)
87
+ if "error" in result:
88
+ error_msg = f"❌ {result['error']}"
89
+ source_info = f"**Source:** {repo_url}\n**Status:** ❌ Error\n**Chunks:** 0 vectors"
90
+ return error_msg, source_info, {
91
+ "analysis": None,
92
+ "vector_dir": "",
93
+ "vector_chunks": 0,
94
+ "summary_base": [],
95
+ }
96
+
97
+ docs = result.get("documentation", [])
98
+ repo_name = result.get("repo_name", repo_url)
99
+ timestamp = datetime.now(timezone.utc).strftime("%d %b %Y, %H:%M UTC")
100
+
101
+ # Source info for preview panel
102
+ source_info = f"""**Source:** GitHub Repository
103
+ **Repository:** {repo_name}
104
+ **Status:** βœ… Analyzed
105
+ **Documents:** {len(docs)} files
106
+ **Analyzed:** {timestamp}"""
107
+
108
+ # Document preview content
109
+ preview_sections = []
110
+ for doc in docs[:5]:
111
+ content = (doc.get("content") or "").strip()
112
+ if not content:
113
+ continue
114
+ snippet = content[:600]
115
+ if len(content) > 600:
116
+ snippet = snippet.rstrip() + " ..."
117
+ preview_sections.append(
118
+ f"### πŸ“„ {doc.get('path', 'document')}\n\n{snippet}"
119
+ )
120
+
121
+ preview_content = (
122
+ "\n\n---\n\n".join(preview_sections)
123
+ if preview_sections
124
+ else "*No textual documentation snippets were found.*"
125
+ )
126
+
127
+ state_payload = {
128
+ "analysis": result,
129
+ "vector_dir": "",
130
+ "vector_chunks": 0,
131
+ "summary_base": [repo_name, str(len(docs))],
132
+ "processed_timestamp": timestamp,
133
+ "indexed": False,
134
+ }
135
+
136
+ return preview_content, source_info, state_payload
137
+
138
+
139
+ def index_github_repo(state_payload: dict | None):
140
+ """Index the analyzed GitHub repository for RAG."""
141
+ analysis_data = (state_payload or {}).get("analysis") if state_payload else None
142
+ if not analysis_data:
143
+ return "⚠️ Run analysis before indexing.", state_payload
144
+
145
+ if state_payload.get("indexed"):
146
+ return "βœ… Repository already indexed and ready for RAG queries.", state_payload
147
+
148
+ docs = analysis_data.get("documentation", [])
149
+ repo_name = analysis_data.get("repo_name", "repo")
150
+ repo_url = analysis_data.get("repo_url", "")
151
+
152
+ slug, cache_dir, cache_vector_dir = get_cache_dirs(repo_url, repo_name)
153
+ if cache_dir.exists():
154
+ shutil.rmtree(cache_dir)
155
+ cache_dir.mkdir(parents=True, exist_ok=True)
156
+
157
+ vector_chunks = 0
158
+ if docs:
159
+ _, chunk_count = build_repo_vector_store(docs, persist_path=cache_vector_dir)
160
+ vector_chunks = chunk_count
161
+ else:
162
+ return "⚠️ No documentation found to index.", state_payload
163
+
164
+ new_state = {
165
+ **state_payload,
166
+ "vector_dir": str(cache_vector_dir),
167
+ "vector_chunks": vector_chunks,
168
+ "indexed": True,
169
+ }
170
+
171
+ return f"βœ… Indexed {vector_chunks} vector chunks. Ready for RAG queries!", new_state
172
+
173
+
174
+ def bookmark_github_repo(state_payload: dict | None):
175
+ """Bookmark and index the GitHub repository permanently."""
176
+ analysis_data = (state_payload or {}).get("analysis") if state_payload else None
177
+ if not analysis_data:
178
+ return "⚠️ Run analysis before bookmarking.", state_payload, gr.Dropdown()
179
+
180
+ docs = analysis_data.get("documentation", [])
181
+ if not docs:
182
+ return "⚠️ No documentation to bookmark.", state_payload, gr.Dropdown()
183
+
184
+ repo_url = analysis_data.get("repo_url") or analysis_data.get("repo_name")
185
+
186
+ # Build vector store if not already done
187
+ vector_dir = state_payload.get("vector_dir") if state_payload else ""
188
+ if not vector_dir:
189
+ repo_name = analysis_data.get("repo_name", "repo")
190
+ slug, cache_dir, cache_vector_dir = get_cache_dirs(repo_url, repo_name)
191
+ if cache_dir.exists():
192
+ shutil.rmtree(cache_dir)
193
+ cache_dir.mkdir(parents=True, exist_ok=True)
194
+
195
+ if docs:
196
+ _, chunk_count = build_repo_vector_store(docs, persist_path=cache_vector_dir)
197
+ vector_dir = str(cache_vector_dir)
198
+ else:
199
+ chunk_count = 0
200
+ else:
201
+ chunk_count = state_payload.get("vector_chunks", 0)
202
+
203
+ metadata = bookmark_repo_from_analysis(
204
+ repo_url,
205
+ analysis_data,
206
+ prebuilt_vector_dir=Path(vector_dir) if vector_dir else None,
207
+ prebuilt_chunks=chunk_count,
208
+ )
209
+
210
+ choices, metadata_list = get_dropdown_options()
211
+ dropdown_update = gr.Dropdown(
212
+ choices=choices,
213
+ value=metadata.dropdown_label,
214
+ interactive=True,
215
+ )
216
+
217
+ new_state = {
218
+ **state_payload,
219
+ "vector_dir": vector_dir,
220
+ "vector_chunks": chunk_count,
221
+ "indexed": True,
222
+ }
223
+
224
+ return f"πŸ’Ύ Repository bookmarked on {metadata.last_pulled_display}. Access it in the Chat tab!", new_state, dropdown_update
225
+
226
+
227
+ def run_youtube_ingestion(youtube_url: str):
228
+ """Analyze YouTube video without indexing."""
229
+ youtube_url = (youtube_url or "").strip()
230
+ if not youtube_url:
231
+ warning = "⚠️ Paste a YouTube video URL to begin."
232
+ source_info = "**Source:** Not selected\n**Status:** ⏳ Pending\n**Chunks:** 0 vectors"
233
+ return warning, source_info, {
234
+ "analysis": None,
235
+ "vector_dir": "",
236
+ "vector_chunks": 0,
237
+ }
238
+
239
+ result = fetch_youtube_transcript(youtube_url)
240
+ if "error" in result:
241
+ error_msg = f"❌ {result['error']}"
242
+ source_info = f"**Source:** YouTube\n**Status:** ❌ Error\n**Chunks:** 0 vectors"
243
+ return error_msg, source_info, {
244
+ "analysis": None,
245
+ "vector_dir": "",
246
+ "vector_chunks": 0,
247
+ }
248
+
249
+ transcript = (result.get("raw_transcript") or "").strip()
250
+ if not transcript:
251
+ source_info = "**Source:** YouTube\n**Status:** ⚠️ No transcript\n**Chunks:** 0 vectors"
252
+ return "⚠️ No transcript text was returned.", source_info, {"analysis": None}
253
+
254
+ timestamp = datetime.now(timezone.utc).strftime("%d %b %Y, %H:%M UTC")
255
+ video_url = result.get("url", youtube_url)
256
+ lang = result.get("lang", "en")
257
+
258
+ # Source info for preview panel
259
+ source_info = f"""**Source:** YouTube Video
260
+ **URL:** {video_url}
261
+ **Language:** {lang}
262
+ **Status:** βœ… Analyzed
263
+ **Analyzed:** {timestamp}"""
264
+
265
+ # Generate chapter summaries
266
+ chapters = summarize_youtube_chapters(transcript, url=video_url)
267
+
268
+ # Preview content with chapters
269
+ preview_content = f"""### πŸ“Ί Video Transcript Analysis
270
+
271
+ {chapters}
272
+
273
+ ---
274
+
275
+ ### πŸ“ Transcript Preview
276
+
277
+ {transcript[:2000]}{"..." if len(transcript) > 2000 else ""}
278
  """
279
 
280
+ state_payload = {
281
+ "analysis": {
282
+ "transcript": transcript,
283
+ "url": video_url,
284
+ "lang": lang,
285
+ "chapters": chapters,
286
+ },
287
+ "vector_dir": "",
288
+ "vector_chunks": 0,
289
+ "indexed": False,
290
+ }
291
+
292
+ return preview_content, source_info, state_payload
293
+
294
+
295
+ def index_youtube_video(state_payload: dict | None):
296
+ """Index YouTube transcript for RAG."""
297
+ analysis_data = (state_payload or {}).get("analysis") if state_payload else None
298
+ if not analysis_data:
299
+ return "⚠️ Run analysis before indexing.", state_payload
300
+
301
+ if state_payload.get("indexed"):
302
+ return "βœ… Video already indexed and ready for RAG queries.", state_payload
303
+
304
+ transcript = analysis_data.get("transcript", "")
305
+ if not transcript:
306
+ return "⚠️ No transcript found to index.", state_payload
307
+
308
+ # Create pseudo-documents from transcript
309
+ docs = [{
310
+ "path": "transcript.txt",
311
+ "content": transcript,
312
+ "type": "transcript",
313
+ }]
314
+
315
+ url = analysis_data.get("url", "youtube")
316
+ slug, cache_dir, cache_vector_dir = get_cache_dirs(url, "youtube")
317
+ if cache_dir.exists():
318
+ shutil.rmtree(cache_dir)
319
+ cache_dir.mkdir(parents=True, exist_ok=True)
320
+
321
+ _, chunk_count = build_repo_vector_store(docs, persist_path=cache_vector_dir)
322
+
323
+ new_state = {
324
+ **state_payload,
325
+ "vector_dir": str(cache_vector_dir),
326
+ "vector_chunks": chunk_count,
327
+ "indexed": True,
328
+ }
329
+
330
+ return f"βœ… Indexed {chunk_count} transcript chunks. Ready for RAG queries!", new_state
331
+
332
 
333
+ def bookmark_youtube_video(state_payload: dict | None):
334
+ """Bookmark YouTube video - persists transcript to bookmarks system."""
335
+ analysis_data = (state_payload or {}).get("analysis") if state_payload else None
336
+ if not analysis_data:
337
+ return "⚠️ Run analysis before bookmarking.", state_payload, gr.Dropdown()
338
 
339
+ transcript = analysis_data.get("transcript", "")
340
+ if not transcript:
341
+ return "⚠️ No transcript found to bookmark.", state_payload, gr.Dropdown()
342
 
343
+ video_url = analysis_data.get("url", "youtube-video")
344
+ chapters = analysis_data.get("chapters", "")
345
+
346
+ # Create pseudo-analysis structure compatible with bookmark_repo_from_analysis
347
+ pseudo_analysis = {
348
+ "repo_name": f"YouTube: {video_url[:50]}",
349
+ "repo_url": video_url,
350
+ "documentation": [
351
+ {
352
+ "path": "transcript.txt",
353
+ "content": transcript,
354
+ },
355
+ {
356
+ "path": "chapters.md",
357
+ "content": chapters,
358
+ }
359
+ ],
360
+ }
361
+
362
+ # Use prebuilt vector store if already indexed
363
+ prebuilt_dir = None
364
+ prebuilt_chunks = None
365
+ if state_payload.get("indexed") and state_payload.get("vector_dir"):
366
+ prebuilt_dir = Path(state_payload["vector_dir"])
367
+ prebuilt_chunks = state_payload.get("vector_chunks", 0)
368
+
369
+ metadata = bookmark_repo_from_analysis(
370
+ video_url,
371
+ pseudo_analysis,
372
+ prebuilt_vector_dir=prebuilt_dir,
373
+ prebuilt_chunks=prebuilt_chunks,
374
+ )
375
+
376
+ choices, _ = get_dropdown_options()
377
+ dropdown_update = gr.Dropdown(choices=choices, value=metadata.dropdown_label)
378
+
379
+ new_state = {
380
+ **state_payload,
381
+ "vector_dir": metadata.vector_dir,
382
+ "vector_chunks": metadata.vector_chunks,
383
+ "indexed": True,
384
+ "bookmarked": True,
385
+ }
386
+
387
+ return f"πŸ”– YouTube video bookmarked! {metadata.vector_chunks} chunks indexed.", new_state, dropdown_update
388
 
 
 
 
389
 
390
+ def generate_youtube_transfer_report(youtube_url: str):
391
+ youtube_url = (youtube_url or "").strip()
392
+ if not youtube_url:
393
+ return "⚠️ Paste a YouTube video URL before generating a report."
394
+
395
+ result = fetch_youtube_transcript(youtube_url)
396
+ if "error" in result:
397
+ return f"❌ {result['error']}"
398
+
399
+ transcript = (result.get("raw_transcript") or "").strip()
400
+ if not transcript:
401
+ return "No transcript text was returned by the youtube-transcript MCP server; report generation was skipped."
402
+
403
+ chapters = summarize_youtube_chapters(transcript, url=result.get("url", youtube_url))
404
+ study_notes = generate_youtube_study_notes(chapters, url=result.get("url", youtube_url))
405
+
406
+ generated_at = datetime.now(timezone.utc).strftime("%Y-%m-%d %H:%M:%S %Z")
407
+ header_lines = [
408
+ "# YouTube Knowledge Transfer Report",
409
+ "",
410
+ f"- Source: {result.get('url', youtube_url)}",
411
+ f"- Language: {result.get('lang', 'en')}",
412
+ f"- Generated at: {generated_at}",
413
+ ]
414
+
415
+ lines: list[str] = []
416
+ lines.extend(header_lines)
417
+ lines.append("")
418
+ lines.append("## 1. Topic & Chapter Outline")
419
+ lines.append("")
420
+ lines.append(chapters)
421
+ lines.append("")
422
+ lines.append("## 2. Study & Interview Guidance")
423
+ lines.append("")
424
+ lines.append(study_notes)
425
+
426
+ report_markdown = "\n".join(lines)
427
+
428
+ root = _ensure_knowledge_root()
429
+ youtube_root = root / "Youtube Video"
430
+ youtube_root.mkdir(parents=True, exist_ok=True)
431
+ slug = _slugify_name(result.get("url", youtube_url))
432
+ ts = datetime.now(timezone.utc).strftime("%Y%m%d-%H%M%S")
433
+ report_path = youtube_root / f"{slug}-youtube-knowledge-{ts}.md"
434
+ report_path.write_text(report_markdown, encoding="utf-8")
435
+
436
+ rel_path = report_path.relative_to(Path("."))
437
+ return f"πŸ“„ YouTube knowledge transfer report written to `{rel_path}`."
438
+
439
+
440
+ def _ensure_knowledge_root() -> Path:
441
+ KNOWLEDGE_TRANSFER_ROOT.mkdir(parents=True, exist_ok=True)
442
+ return KNOWLEDGE_TRANSFER_ROOT
443
+
444
+
445
+ def _slugify_name(name: str) -> str:
446
+ base = (name or "project").lower()
447
+ safe = re.sub(r"[^a-z0-9-]+", "-", base).strip("-")
448
+ return safe or "project"
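Report filenames further down are derived from this slug. A small sketch of what the regex produces (example inputs are made up, and `_slugify_name` from above is assumed to be in scope):

```python
# Non-alphanumeric runs collapse to single dashes; empty input falls back to "project".
print(_slugify_name("My Repo!"))                      # -> "my-repo"
print(_slugify_name("https://github.com/user/repo"))  # -> "https-github-com-user-repo"
print(_slugify_name(""))                              # -> "project"
```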
449
+
450
+
451
+ def generate_knowledge_transfer_report(state_payload: dict | None):
452
+ analysis_data = (state_payload or {}).get("analysis") if state_payload else None
453
+ if not analysis_data:
454
+ return "⚠️ Run an analysis before generating a report."
455
+
456
+ repo_name = analysis_data.get("repo_name") or "Project"
457
+ repo_url = analysis_data.get("repo_url") or "local upload"
458
+ docs = analysis_data.get("documentation") or []
459
+ doc_count = len(docs)
460
+ structure = analysis_data.get("structure") or []
461
+
462
+ vector_dir = state_payload.get("vector_dir") if state_payload else ""
463
+ vector_chunks = state_payload.get("vector_chunks", 0) if state_payload else 0
464
+ summary_base = state_payload.get("summary_base", []) if state_payload else []
465
+ processed_timestamp = state_payload.get("processed_timestamp") if state_payload else None
466
+
467
+ generated_at = datetime.now(timezone.utc).strftime("%Y-%m-%d %H:%M:%S %Z")
468
+ header_lines = [
469
+ f"# Knowledge Transfer Report – {repo_name}",
470
+ "",
471
+ f"- Source: {repo_url}",
472
+ f"- Generated at: {generated_at}",
473
+ f"- Documentation files: {doc_count}",
474
+ f"- Vector chunks: {vector_chunks}",
475
+ ]
476
+ if processed_timestamp:
477
+ header_lines.append(f"- Last analysis run: {processed_timestamp}")
478
+
479
+ overview_section = "\n".join(summary_base) if summary_base else "No high-level summary was captured during analysis."
480
+
481
+ llm_summary_section = ""
482
+ if vector_dir and vector_chunks:
483
+ try:
484
+ question = (
485
+ "Provide a detailed knowledge transfer summary of this repository. "
486
+ "Explain its purpose, main components, architecture, key dependencies, "
487
+ "and patterns that would be reusable in other projects. "
488
+ "Focus on actionable insights and how to extend or adapt this codebase."
489
+ )
490
+ llm_summary_section = rag_answer_from_store(Path(vector_dir), question, repo_summary=overview_section)
491
+ except Exception as err:
492
+ llm_summary_section = f"LLM summary unavailable due to error: {err}"
493
+ else:
494
+ llm_summary_section = "Vector store not available; running RAG-based summary was skipped."
495
+
496
+ max_items = 80
497
+ structure_snippet = "\n".join(structure[:max_items]) if structure else "No repository structure information was captured."
498
+ doc_paths = [d.get("path", "") for d in docs][:max_items]
499
+ docs_list_section = "\n".join(f"- {p}" for p in doc_paths) if doc_paths else "No documentation files were detected."
500
+
501
+ lines: list[str] = []
502
+ lines.extend(header_lines)
503
+ lines.append("")
504
+ lines.append("## 1. High-level Overview")
505
+ lines.append("")
506
+ lines.append(overview_section)
507
+ lines.append("")
508
+ lines.append("## 2. Repository Layout (snapshot)")
509
+ lines.append("")
510
+ lines.append("```")
511
+ lines.append(structure_snippet)
512
+ lines.append("```")
513
+ lines.append("")
514
+ lines.append("## 3. Documentation Files")
515
+ lines.append("")
516
+ lines.append(docs_list_section)
517
+ lines.append("")
518
+ lines.append("## 4. LLM Knowledge Summary")
519
+ lines.append("")
520
+ lines.append(llm_summary_section)
521
+ lines.append("")
522
+ lines.append("## 5. Notes for Future Reuse")
523
+ lines.append("")
524
+ lines.append(
525
+ "Use this report as a starting point when designing new projects. "
526
+ "Focus on reusing architecture patterns, utility modules, and any "
527
+ "documented best practices or workflows."
528
+ )
529
+
530
+ report_markdown = "\n".join(lines)
531
+
532
+ root = _ensure_knowledge_root()
533
+ slug = _slugify_name(repo_name)
534
+ ts = datetime.now(timezone.utc).strftime("%Y%m%d-%H%M%S")
535
+ report_path = root / f"{slug}-knowledge-transfer-{ts}.md"
536
+ report_path.write_text(report_markdown, encoding="utf-8")
537
+
538
+ rel_path = report_path.relative_to(Path("."))
539
+ return f"πŸ“„ Knowledge transfer report written to `{rel_path}`."
540
+
541
+
542
+ def _list_knowledge_report_choices() -> list[str]:
543
+ root = _ensure_knowledge_root()
544
+ reports = sorted(root.glob("*.md"))
545
+ return [report.name for report in reports]
546
+
547
+
548
+ def _refresh_lab_reports_dropdown():
549
+ return gr.Dropdown(
550
+ label="Knowledge Transfer report (optional)",
551
+ choices=_list_knowledge_report_choices(),
552
+ value=None,
553
+ interactive=True,
554
+ )
555
+
556
+
557
+ def load_study_deck_from_report(report_name: str | None) -> str:
558
+ if not report_name:
559
+ return "Select a Knowledge Transfer report above to view its study deck-style summary."
560
+ root = _ensure_knowledge_root()
561
+ report_path = root / report_name
562
+ if not report_path.exists():
563
+ return f"Report `{report_name}` was not found in the Knowledge Transfer folder."
564
+ try:
565
+ raw = report_path.read_text(encoding="utf-8", errors="ignore")
566
+ except OSError as err:
567
+ return f"Unable to read report `{report_name}`: {err}"
568
+
569
+ max_chars = 6000
570
+ snippet = raw[:max_chars]
571
+ if len(raw) > max_chars:
572
+ snippet = snippet.rstrip() + "\n\n... (truncated)"
573
+
574
+ return (
575
+ f"### Study Deck Β· {report_name}\n\n"
576
+ "Scroll through this condensed report to refresh yourself on the key concepts, "
577
+ "architecture, and reusable patterns for this project.\n\n"
578
+ f"```markdown\n{snippet}\n```"
579
+ )
580
+
581
+
582
+ def _derive_local_repo_root(uploaded: str | list[str] | None) -> Path | None:
583
+ """Given a directory-style file upload, infer the repository root directory.
584
+
585
+ Gradio's File component with ``file_count="directory"`` returns a list of
586
+ filepaths under the uploaded folder (or a single filepath). We compute the
587
+ common parent directory and treat that as the repo root.
588
  """
589
+ if not uploaded:
590
+ return None
591
+ if isinstance(uploaded, str):
592
+ paths = [uploaded]
593
+ else:
594
+ paths = [p for p in uploaded if p]
595
+ if not paths:
596
+ return None
597
+ try:
598
+ common = os.path.commonpath(paths)
599
+ except ValueError:
600
+ return None
601
+ root = Path(common)
602
+ return root if root.exists() and root.is_dir() else None
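The common-parent inference described in the docstring boils down to `os.path.commonpath`; a hedged sketch with made-up upload paths:

```python
import os
from pathlib import Path

# Two files returned by a hypothetical directory upload; their common parent becomes the repo root.
uploaded = [
    "/tmp/gradio/upload/myproj/README.md",
    "/tmp/gradio/upload/myproj/src/app.py",
]
root = Path(os.path.commonpath(uploaded))
print(root)  # -> /tmp/gradio/upload/myproj (used only if the directory actually exists)
```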
603
+
604
+
605
+ def run_local_repo_ingestion(uploaded_folder):
606
+ """Analyze local repository folder, filtering irrelevant files."""
607
+ repo_root = _derive_local_repo_root(uploaded_folder)
608
+ if not repo_root:
609
+ warning = "⚠️ Upload a project folder before running analysis."
610
+ source_info = "**Source:** Not selected\n**Status:** ⏳ Pending\n**Chunks:** 0 vectors"
611
+ return warning, source_info, {
612
+ "analysis": None,
613
+ "vector_dir": "",
614
+ "vector_chunks": 0,
615
+ "summary_base": [],
616
+ }
617
+
618
+ # Filter out irrelevant files before analysis
619
+ if isinstance(uploaded_folder, list):
620
+ filtered_files = [f for f in uploaded_folder if not _should_ignore_path(Path(f))]
621
+ if not filtered_files:
622
+ warning = "⚠️ No relevant files found after filtering."
623
+ source_info = "**Source:** Local\n**Status:** ⚠️ No files\n**Chunks:** 0 vectors"
624
+ return warning, source_info, {
625
+ "analysis": None,
626
+ "vector_dir": "",
627
+ "vector_chunks": 0,
628
+ "summary_base": [],
629
+ }
630
+
631
+ result = analyze_local_repo(str(repo_root))
632
+ if "error" in result:
633
+ error_msg = f"❌ {result['error']}"
634
+ source_info = f"**Source:** Local\n**Status:** ❌ Error\n**Chunks:** 0 vectors"
635
+ return error_msg, source_info, {
636
+ "analysis": None,
637
+ "vector_dir": "",
638
+ "vector_chunks": 0,
639
+ "summary_base": [],
640
+ }
641
+
642
+ docs = result.get("documentation", [])
643
+ repo_name = result.get("repo_name", repo_root.name)
644
+ timestamp = datetime.now(timezone.utc).strftime("%d %b %Y, %H:%M UTC")
645
+
646
+ # Source info for preview panel
647
+ source_info = f"""**Source:** Local Project
648
+ **Folder:** {repo_name}
649
+ **Status:** βœ… Analyzed
650
+ **Documents:** {len(docs)} files
651
+ **Analyzed:** {timestamp}"""
652
+
653
+ # Document preview content
654
+ preview_sections = []
655
+ for doc in docs[:5]:
656
+ content = (doc.get("content") or "").strip()
657
+ if not content:
658
+ continue
659
+ snippet = content[:600]
660
+ if len(content) > 600:
661
+ snippet = snippet.rstrip() + " ..."
662
+ preview_sections.append(
663
+ f"### πŸ“„ {doc.get('path', 'document')}\n\n{snippet}"
664
+ )
665
+
666
+ preview_content = (
667
+ "\n\n---\n\n".join(preview_sections)
668
+ if preview_sections
669
+ else "*No textual documentation snippets were found.*"
670
+ )
671
+
672
+ state_payload = {
673
+ "analysis": result,
674
+ "vector_dir": "",
675
+ "vector_chunks": 0,
676
+ "summary_base": [repo_name, str(len(docs))],
677
+ "processed_timestamp": timestamp,
678
+ "indexed": False,
679
+ }
680
+
681
+ return preview_content, source_info, state_payload
682
+
683
+
684
+ def index_local_repo(state_payload: dict | None):
685
+ """Index the analyzed local repository for RAG."""
686
+ return index_github_repo(state_payload) # Same logic
687
+
688
+
689
+ def bookmark_local_repo(state_payload: dict | None):
690
+ """Bookmark and index the local repository permanently."""
691
+ return bookmark_github_repo(state_payload) # Same logic
692
+
693
+
694
+ def _format_bookmark_info(metadata: dict | None) -> str:
695
+ if not metadata:
696
+ return (
697
+ "No bookmarks yet. Process a repository in the *Process New Repository* tab, then bookmark it to enable RAG chat."
698
+ )
699
+ preview = (metadata.get("summary_preview") or "").strip()
700
+ if preview:
701
+ max_len = 600
702
+ if len(preview) > max_len:
703
+ preview_display = preview[:max_len].rstrip() + " ..."
704
+ else:
705
+ preview_display = preview
706
+ return (
707
+ f"### {metadata.get('repo_name', 'Saved Repository')}\n"
708
+ f"- URL: {metadata.get('repo_url', 'N/A')}\n"
709
+ f"- Last pulled: {metadata.get('last_pulled_display', '--/--/----')}\n"
710
+ f"- Documentation files: {metadata.get('docs_count', 0)}\n"
711
+ f"- Vector chunks: {metadata.get('vector_chunks', 0)}\n\n"
712
+ f"**Preview:**\n\n{preview_display}"
713
+ )
714
+ return (
715
+ f"### {metadata.get('repo_name', 'Saved Repository')}\n"
716
+ f"- URL: {metadata.get('repo_url', 'N/A')}\n"
717
+ f"- Last pulled: {metadata.get('last_pulled_display', '--/--/----')}\n"
718
+ f"- Documentation files: {metadata.get('docs_count', 0)}\n"
719
+ f"- Vector chunks: {metadata.get('vector_chunks', 0)}"
720
+ )
721
+
722
+
723
+ def _refresh_bookmarks(preselect: str | None = None):
724
+ choices, metadata_list = get_dropdown_options()
725
+ value = preselect if preselect and preselect in choices else (choices[0] if choices else None)
726
+ dropdown_update = gr.Dropdown(
727
+ choices=choices,
728
+ value=value,
729
+ interactive=bool(choices),
730
+ label="Bookmarked repositories",
731
+ allow_custom_value=True,
732
+ )
733
+ info = _format_bookmark_info(
734
+ find_metadata_by_label(value, metadata_list) if value else None
735
+ )
736
+ return dropdown_update, metadata_list, info
737
+
738
+
739
+ def load_bookmarks_on_start():
740
+ dropdown_update, metadata_list, info = _refresh_bookmarks()
741
+ status = "Bookmarks loaded." if metadata_list else "No bookmarks saved yet."
742
+ return dropdown_update, metadata_list, info, status
743
+
744
+
745
+ def _build_summary_from_base(base_lines: list[str], final_message: str) -> str:
746
+ if not base_lines:
747
+ return final_message
748
+ return "\n".join(base_lines + ["", final_message])
749
+
750
+
751
+ def bookmark_current_repo(state_payload: dict | None):
752
+ analysis_data = (state_payload or {}).get("analysis") if state_payload else None
753
+ if not analysis_data or not analysis_data.get("documentation"):
754
+ return (
755
+ "⚠️ Run an analysis before bookmarking a repository.",
756
+ gr.Dropdown(choices=[], value=None, interactive=False, label="Bookmarked repositories"),
757
+ [],
758
+ _format_bookmark_info(None),
759
+ _build_summary_from_base(
760
+ (state_payload or {}).get("summary_base", []),
761
+ "⚠️ Bookmark failed because no analysis data is available.",
762
+ ),
763
+ state_payload,
764
+ )
765
+
766
+ repo_url = analysis_data.get("repo_url") or analysis_data.get("repo_name")
767
+ vector_dir = state_payload.get("vector_dir") if state_payload else ""
768
+ metadata = bookmark_repo_from_analysis(
769
+ repo_url,
770
+ analysis_data,
771
+ prebuilt_vector_dir=Path(vector_dir) if vector_dir else None,
772
+ prebuilt_chunks=state_payload.get("vector_chunks") if state_payload else None,
773
+ )
774
+ dropdown_update, metadata_list, info = _refresh_bookmarks(preselect=metadata.dropdown_label)
775
+ saved_msg = (
776
+ f"πŸ’Ύ Repo saved on {metadata.last_pulled_display}. Access it via the Bookmarked tab for RAG chat."
777
+ )
778
+ updated_summary = _build_summary_from_base(
779
+ state_payload.get("summary_base", []),
780
+ saved_msg,
781
+ )
782
+ new_state = {
783
+ **(state_payload or {}),
784
+ "summary_base": state_payload.get("summary_base", []),
785
+ "saved": True,
786
+ }
787
+ return saved_msg, dropdown_update, metadata_list, info, updated_summary, new_state
788
+
789
 
790
+ def update_selected_bookmark(label: str, metadata_list: list[dict]):
791
+ metadata = find_metadata_by_label(label, metadata_list or []) if label else None
792
+ return _format_bookmark_info(metadata)
793
 
794
 
795
+ def answer_bookmark_question(label: str, question: str, metadata_list: list[dict]):
796
+ if not label:
797
+ return "Select a bookmarked repository before asking a question."
798
+ if not question.strip():
799
+ return "Enter a question to query your bookmarked repository."
800
 
801
+ metadata = find_metadata_by_label(label, metadata_list or [])
802
+ if not metadata:
803
+ return "Bookmark metadata not found. Try refreshing bookmarks."
804
+ if metadata.get("vector_chunks", 0) == 0:
805
+ return "This bookmark has no vector store yet. Re-bookmark the repo to rebuild embeddings."
806
 
807
+ summary = (
808
+ f"Repository: {metadata.get('repo_name', label)}\n"
809
+ f"Docs: {metadata.get('docs_count', 0)} | Last pulled: {metadata.get('last_pulled_display', '--/--/----')}"
810
+ )
811
+ answer = rag_answer_from_store(Path(metadata["vector_dir"]), question, repo_summary=summary)
812
+ return answer
813
 
 
 
 
814
 
815
+ def placeholder_action_message(label: str):
816
+ if not label:
817
+ return "Select a bookmarked repository to use this action."
818
+ return f"Additional bookmark actions for **{label}** are coming soon."
819
+
820
+
821
+ def run_experimental_lab(intention: str, report_name: str | None):
822
+ text = (intention or "").strip()
823
+ if not text:
824
+ return "Describe what you want to build in the Experimental Lab to get started."
825
+
826
+ root = _ensure_knowledge_root()
827
+ report_markdown = ""
828
+ context_note = ""
829
+ if report_name:
830
+ report_path = root / report_name
831
+ if report_path.exists():
832
+ try:
833
+ raw = report_path.read_text(encoding="utf-8", errors="ignore")
834
+ report_markdown = raw
835
+ snippet = raw[:3000]
836
+ context_note = (
837
+ f"Using Knowledge Transfer report: `{report_name}` as reference.\n\n"
838
+ f"Snippet from report (truncated):\n\n```markdown\n{snippet}\n```\n\n"
839
+ )
840
+ except OSError:
841
+ context_note = f"Unable to read Knowledge Transfer report `{report_name}`. Proceeding without embedded context.\n\n"
842
+
843
+ build_result = build_experiment_from_report(text, report_markdown)
844
+ code = build_result.get("code", "")
845
+ stdout = build_result.get("stdout", "")
846
+ error = build_result.get("error", "")
847
+
848
+ base_intro = (
849
+ "Experimental Lab is a sandbox where future versions of MonkeyMind will use "
850
+ "Knowledge Transfer reports as context to plan and build small Gradio apps.\n\n"
851
+ )
852
+
853
+ code_section = "### Generated experiment code\n\n"
854
+ if code:
855
+ code_section += f"```python\n{code}\n```\n\n"
856
+ else:
857
+ code_section += "No code was generated.\n\n"
858
+
859
+ results_section = "### Sandbox output\n\n"
860
+ if stdout:
861
+ results_section += f"**Stdout / logs:**\n\n```text\n{stdout}\n```\n\n"
862
+ if error:
863
+ results_section += f"**Error:**\n\n```text\n{error}\n```\n\n"
864
+ if not stdout and not error:
865
+ results_section += "No errors encountered during sandbox test.\n\n"
866
+
867
+ return (
868
+ base_intro
869
+ + context_note
870
+ + f"You wrote:\n\n> {text}\n\n"
871
+ + code_section
872
+ + results_section
873
+ )
874
+
875
+
876
+ def lab_fix_bugs(intention: str, report_name: str | None):
877
+ base = run_experimental_lab(intention, report_name)
878
+ return (
879
+ base
880
+ + "\n\n---\n\n_This Fix bugs action will eventually trigger another build iteration to resolve errors in the generated app. "
881
+ "For now, it simply records another planning pass based on your intention and chosen report._"
882
+ )
883
+
884
+
885
+ def lab_mark_happy(intention: str, report_name: str | None):
886
+ text = (intention or "").strip()
887
+ return (
888
+ "Marking this experiment as complete.\n\n"
889
+ f"Final intention:\n\n> {text or 'N/A'}\n\n"
890
+ "You can now export or reuse this idea elsewhere. Future versions will attach concrete code artifacts here."
891
+ )
892
+
893
+
894
+ def lab_export_project(intention: str, report_name: str | None):
895
+ text = (intention or "").strip()
896
+ return (
897
+ "Export placeholder: a future version will bundle generated code, configuration, and a short README "
898
+ "into a downloadable package.\n\n"
899
+ f"Current experiment description:\n\n> {text or 'N/A'}\n\n"
900
+ f"Reference report: `{report_name or 'none selected'}`."
901
+ )
902
+
903
+
904
+ def answer_chat_question(question: str, github_state, local_state, youtube_state, selected_bookmark, metadata_list):
905
+ """Answer questions using RAG from any indexed source or bookmark."""
906
+ if not question.strip():
907
+ return "Please enter a question."
908
+
909
+ # Check if using a bookmark
910
+ if selected_bookmark:
911
+ metadata = find_metadata_by_label(selected_bookmark, metadata_list or [])
912
+ if metadata and metadata.get("vector_chunks", 0) > 0:
913
+ summary = (
914
+ f"Repository: {metadata.get('repo_name', selected_bookmark)}\n"
915
+ f"Last pulled: {metadata.get('last_pulled_display', '--/--/----')}"
916
+ )
917
+ answer = rag_answer_from_store(Path(metadata["vector_dir"]), question, repo_summary=summary)
918
+ return f"**[Bookmark: {selected_bookmark}]**\n\n{answer}"
919
+
920
+ # Check current session sources
921
+ for state, label in [
922
+ (github_state, "GitHub"),
923
+ (local_state, "Local"),
924
+ (youtube_state, "YouTube"),
925
+ ]:
926
+ if state and state.get("indexed") and state.get("vector_dir"):
927
+ vector_dir = Path(state["vector_dir"])
928
+ if vector_dir.exists():
929
+ answer = rag_answer_from_store(vector_dir, question)
930
+ return f"**[{label} Source]**\n\n{answer}"
931
+
932
+ return "⚠️ No indexed sources available. Please index a repository or select a bookmark first."
933
+
934
+
935
+ def generate_and_download_report(state_payload: dict | None, source_type: str):
936
+ """Generate markdown report and return file path for download."""
937
+ analysis_data = (state_payload or {}).get("analysis") if state_payload else None
938
+ if not analysis_data:
939
+ return None
940
+
941
+ if source_type == "youtube":
942
+ transcript = analysis_data.get("transcript", "")
943
+ chapters = analysis_data.get("chapters", "")
944
+ url = analysis_data.get("url", "youtube")
945
+ lang = analysis_data.get("lang", "en")
946
+
947
+ study_notes = generate_youtube_study_notes(chapters, url=url)
948
+
949
+ generated_at = datetime.now(timezone.utc).strftime("%Y-%m-%d %H:%M:%S %Z")
950
+ lines = [
951
+ "# YouTube Knowledge Transfer Report",
952
+ "",
953
+ f"- Source: {url}",
954
+ f"- Language: {lang}",
955
+ f"- Generated at: {generated_at}",
956
+ "",
957
+ "## 1. Chapter Outline",
958
+ "",
959
+ chapters,
960
+ "",
961
+ "## 2. Study Notes",
962
+ "",
963
+ study_notes,
964
+ ]
965
+ else:
966
+ # GitHub or Local repo
967
+ repo_name = analysis_data.get("repo_name", "Project")
968
+ repo_url = analysis_data.get("repo_url", "local")
969
+ docs = analysis_data.get("documentation", [])
970
+
971
+ generated_at = datetime.now(timezone.utc).strftime("%Y-%m-%d %H:%M:%S %Z")
972
+ lines = [
973
+ f"# Knowledge Transfer Report – {repo_name}",
974
+ "",
975
+ f"- Source: {repo_url}",
976
+ f"- Generated at: {generated_at}",
977
+ f"- Documentation files: {len(docs)}",
978
+ "",
979
+ "## Documentation Files",
980
+ "",
981
+ ]
982
+ for doc in docs[:50]:
983
+ lines.append(f"- {doc.get('path', 'unknown')}")
984
+
985
+ report_markdown = "\n".join(lines)
986
+
987
+ root = _ensure_knowledge_root()
988
+ slug = _slugify_name(analysis_data.get("repo_name", "project"))
989
+ ts = datetime.now(timezone.utc).strftime("%Y%m%d-%H%M%S")
990
+ report_path = root / f"{slug}-report-{ts}.md"
991
+ report_path.write_text(report_markdown, encoding="utf-8")
992
+
993
+ return str(report_path)
994
+
995
+
996
+ def refresh_bookmarks_dropdown():
997
+ """Refresh the bookmarks dropdown."""
998
+ choices, metadata_list = get_dropdown_options()
999
+ return gr.Dropdown(choices=choices, value=None, interactive=True), metadata_list
1000
+
1001
+
1002
+ def build_interface() -> tuple[gr.Blocks, gr.Theme | None, str | None]:
1003
+ """Build the Gradio interface with improved UI/UX inspired by modern dashboard design."""
1004
+
1005
+ custom_css = """
1006
+ @import url('https://fonts.googleapis.com/css2?family=Outfit:wght@300;400;500;600;700&family=JetBrains+Mono:wght@400;500&display=swap');
1007
+
1008
+ :root {
1009
+ --primary: #34d399; /* Mint Green */
1010
+ --primary-glow: rgba(52, 211, 153, 0.4);
1011
+ --glass-bg: rgba(15, 23, 42, 0.6);
1012
+ --glass-border: rgba(255, 255, 255, 0.08);
1013
+ --text-main: #f8fafc;
1014
+ --text-muted: #94a3b8;
1015
+ }
1016
+
1017
+ body {
1018
+ background-color: #0f172a;
1019
+ color: var(--text-main);
1020
+ font-family: 'Outfit', sans-serif !important;
1021
+ }
1022
+
1023
+ /* Global container override */
1024
+ .gradio-container {
1025
+ max-width: 1400px !important;
1026
+ background: #0f172a !important;
1027
+ background-image:
1028
+ radial-gradient(circle at 0% 0%, rgba(52, 211, 153, 0.15) 0%, transparent 50%),
1029
+ radial-gradient(circle at 100% 100%, rgba(16, 185, 129, 0.1) 0%, transparent 50%) !important;
1030
+ border: none !important;
1031
+ }
1032
+
1033
+ /* Header styling */
1034
+ .header-container {
1035
+ background: rgba(15, 23, 42, 0.8);
1036
+ backdrop-filter: blur(12px);
1037
+ border-bottom: 1px solid var(--glass-border);
1038
+ padding: 20px 24px;
1039
+ margin: -16px -16px 24px -16px;
1040
+ border-radius: 0;
1041
+ }
1042
+
1043
+ /* Card/Panel styling */
1044
+ .source-card, .gradio-group, .tabs, .tabitem, .box-container {
1045
+ background: var(--glass-bg) !important;
1046
+ backdrop-filter: blur(12px);
1047
+ border: 1px solid var(--glass-border) !important;
1048
+ border-radius: 16px !important;
1049
+ box-shadow: 0 4px 20px rgba(0, 0, 0, 0.2);
1050
+ padding: 20px !important;
1051
+ margin-bottom: 20px !important;
1052
+ }
1053
+
1054
+ /* Inputs and Textareas */
1055
+ input, textarea, .gr-input, .gr-box, .dropdown-wrap {
1056
+ background-color: rgba(30, 41, 59, 0.6) !important;
1057
+ border: 1px solid rgba(255, 255, 255, 0.1) !important;
1058
+ color: var(--text-main) !important;
1059
+ border-radius: 10px !important;
1060
+ }
1061
+
1062
+ input:focus, textarea:focus {
1063
+ border-color: var(--primary) !important;
1064
+ box-shadow: 0 0 0 2px var(--primary-glow) !important;
1065
+ }
1066
+
1067
+ /* Buttons */
1068
+ button.primary {
1069
+ background: linear-gradient(135deg, #34d399 0%, #10b981 100%) !important;
1070
+ color: #0f172a !important;
1071
+ font-weight: 600 !important;
1072
+ border: none !important;
1073
+ box-shadow: 0 4px 15px rgba(52, 211, 153, 0.3) !important;
1074
+ }
1075
+ button.secondary {
1076
+ background: rgba(30, 41, 59, 0.8) !important;
1077
+ border: 1px solid rgba(255, 255, 255, 0.1) !important;
1078
+ color: var(--text-muted) !important;
1079
+ }
1080
+ button.secondary:hover {
1081
+ color: var(--text-main) !important;
1082
+ border-color: var(--primary) !important;
1083
+ }
1084
+ button.stop {
1085
+ background: linear-gradient(135deg, #f87171 0%, #ef4444 100%) !important;
1086
+ color: white !important;
1087
+ }
1088
+
1089
+ /* Status indicators */
1090
+ .status-ready {
1091
+ background: rgba(16, 185, 129, 0.1);
1092
+ color: #34d399;
1093
+ padding: 6px 12px;
1094
+ border-radius: 20px;
1095
+ font-size: 12px;
1096
+ border: 1px solid rgba(16, 185, 129, 0.2);
1097
+ }
1098
+
1099
+ .status-pending {
1100
+ background: rgba(251, 191, 36, 0.1);
1101
+ color: #fbbf24;
1102
+ padding: 6px 12px;
1103
+ border-radius: 20px;
1104
+ font-size: 12px;
1105
+ border: 1px solid rgba(251, 191, 36, 0.2);
1106
+ }
1107
+
1108
+ /* Keep copy/like buttons always visible and styled */
1109
+ .message-buttons {
1110
+ opacity: 1 !important;
1111
+ display: flex !important;
1112
+ gap: 4px !important;
1113
+ }
1114
+ .message-buttons button {
1115
+ color: #94a3b8 !important; /* text-muted */
1116
+ background: transparent !important;
1117
+ border: none !important;
1118
+ box-shadow: none !important;
1119
+ }
1120
+ .message-buttons button:hover {
1121
+ color: #34d399 !important; /* primary */
1122
+ background: rgba(52, 211, 153, 0.1) !important;
1123
+ }
1124
+
1125
+ /* Chat bubbles */
1126
+ .chat-assistant {
1127
+ background: rgba(30, 41, 59, 0.8) !important;
1128
+ border: 1px solid var(--glass-border);
1129
+ border-radius: 18px 18px 18px 4px !important;
1130
+ color: var(--text-main) !important;
1131
+ }
1132
+ .chat-user {
1133
+ background: linear-gradient(135deg, #34d399 0%, #10b981 100%) !important;
1134
+ color: #022c22 !important;
1135
+ border-radius: 18px 18px 4px 18px !important;
1136
+ font-weight: 500;
1137
+ }
1138
+
1139
+ /* Chat message text size and font */
1140
+ .message-wrap .message {
1141
+ font-size: 0.9rem !important;
1142
+ font-family: 'JetBrains Mono', monospace !important;
1143
+ line-height: 1.5 !important;
1144
+ }
1145
+
1146
+ /* Typography overrides */
1147
+ .prose, .prose h1, .prose h2, .prose h3, .prose p, .prose strong {
1148
+ color: var(--text-main) !important;
1149
+ }
1150
+
1151
+ /* Scrollbar */
1152
+ ::-webkit-scrollbar { width: 6px; height: 6px; }
1153
+ ::-webkit-scrollbar-track { background: transparent; }
1154
+ ::-webkit-scrollbar-thumb { background: #334155; border-radius: 10px; }
1155
+ ::-webkit-scrollbar-thumb:hover { background: #475569; }
1156
  """
1157
 
1158
+ app_theme = gr.themes.Soft(
1159
+ primary_hue="emerald",
1160
+ secondary_hue="slate",
1161
+ neutral_hue="slate",
1162
+ ).set(
1163
+ body_background_fill="#0f172a",
1164
+ block_background_fill="#1e293b",
1165
+ block_border_color="rgba(255,255,255,0.1)",
1166
+ input_background_fill="#0f172a",
1167
+ button_primary_background_fill="#34d399",
1168
+ button_primary_text_color="#0f172a",
1169
+ )
1170
+
1171
+ blocks_kwargs = {"title": "πŸ’ MonkeyMind - Knowledge Transfer Agent"}
1172
+ if not IS_GRADIO_V6:
1173
+ blocks_kwargs.update(theme=app_theme, css=custom_css)
1174
+
1175
+ with gr.Blocks(**blocks_kwargs) as demo:
1176
+
1177
+ # State variables
1178
+ github_state = gr.State({})
1179
+ local_state = gr.State({})
1180
+ youtube_state = gr.State({})
1181
+ bookmarks_metadata = gr.State([])
1182
+ chat_history = gr.State([])
1183
+ notepad_content = gr.State("") # For notepad feature
1184
+ copied_texts = gr.State(set()) # Track copied texts to prevent duplicates
1185
+
1186
+ # ===== HEADER =====
1187
+ with gr.Row(elem_classes=["header-container"]):
1188
+ gr.HTML("""
1189
+ <div style="display: flex; align-items: center; gap: 16px;">
1190
+ <div style="width: 48px; height: 48px; border-radius: 12px; background: linear-gradient(135deg, #34d399 0%, #10b981 100%); display: flex; align-items: center; justify-content: center; box-shadow: 0 0 20px rgba(52, 211, 153, 0.3);">
1191
+ <span style="font-size: 28px;">πŸ’</span>
1192
+ </div>
1193
+ <div>
1194
+ <h1 style="margin: 0; font-size: 1.5rem; font-weight: 700; color: #f8fafc; letter-spacing: -0.5px;">
1195
+ MonkeyMind
1196
+ </h1>
1197
+ <div style="display: flex; align-items: center; gap: 8px;">
1198
+ <span style="width: 8px; height: 8px; border-radius: 50%; background: #34d399; box-shadow: 0 0 10px #34d399;"></span>
1199
+ <p style="margin: 0; font-size: 0.8rem; color: #94a3b8; font-family: 'JetBrains Mono', monospace;">AGENT ACTIVE</p>
1200
+ </div>
1201
+ </div>
1202
+ </div>
1203
+ """)
1204
+
1205
+ # ===== APP DESCRIPTION =====
1206
+ gr.Markdown("""
1207
+ > **πŸ’ MonkeyMind** is your Knowledge Transfer & RAG Agent. Analyze GitHub repos, local projects, or YouTube videos
1208
+ > to build a personal knowledge base. Chat with your sources using AI-powered retrieval.
1209
+ >
1210
+ > **Quick Start:** Paste a GitHub URL β†’ Click **Analyze** β†’ Click **Index** β†’ Start chatting!
1211
+ > Bookmark important sources to access them anytime.
1212
+ """)
1213
+
1214
+ # ===== MAIN LAYOUT: 1/3 Left Panel + 2/3 Right Panel =====
1215
+ with gr.Row():
1216
+ # ===== LEFT PANEL: Data Sources + Bookmarks =====
1217
+ with gr.Column(scale=1, min_width=350):
1218
+
1219
+ # Data Sources Section
1220
+ gr.Markdown("### πŸ“‘ Data Ingestion")
1221
+
1222
+ # Source Type Selector (pill-style tabs)
1223
+ source_type = gr.Radio(
1224
+ choices=["πŸ”— GitHub", "πŸ“ Local", "πŸŽ₯ YouTube"],
1225
+ value="πŸ”— GitHub",
1226
+ label="",
1227
+ container=False,
1228
+ interactive=True
1229
+ )
1230
+
1231
+ # Dynamic source input based on selection
1232
+ with gr.Group(visible=True) as github_group:
1233
+ gr.Markdown("*Paste a GitHub repo URL and click **Analyze** to extract docs. Then **Index** to enable RAG chat. You can see retrieved contents in the **Preview** tab on the right.*")
1234
+ github_url = gr.Textbox(
1235
+ label="Repository URL",
1236
+ placeholder="https://github.com/username/repo",
1237
+ show_label=True,
1238
+ )
1239
+ github_analyze_btn = gr.Button("πŸ” Analyze Repository", variant="secondary")
1240
+ github_index_btn = gr.Button("⚑ Index for RAG", variant="primary")
1241
+ github_status = gr.Markdown("Ready to analyze.", elem_classes=["status-pending"])
1242
+ github_bookmark_btn = gr.Button("πŸ”– Bookmark & Save to Knowledge Base", variant="secondary")
1243
+ gr.Markdown("---")
1244
+ gr.Markdown("**πŸ“ Notepad** *(copy useful info here)*")
1245
+ github_notepad = gr.Textbox(
1246
+ label="",
1247
+ placeholder="Paste or write notes here...",
1248
+ lines=3,
1249
+ container=False,
1250
+ show_copy_button=True,
1251
+ )
1252
+ with gr.Row():
1253
+ github_notepad_download = gr.DownloadButton("πŸ“₯ Download as .md", variant="secondary", size="sm")
1254
+
1255
+ with gr.Group(visible=False) as local_group:
1256
+ gr.Markdown("*Upload a project folder. Irrelevant files are auto-filtered. You can see retrieved contents in the **Preview** tab on the right.*")
1257
+ local_folder = gr.File(
1258
+ label="Upload Project Folder",
1259
+ file_count="directory",
1260
+ type="filepath",
1261
+ )
1262
+ local_analyze_btn = gr.Button("πŸ” Analyze Project", variant="secondary")
1263
+ local_index_btn = gr.Button("⚑ Index for RAG", variant="primary")
1264
+ local_status = gr.Markdown("Ready to analyze.", elem_classes=["status-pending"])
1265
+ local_bookmark_btn = gr.Button("πŸ”– Bookmark & Save to Knowledge Base", variant="secondary")
1266
+ gr.Markdown("---")
1267
+ gr.Markdown("**πŸ“ Notepad** *(copy useful info here)*")
1268
+ local_notepad = gr.Textbox(
1269
+ label="",
1270
+ placeholder="Paste or write notes here...",
1271
+ lines=3,
1272
+ container=False,
1273
+ show_copy_button=True,
1274
+ )
1275
+ with gr.Row():
1276
+ local_notepad_download = gr.DownloadButton("πŸ“₯ Download as .md", variant="secondary", size="sm")
1277
+
1278
+ with gr.Group(visible=False) as youtube_group:
1279
+ gr.Markdown("*Paste a YouTube video URL to extract and analyze the transcript. You can see retrieved contents in the **Preview** tab on the right.*")
1280
+ youtube_url = gr.Textbox(
1281
+ label="Video URL",
1282
+ placeholder="https://www.youtube.com/watch?v=...",
1283
+ )
1284
+ youtube_analyze_btn = gr.Button("πŸ” Analyze Video", variant="secondary")
1285
+ youtube_index_btn = gr.Button("⚑ Index for RAG", variant="primary")
1286
+ youtube_status = gr.Markdown("Ready to analyze.", elem_classes=["status-pending"])
1287
+ youtube_bookmark_btn = gr.Button("πŸ”– Bookmark & Save to Knowledge Base", variant="secondary")
1288
+ gr.Markdown("---")
1289
+ gr.Markdown("**πŸ“ Notepad** *(copy useful info here)*")
1290
+ youtube_notepad = gr.Textbox(
1291
+ label="",
1292
+ placeholder="Paste or write notes here...",
1293
+ lines=3,
1294
+ container=False,
1295
+ show_copy_button=True,
1296
+ )
1297
+ with gr.Row():
1298
+ youtube_notepad_download = gr.DownloadButton("πŸ“₯ Download as .md", variant="secondary", size="sm")
1299
+
1300
+ # Source type switching logic
1301
+ def switch_source(choice):
1302
+ return (
1303
+ gr.Group(visible=("GitHub" in choice)),
1304
+ gr.Group(visible=("Local" in choice)),
1305
+ gr.Group(visible=("YouTube" in choice)),
1306
+ )
1307
+
1308
+ source_type.change(
1309
+ fn=switch_source,
1310
+ inputs=[source_type],
1311
+ outputs=[github_group, local_group, youtube_group],
1312
+ )
1313
+
1314
+ gr.Markdown("---")
1315
+
1316
+ # Bookmarks Quick Access Section
1317
+ gr.Markdown("### 🧠 Knowledge Base")
1318
+ gr.Markdown("*Select sources to use for chat. Multiple selections allowed.*")
1319
+
1320
+ # Use CheckboxGroup for multi-select
1321
+ bookmarks_checkboxes = gr.CheckboxGroup(
1322
+ label="Active Sources",
1323
+ choices=[],
1324
+ value=[],
1325
+ interactive=True,
1326
+ info="Check sources to include in chat context"
1327
+ )
1328
+
1329
+ # Keep dropdown for compatibility (hidden, used internally)
1330
+ bookmarks_dropdown = gr.Dropdown(
1331
+ label="",
1332
+ choices=[],
1333
+ value=None,
1334
+ interactive=True,
1335
+ visible=False,
1336
+ )
1337
+
1338
+ with gr.Row():
1339
+ refresh_bookmarks_btn = gr.Button("πŸ”„ Refresh", variant="secondary", size="sm", scale=1)
1340
+ view_all_btn = gr.Button("πŸ“‹ View All", variant="secondary", size="sm", scale=1)
1341
+
1342
+ # Bookmark info display
1343
+ bookmark_info = gr.Markdown(
1344
+ value="*No sources selected. Bookmark repos to add them here.*",
1345
+ elem_classes=["info-box"]
1346
+ )
1347
+
1348
+ # ===== RIGHT PANEL: Chat & Preview =====
1349
+ with gr.Column(scale=2, min_width=500):
1350
+
1351
+ # Chat vs Preview Toggle
1352
+ right_panel_mode = gr.Radio(
1353
+ choices=["πŸ’¬ Chat & RAG", "πŸ“„ Preview"],
1354
+ value="πŸ’¬ Chat & RAG",
1355
+ label="",
1356
+ container=False,
1357
+ )
1358
+
1359
+ # Chat Interface
1360
+ with gr.Group(visible=True) as chat_panel:
1361
+ with gr.Group(elem_classes=["box-container"]):
1362
+ gr.Markdown("### πŸ’ Knowledge Assistant")
1363
+ gr.Markdown("*Hover over messages to see copy icon. Use toggles below to augment with web/wiki search.*")
1364
+
1365
+ chatbot_kwargs = dict(
1366
+ value=[],
1367
+ height=450,
1368
+ show_label=False,
1369
+ avatar_images=["images/user.png", "images/monkey.png"],
1370
+ elem_classes=["chat-container"],
1371
+ type="messages",
1372
+ )
1373
+
1374
+ chatbot = gr.Chatbot(**chatbot_kwargs)
1375
+
1376
+ # Toolbar row: Web Search, Wiki Search (Clear Chat removed)
1377
+ with gr.Row():
1378
+ # clear_chat_btn removed as requested
1379
+ web_search_toggle = gr.Checkbox(
1380
+ label="🌐 Web Search",
1381
+ value=False,
1382
+ interactive=True,
1383
+ )
1384
+ wiki_search_toggle = gr.Checkbox(
1385
+ label="πŸ“š Wikipedia",
1386
+ value=False,
1387
+ interactive=True,
1388
+ )
1389
+
1390
+ with gr.Row():
1391
+ question_box = gr.Textbox(
1392
+ label="",
1393
+ placeholder="Ask anything about your indexed sources...",
1394
+ lines=1,
1395
+ scale=5,
1396
+ container=False,
1397
+ )
1398
+ send_btn = gr.Button("Send", variant="primary", scale=1)
1399
+
1400
+ gr.Examples(
1401
+ examples=[
1402
+ "Summarize the main architecture patterns",
1403
+ "What are the key dependencies?",
1404
+ "Explain the core functionality",
1405
+ "What patterns can I reuse?",
1406
+ ],
1407
+ inputs=question_box,
1408
+ label="Quick Questions"
1409
+ )
1410
+
1411
+ # ===== EXPERIMENTAL LAB (Collapsible) - Moved here =====
+ with gr.Group(elem_classes=["box-container"]):
+ gr.Markdown("### 🧪 Experimental Lab")
+ gr.Markdown("Use this lab to prototype small apps based on your knowledge base.")
+ with gr.Accordion("Open Lab", open=False):
+ gr.Markdown("*The agent generates Gradio code and tests it in a sandbox.*")
+ with gr.Row():
+ with gr.Column(scale=1):
+ gr.Markdown("### 🎯 Build an Experiment")
+ lab_intention = gr.Textbox(
+ label="What do you want to build?",
+ placeholder="e.g., A Gradio app that visualizes patterns from a Knowledge Transfer report.",
+ lines=3,
+ )
+ lab_report_dropdown = gr.Dropdown(
+ label="Reference Material (bookmarked report)",
+ choices=_list_knowledge_report_choices(),
+ value=None,
+ interactive=True,
+ info="Select a Knowledge Transfer report as context"
+ )
+ with gr.Row():
+ lab_refresh_reports_btn = gr.Button("🔄 Refresh", variant="secondary", size="sm")
+ lab_start_btn = gr.Button("▶️ Start Build", variant="primary", size="sm")
+
+ gr.Markdown("---")
+ gr.Markdown("**🔧 Fix Issues**")
+ lab_fix_instruction = gr.Textbox(
+ label="",
+ placeholder="Describe what needs to be fixed (e.g., 'The button click handler is not working')...",
+ lines=2,
+ container=False,
+ )
+ with gr.Row():
+ lab_fix_btn = gr.Button("🔧 Apply Fix", variant="secondary", size="sm")
+ lab_happy_btn = gr.Button("✅ Done", variant="secondary", size="sm")
+
+ lab_export_btn = gr.Button("📥 Export Code", variant="primary")
+ lab_download = gr.File(label="Download", visible=False)
+
+ with gr.Column(scale=2):
+ gr.Markdown("### 🔬 Experiment Output")
+ lab_output = gr.Markdown(
+ "Describe what you want to build, select a reference report from your bookmarks, then click **Start Build**.\n\n"
+ "If there are errors, describe the issue in the fix box and click **Apply Fix**."
+ )
+ lab_code_display = gr.Code(
+ label="Generated Code",
+ language="python",
+ visible=False,
+ )
+
+ # Preview Interface
+ with gr.Group(visible=False) as preview_panel:
+ gr.Markdown("### 📄 Document Preview")
+
+ with gr.Row():
+ with gr.Column(scale=1):
+ preview_source_info = gr.Markdown("""
+ **Source:** Not selected
+ **Status:** ⏳ Pending
+ **Chunks:** 0 vectors
+ """, elem_classes=["info-box"])
+ with gr.Column(scale=1, min_width=100):
+ with gr.Row():
+ preview_copy_btn = gr.Button("📋 Copy", variant="secondary", size="sm", scale=1)
+ preview_download_btn = gr.DownloadButton("📥 Download", variant="secondary", size="sm", scale=1)
+ preview_download_file = gr.File(visible=False)
+
+ preview_content = gr.Markdown(
+ value="Select a source and analyze it to see the preview here.",
+ elem_classes=["preview-card"]
+ )
+
+ # Panel switching logic
+ def switch_panel(choice):
+ return (
+ gr.Group(visible=("Chat" in choice)),
+ gr.Group(visible=("Preview" in choice)),
+ )
+
+ right_panel_mode.change(
+ fn=switch_panel,
+ inputs=[right_panel_mode],
+ outputs=[chat_panel, preview_panel],
+ )
+
+ gr.Markdown("---")
+
+
+
+ # ===== HIDDEN STATE COMPONENTS FOR DOWNLOADS =====
+ github_download = gr.File(label="Download", visible=False)
+ local_download = gr.File(label="Download", visible=False)
+ youtube_download = gr.File(label="Download", visible=False)
+
+ # ===== EVENT HANDLERS =====
+
+ # GitHub handlers
+ github_analyze_btn.click(
+ fn=lambda: "⏳ **Analyzing repository...** Please wait.",
+ outputs=[github_status],
+ ).then(
+ fn=run_github_ingestion,
+ inputs=[github_url],
+ outputs=[preview_content, preview_source_info, github_state],
+ ).then(
+ fn=lambda: "✅ **Analysis complete!** Click **Index for RAG** to enable chat.",
+ outputs=[github_status],
+ )
+
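+ # Status wrappers: normalize the result of the index_* helpers so the status banner always reports the chunk count.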
+ def index_github_with_status(state):
+ status, new_state = index_github_repo(state)
+ chunks = new_state.get("vector_chunks", 0) if new_state else 0
+ if "✅" in status or chunks > 0:
+ return f"✅ **Indexed {chunks} vector chunks.** Ready for RAG queries!", new_state
+ return status, new_state
+
+ def index_local_with_status(state):
+ status, new_state = index_local_repo(state)
+ chunks = new_state.get("vector_chunks", 0) if new_state else 0
+ if "✅" in status or chunks > 0:
+ return f"✅ **Indexed {chunks} vector chunks.** Ready for RAG queries!", new_state
+ return status, new_state
+
+ def index_youtube_with_status(state):
+ status, new_state = index_youtube_video(state)
+ chunks = new_state.get("vector_chunks", 0) if new_state else 0
+ if "✅" in status or chunks > 0:
+ return f"✅ **Indexed {chunks} transcript chunks.** Ready for RAG queries!", new_state
+ return status, new_state
+
+ github_index_btn.click(
+ fn=lambda: "⏳ **Indexing...** Building vector embeddings.",
+ outputs=[github_status],
+ ).then(
+ fn=index_github_with_status,
+ inputs=[github_state],
+ outputs=[github_status, github_state],
+ )
+
+ def bookmark_with_refresh(state):
+ status, new_state, dropdown = bookmark_github_repo(state)
+ choices, meta = get_dropdown_options()
+ return (
+ "🔖 **Bookmarked!** Added to Knowledge Base for future chat sessions.",
+ new_state,
+ gr.Dropdown(choices=choices, value=None),
+ gr.CheckboxGroup(choices=choices, value=[]),
+ meta
+ )
+
+ github_bookmark_btn.click(
+ fn=bookmark_with_refresh,
+ inputs=[github_state],
+ outputs=[github_status, github_state, bookmarks_dropdown, bookmarks_checkboxes, bookmarks_metadata],
+ )
+
+ # Local handlers
+ local_analyze_btn.click(
+ fn=lambda: "⏳ **Analyzing project...** Please wait.",
+ outputs=[local_status],
+ ).then(
+ fn=run_local_repo_ingestion,
+ inputs=[local_folder],
+ outputs=[preview_content, preview_source_info, local_state],
+ ).then(
+ fn=lambda: "✅ **Analysis complete!** Click **Index for RAG** to enable chat.",
+ outputs=[local_status],
+ )
+
+ local_index_btn.click(
+ fn=lambda: "⏳ **Indexing...** Building vector embeddings.",
+ outputs=[local_status],
+ ).then(
+ fn=index_local_with_status,
+ inputs=[local_state],
+ outputs=[local_status, local_state],
+ )
+
+ def bookmark_local_with_refresh(state):
+ status, new_state, dropdown = bookmark_local_repo(state)
+ choices, meta = get_dropdown_options()
+ return (
+ "🔖 **Bookmarked!** Added to Knowledge Base for future chat sessions.",
+ new_state,
+ gr.Dropdown(choices=choices, value=None),
+ gr.CheckboxGroup(choices=choices, value=[]),
+ meta
+ )
+
+ local_bookmark_btn.click(
+ fn=bookmark_local_with_refresh,
+ inputs=[local_state],
+ outputs=[local_status, local_state, bookmarks_dropdown, bookmarks_checkboxes, bookmarks_metadata],
+ )
+
+ # YouTube handlers
+ youtube_analyze_btn.click(
+ fn=lambda: "⏳ **Fetching transcript...** Please wait.",
+ outputs=[youtube_status],
+ ).then(
+ fn=run_youtube_ingestion,
+ inputs=[youtube_url],
+ outputs=[preview_content, preview_source_info, youtube_state],
+ ).then(
+ fn=lambda: "✅ **Analysis complete!** Click **Index for RAG** to enable chat.",
+ outputs=[youtube_status],
+ )
+
+ youtube_index_btn.click(
+ fn=lambda: "⏳ **Indexing...** Building vector embeddings.",
+ outputs=[youtube_status],
+ ).then(
+ fn=index_youtube_with_status,
+ inputs=[youtube_state],
+ outputs=[youtube_status, youtube_state],
+ )
+
+ def bookmark_youtube_with_refresh(state):
+ status, new_state, dropdown = bookmark_youtube_video(state)
+ choices, meta = get_dropdown_options()
+ return (
+ "🔖 **Bookmarked!** Added to Knowledge Base for future chat sessions.",
+ new_state,
+ gr.Dropdown(choices=choices, value=None),
+ gr.CheckboxGroup(choices=choices, value=[]),
+ meta
+ )
+
+ youtube_bookmark_btn.click(
+ fn=bookmark_youtube_with_refresh,
+ inputs=[youtube_state],
+ outputs=[youtube_status, youtube_state, bookmarks_dropdown, bookmarks_checkboxes, bookmarks_metadata],
+ )
+
+ # Chat handlers
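+ # Note: the web/wiki search toggles defined above are not included in this handler's inputs.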
+ def handle_chat_with_history(question, history, github_s, local_s, youtube_s, selected_sources, meta):
+ # Use first selected source from checkboxes, or fall back to indexed sources
+ bookmark = selected_sources[0] if selected_sources else None
+ answer = answer_chat_question(question, github_s, local_s, youtube_s, bookmark, meta)
+ history = history or []
+ history.append({"role": "user", "content": question})
+ history.append({"role": "assistant", "content": answer})
+ return history, ""
+
+ send_btn.click(
+ fn=handle_chat_with_history,
+ inputs=[question_box, chatbot, github_state, local_state, youtube_state, bookmarks_checkboxes, bookmarks_metadata],
+ outputs=[chatbot, question_box],
+ )
+
+ question_box.submit(
+ fn=handle_chat_with_history,
+ inputs=[question_box, chatbot, github_state, local_state, youtube_state, bookmarks_checkboxes, bookmarks_metadata],
+ outputs=[chatbot, question_box],
+ )
+
+
+
+ # Chatbot Like/Dislike Handler
+ def handle_chatbot_like(data: gr.LikeData):
+ # Placeholder for future feedback logging
+ print(f"User feedback: {'Liked' if data.liked else 'Disliked'} message index {data.index}")
+ return None
+
+ chatbot.like(
+ fn=handle_chatbot_like,
+ outputs=None
+ )
+
+ # Bookmark handlers - refresh both dropdown and checkboxes
+ def refresh_all_bookmarks():
+ choices, meta = get_dropdown_options()
+ return (
+ gr.Dropdown(choices=choices, value=None),
+ gr.CheckboxGroup(choices=choices, value=[]),
+ meta
+ )
+
+ refresh_bookmarks_btn.click(
+ fn=refresh_all_bookmarks,
+ outputs=[bookmarks_dropdown, bookmarks_checkboxes, bookmarks_metadata],
+ )
+
+ # View All button - show bookmark details
+ def view_all_bookmarks(meta):
+ if not meta:
+ return "*No bookmarks found. Analyze and bookmark repositories to see them here.*"
+ lines = ["**📚 All Bookmarked Sources:**\n"]
+ for m in meta:
+ name = m.get("repo_name", "Unknown")
+ date = m.get("last_pulled_display", "--")
+ chunks = m.get("vector_chunks", 0)
+ lines.append(f"- **{name}** — {date} — {chunks} chunks")
+ return "\n".join(lines)
+
+ view_all_btn.click(
+ fn=view_all_bookmarks,
+ inputs=[bookmarks_metadata],
+ outputs=[bookmark_info],
+ )
+
+ # Update bookmark info when checkboxes change
+ def update_checkbox_info(selected, meta):
+ if not selected:
+ return "*No sources selected. Check sources above to include in chat.*"
+ lines = [f"**{len(selected)} source(s) selected:**\n"]
+ for label in selected:
+ m = find_metadata_by_label(label, meta or [])
+ if m:
+ lines.append(f"- {m.get('repo_name', label)} ({m.get('vector_chunks', 0)} chunks)")
+ return "\n".join(lines)
+
+ bookmarks_checkboxes.change(
+ fn=update_checkbox_info,
+ inputs=[bookmarks_checkboxes, bookmarks_metadata],
+ outputs=[bookmark_info],
+ )
+
+ # Notepad download handlers
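+ # Each DownloadButton doubles as its own output: the temp-file path returned by the handler becomes the file it serves.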
+ def download_notepad_as_md(content):
+ if not content or not content.strip():
+ return None
+ import tempfile
+ with tempfile.NamedTemporaryFile(mode='w', suffix='.md', delete=False, encoding='utf-8') as f:
+ f.write(content)
+ return f.name
+
+ github_notepad_download.click(
+ fn=download_notepad_as_md,
+ inputs=[github_notepad],
+ outputs=[github_notepad_download],
+ )
+
+ local_notepad_download.click(
+ fn=download_notepad_as_md,
+ inputs=[local_notepad],
+ outputs=[local_notepad_download],
+ )
+
+ youtube_notepad_download.click(
+ fn=download_notepad_as_md,
+ inputs=[youtube_notepad],
+ outputs=[youtube_notepad_download],
+ )
+
+ # Preview Copy Handler (JS)
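+ # With fn=None, the js snippet runs entirely client-side and copies the Markdown source string to the clipboard.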
+ preview_copy_btn.click(
+ fn=None,
+ inputs=[preview_content],
+ js="(content) => { navigator.clipboard.writeText(content); return 'Copied!'; }",
+ )
+
+ # Preview Download Handler
+ preview_download_btn.click(
+ fn=download_notepad_as_md, # Reusing the md download function
+ inputs=[preview_content],
+ outputs=[preview_download_btn],
+ )
+
+ # Lab handlers with improved output
+ def run_lab_with_code(intention, report):
+ result = run_experimental_lab(intention, report)
+ # Extract code if present in result
+ if "```python" in result:
+ code_start = result.find("```python") + 9
+ code_end = result.find("```", code_start)
+ code = result[code_start:code_end].strip() if code_end > code_start else ""
+ return result, gr.Code(value=code, visible=True)
+ return result, gr.Code(visible=False)
+
+ lab_start_btn.click(
+ fn=run_lab_with_code,
+ inputs=[lab_intention, lab_report_dropdown],
+ outputs=[lab_output, lab_code_display],
+ )
+
+ def fix_lab_with_instruction(intention, report, fix_instruction):
+ # Pass the fix instruction to the fix function
+ combined = f"{intention}\n\nFIX REQUEST: {fix_instruction}" if fix_instruction else intention
+ return lab_fix_bugs(combined, report)
+
+ lab_fix_btn.click(
+ fn=fix_lab_with_instruction,
+ inputs=[lab_intention, lab_report_dropdown, lab_fix_instruction],
+ outputs=[lab_output],
+ )
+
+ lab_happy_btn.click(
+ fn=lab_mark_happy,
+ inputs=[lab_intention, lab_report_dropdown],
+ outputs=[lab_output],
+ )
+
+ # Export lab code to file
+ def export_lab_code(code_content):
+ if not code_content:
+ return None
+ import tempfile
+ with tempfile.NamedTemporaryFile(mode='w', suffix='.py', delete=False, encoding='utf-8') as f:
+ f.write(code_content)
+ return f.name
+
+ lab_export_btn.click(
+ fn=export_lab_code,
+ inputs=[lab_code_display],
+ outputs=[lab_download],
+ ).then(
+ fn=lambda: gr.File(visible=True),
+ outputs=[lab_download],
+ )
+
+ lab_refresh_reports_btn.click(
+ fn=_refresh_lab_reports_dropdown,
+ outputs=[lab_report_dropdown],
+ )
+
+ # Load bookmarks on startup (refresh both dropdown and checkboxes)
+ demo.load(
+ fn=refresh_all_bookmarks,
+ outputs=[bookmarks_dropdown, bookmarks_checkboxes, bookmarks_metadata],
+ )
+
+ return demo, (app_theme if IS_GRADIO_V6 else None), (custom_css if IS_GRADIO_V6 else None)


 if __name__ == "__main__":
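+ # build_interface() returns the theme/CSS only when IS_GRADIO_V6; otherwise both are None and launch() gets just share=False.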
+ demo, app_theme, custom_css = build_interface()
+ launch_kwargs = {"share": False}
+ if IS_GRADIO_V6:
+ launch_kwargs.update(theme=app_theme, css=custom_css)
+ demo.launch(**launch_kwargs)