from datetime import datetime, timezone
from pathlib import Path
import os
import re
import shutil

import gradio as gr

from agent import (
    analyze_github_repo,
    analyze_local_repo,
    build_experiment_from_report,
    build_repo_vector_store,
    fetch_youtube_transcript,
    generate_youtube_study_notes,
    rag_answer_from_store,
    summarize_youtube_chapters,
)
from bookmarks import (
    bookmark_repo_from_analysis,
    find_metadata_by_label,
    get_cache_dirs,
    get_dropdown_options,
)

# File extensions and folders to ignore for local uploads
IGNORE_PATTERNS = {
    'folders': {
        '__pycache__', '.git', '.svn', '.hg', 'node_modules',
        'venv', 'env', '.venv', '.env', 'dist', 'build',
        '.idea', '.vscode', '.pytest_cache', '.mypy_cache',
        'coverage', '.coverage', 'htmlcov', '.tox', 'eggs',
        '.eggs', '*.egg-info', '.DS_Store'
    },
    'extensions': {
        '.pyc', '.pyo', '.pyd', '.so', '.dll', '.dylib',
        '.class', '.o', '.obj', '.exe', '.bin', '.lock',
        '.log', '.tmp', '.temp', '.cache', '.bak', '.swp',
        '.swo', '.DS_Store', '.gitignore'
    }
}

def _should_ignore_path(path: Path) -> bool:
    """Check if a path should be ignored during local folder processing."""
    for part in path.parts:
        if part in IGNORE_PATTERNS['folders']:
            return True
        # '*.egg-info' is a glob pattern, so the plain set lookup above can
        # never match it; handle that entry explicitly.
        if part.endswith('.egg-info'):
            return True
        # Skip hidden files and folders. This also covers dotfiles such as
        # '.gitignore' and '.DS_Store', whose Path.suffix is empty.
        if part.startswith('.') and part not in {'.', '..'}:
            return True
    if path.suffix.lower() in IGNORE_PATTERNS['extensions']:
        return True
    return False
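
# Illustrative only (not wired into the UI): a tiny self-check showing how the
# filter above treats typical upload paths. The sample paths are hypothetical.
def _demo_ignore_filter() -> None:
    samples = {
        "repo/__pycache__/mod.cpython-311.pyc": True,   # ignored folder
        "repo/.venv/lib/site.py": True,                 # hidden folder
        "repo/build.log": True,                         # ignored extension
        "repo/src/app.py": False,                       # kept
    }
    for raw, expected in samples.items():
        assert _should_ignore_path(Path(raw)) is expected, raw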

KNOWLEDGE_TRANSFER_ROOT = Path("Knowledge Transfer")


def _is_gradio_v6_or_newer() -> bool:
    """Return True if the installed Gradio major version is >= 6."""
    version_str = getattr(gr, "__version__", "0")
    try:
        major = int(version_str.split(".")[0])
        return major >= 6
    except (ValueError, IndexError):
        return False


IS_GRADIO_V6 = _is_gradio_v6_or_newer()

def run_github_ingestion(repo_url: str):
    """Analyze GitHub repository without indexing."""
    repo_url = (repo_url or "").strip()
    if not repo_url:
        warning = "⚠️ Please paste a public GitHub repository URL to begin."
        source_info = "**Source:** Not selected\n**Status:** ⏳ Pending\n**Chunks:** 0 vectors"
        return warning, source_info, {
            "analysis": None,
            "vector_dir": "",
            "vector_chunks": 0,
            "summary_base": [],
        }
    result = analyze_github_repo(repo_url)
    if "error" in result:
        error_msg = f"❌ {result['error']}"
        source_info = f"**Source:** {repo_url}\n**Status:** ❌ Error\n**Chunks:** 0 vectors"
        return error_msg, source_info, {
            "analysis": None,
            "vector_dir": "",
            "vector_chunks": 0,
            "summary_base": [],
        }
    docs = result.get("documentation", [])
    repo_name = result.get("repo_name", repo_url)
    timestamp = datetime.now(timezone.utc).strftime("%d %b %Y, %H:%M UTC")
    # Source info for preview panel
    source_info = f"""**Source:** GitHub Repository
**Repository:** {repo_name}
**Status:** ✅ Analyzed
**Documents:** {len(docs)} files
**Analyzed:** {timestamp}"""
    # Document preview content
    preview_sections = []
    for doc in docs[:5]:
        content = (doc.get("content") or "").strip()
        if not content:
            continue
        snippet = content[:600]
        if len(content) > 600:
            snippet = snippet.rstrip() + " ..."
        preview_sections.append(
            f"### 📄 {doc.get('path', 'document')}\n\n{snippet}"
        )
    preview_content = (
        "\n\n---\n\n".join(preview_sections)
        if preview_sections
        else "*No textual documentation snippets were found.*"
    )
    state_payload = {
        "analysis": result,
        "vector_dir": "",
        "vector_chunks": 0,
        "summary_base": [repo_name, str(len(docs))],
        "processed_timestamp": timestamp,
        "indexed": False,
    }
    return preview_content, source_info, state_payload
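
# The three ingestion flows in this module (GitHub, local, YouTube) share a
# small state-payload contract that Gradio threads between callbacks. A sketch
# of its shape right after a successful analysis (values hypothetical):
#
#     {
#         "analysis": {...},        # raw analyzer result
#         "vector_dir": "",         # filled in by the index step
#         "vector_chunks": 0,
#         "summary_base": ["sample-repo", "3"],
#         "processed_timestamp": "01 Jan 2025, 00:00 UTC",
#         "indexed": False,
#     }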

def index_github_repo(state_payload: dict | None):
    """Index the analyzed GitHub repository for RAG."""
    analysis_data = (state_payload or {}).get("analysis") if state_payload else None
    if not analysis_data:
        return "⚠️ Run analysis before indexing.", state_payload
    if state_payload.get("indexed"):
        return "✅ Repository already indexed and ready for RAG queries.", state_payload
    docs = analysis_data.get("documentation", [])
    if not docs:
        # Bail out before touching the cache so an empty analysis cannot
        # wipe a previously built vector store.
        return "⚠️ No documentation found to index.", state_payload
    repo_name = analysis_data.get("repo_name", "repo")
    repo_url = analysis_data.get("repo_url", "")
    slug, cache_dir, cache_vector_dir = get_cache_dirs(repo_url, repo_name)
    if cache_dir.exists():
        shutil.rmtree(cache_dir)
    cache_dir.mkdir(parents=True, exist_ok=True)
    _, vector_chunks = build_repo_vector_store(docs, persist_path=cache_vector_dir)
    new_state = {
        **state_payload,
        "vector_dir": str(cache_vector_dir),
        "vector_chunks": vector_chunks,
        "indexed": True,
    }
    return f"✅ Indexed {vector_chunks} vector chunks. Ready for RAG queries!", new_state

def bookmark_github_repo(state_payload: dict | None):
    """Bookmark and index the GitHub repository permanently."""
    analysis_data = (state_payload or {}).get("analysis") if state_payload else None
    if not analysis_data:
        return "⚠️ Run analysis before bookmarking.", state_payload, gr.Dropdown()
    docs = analysis_data.get("documentation", [])
    if not docs:
        return "⚠️ No documentation to bookmark.", state_payload, gr.Dropdown()
    repo_url = analysis_data.get("repo_url") or analysis_data.get("repo_name")
    # Build the vector store if the index step has not run yet
    vector_dir = state_payload.get("vector_dir") if state_payload else ""
    if not vector_dir:
        repo_name = analysis_data.get("repo_name", "repo")
        slug, cache_dir, cache_vector_dir = get_cache_dirs(repo_url, repo_name)
        if cache_dir.exists():
            shutil.rmtree(cache_dir)
        cache_dir.mkdir(parents=True, exist_ok=True)
        _, chunk_count = build_repo_vector_store(docs, persist_path=cache_vector_dir)
        vector_dir = str(cache_vector_dir)
    else:
        chunk_count = state_payload.get("vector_chunks", 0)
    metadata = bookmark_repo_from_analysis(
        repo_url,
        analysis_data,
        prebuilt_vector_dir=Path(vector_dir) if vector_dir else None,
        prebuilt_chunks=chunk_count,
    )
    choices, _ = get_dropdown_options()
    dropdown_update = gr.Dropdown(
        choices=choices,
        value=metadata.dropdown_label,
        interactive=True,
    )
    new_state = {
        **state_payload,
        "vector_dir": vector_dir,
        "vector_chunks": chunk_count,
        "indexed": True,
    }
    return f"💾 Repository bookmarked on {metadata.last_pulled_display}. Access it in the Chat tab!", new_state, dropdown_update

def run_youtube_ingestion(youtube_url: str):
    """Analyze YouTube video without indexing."""
    youtube_url = (youtube_url or "").strip()
    if not youtube_url:
        warning = "⚠️ Paste a YouTube video URL to begin."
        source_info = "**Source:** Not selected\n**Status:** ⏳ Pending\n**Chunks:** 0 vectors"
        return warning, source_info, {
            "analysis": None,
            "vector_dir": "",
            "vector_chunks": 0,
        }
    result = fetch_youtube_transcript(youtube_url)
    if "error" in result:
        error_msg = f"❌ {result['error']}"
        source_info = "**Source:** YouTube\n**Status:** ❌ Error\n**Chunks:** 0 vectors"
        return error_msg, source_info, {
            "analysis": None,
            "vector_dir": "",
            "vector_chunks": 0,
        }
    transcript = (result.get("raw_transcript") or "").strip()
    if not transcript:
        source_info = "**Source:** YouTube\n**Status:** ⚠️ No transcript\n**Chunks:** 0 vectors"
        return "⚠️ No transcript text was returned.", source_info, {"analysis": None}
    timestamp = datetime.now(timezone.utc).strftime("%d %b %Y, %H:%M UTC")
    video_url = result.get("url", youtube_url)
    lang = result.get("lang", "en")
    # Source info for preview panel
    source_info = f"""**Source:** YouTube Video
**URL:** {video_url}
**Language:** {lang}
**Status:** ✅ Analyzed
**Analyzed:** {timestamp}"""
    # Generate chapter summaries
    chapters = summarize_youtube_chapters(transcript, url=video_url)
    # Preview content with chapters
    preview_content = f"""### 📺 Video Transcript Analysis

{chapters}

---

### 📝 Transcript Preview

{transcript[:2000]}{"..." if len(transcript) > 2000 else ""}
"""
    state_payload = {
        "analysis": {
            "transcript": transcript,
            "url": video_url,
            "lang": lang,
            "chapters": chapters,
        },
        "vector_dir": "",
        "vector_chunks": 0,
        "indexed": False,
    }
    return preview_content, source_info, state_payload

def index_youtube_video(state_payload: dict | None):
    """Index YouTube transcript for RAG."""
    analysis_data = (state_payload or {}).get("analysis") if state_payload else None
    if not analysis_data:
        return "⚠️ Run analysis before indexing.", state_payload
    if state_payload.get("indexed"):
        return "✅ Video already indexed and ready for RAG queries.", state_payload
    transcript = analysis_data.get("transcript", "")
    if not transcript:
        return "⚠️ No transcript found to index.", state_payload
    # Create a pseudo-document from the transcript
    docs = [{
        "path": "transcript.txt",
        "content": transcript,
        "type": "transcript",
    }]
    url = analysis_data.get("url", "youtube")
    slug, cache_dir, cache_vector_dir = get_cache_dirs(url, "youtube")
    if cache_dir.exists():
        shutil.rmtree(cache_dir)
    cache_dir.mkdir(parents=True, exist_ok=True)
    _, chunk_count = build_repo_vector_store(docs, persist_path=cache_vector_dir)
    new_state = {
        **state_payload,
        "vector_dir": str(cache_vector_dir),
        "vector_chunks": chunk_count,
        "indexed": True,
    }
    return f"✅ Indexed {chunk_count} transcript chunks. Ready for RAG queries!", new_state

def bookmark_youtube_video(state_payload: dict | None):
    """Bookmark YouTube video - persists transcript to bookmarks system."""
    analysis_data = (state_payload or {}).get("analysis") if state_payload else None
    if not analysis_data:
        return "⚠️ Run analysis before bookmarking.", state_payload, gr.Dropdown()
    transcript = analysis_data.get("transcript", "")
    if not transcript:
        return "⚠️ No transcript found to bookmark.", state_payload, gr.Dropdown()
    video_url = analysis_data.get("url", "youtube-video")
    chapters = analysis_data.get("chapters", "")
    # Create a pseudo-analysis structure compatible with bookmark_repo_from_analysis
    pseudo_analysis = {
        "repo_name": f"YouTube: {video_url[:50]}",
        "repo_url": video_url,
        "documentation": [
            {
                "path": "transcript.txt",
                "content": transcript,
            },
            {
                "path": "chapters.md",
                "content": chapters,
            }
        ],
    }
    # Use the prebuilt vector store if the video was already indexed
    prebuilt_dir = None
    prebuilt_chunks = None
    if state_payload.get("indexed") and state_payload.get("vector_dir"):
        prebuilt_dir = Path(state_payload["vector_dir"])
        prebuilt_chunks = state_payload.get("vector_chunks", 0)
    metadata = bookmark_repo_from_analysis(
        video_url,
        pseudo_analysis,
        prebuilt_vector_dir=prebuilt_dir,
        prebuilt_chunks=prebuilt_chunks,
    )
    choices, _ = get_dropdown_options()
    dropdown_update = gr.Dropdown(choices=choices, value=metadata.dropdown_label)
    new_state = {
        **state_payload,
        "vector_dir": metadata.vector_dir,
        "vector_chunks": metadata.vector_chunks,
        "indexed": True,
        "bookmarked": True,
    }
    return f"📌 YouTube video bookmarked! {metadata.vector_chunks} chunks indexed.", new_state, dropdown_update

def generate_youtube_transfer_report(youtube_url: str):
    youtube_url = (youtube_url or "").strip()
    if not youtube_url:
        return "⚠️ Paste a YouTube video URL before generating a report."
    result = fetch_youtube_transcript(youtube_url)
    if "error" in result:
        return f"❌ {result['error']}"
    transcript = (result.get("raw_transcript") or "").strip()
    if not transcript:
        return "No transcript text was returned by the youtube-transcript MCP server; report generation was skipped."
    chapters = summarize_youtube_chapters(transcript, url=result.get("url", youtube_url))
    study_notes = generate_youtube_study_notes(chapters, url=result.get("url", youtube_url))
    generated_at = datetime.now(timezone.utc).strftime("%Y-%m-%d %H:%M:%S %Z")
    header_lines = [
        "# YouTube Knowledge Transfer Report",
        "",
        f"- Source: {result.get('url', youtube_url)}",
        f"- Language: {result.get('lang', 'en')}",
        f"- Generated at: {generated_at}",
    ]
    lines: list[str] = []
    lines.extend(header_lines)
    lines.append("")
    lines.append("## 1. Topic & Chapter Outline")
    lines.append("")
    lines.append(chapters)
    lines.append("")
    lines.append("## 2. Study & Interview Guidance")
    lines.append("")
    lines.append(study_notes)
    report_markdown = "\n".join(lines)
    root = _ensure_knowledge_root()
    youtube_root = root / "Youtube Video"
    youtube_root.mkdir(parents=True, exist_ok=True)
    slug = _slugify_name(result.get("url", youtube_url))
    ts = datetime.now(timezone.utc).strftime("%Y%m%d-%H%M%S")
    report_path = youtube_root / f"{slug}-youtube-knowledge-{ts}.md"
    report_path.write_text(report_markdown, encoding="utf-8")
    rel_path = report_path.relative_to(Path("."))
    return f"📄 YouTube knowledge transfer report written to `{rel_path}`."

def _ensure_knowledge_root() -> Path:
    KNOWLEDGE_TRANSFER_ROOT.mkdir(parents=True, exist_ok=True)
    return KNOWLEDGE_TRANSFER_ROOT


def _slugify_name(name: str) -> str:
    base = (name or "project").lower()
    safe = re.sub(r"[^a-z0-9-]+", "-", base).strip("-")
    return safe or "project"
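
# _slugify_name flattens URLs and titles into filesystem-safe slugs, e.g.:
#
#     _slugify_name("https://github.com/Example/My Repo")
#     # -> "https-github-com-example-my-repo"
#     _slugify_name("***")
#     # -> "project" (fallback when no usable characters remain)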

def generate_knowledge_transfer_report(state_payload: dict | None):
    analysis_data = (state_payload or {}).get("analysis") if state_payload else None
    if not analysis_data:
        return "⚠️ Run an analysis before generating a report."
    repo_name = analysis_data.get("repo_name") or "Project"
    repo_url = analysis_data.get("repo_url") or "local upload"
    docs = analysis_data.get("documentation") or []
    doc_count = len(docs)
    structure = analysis_data.get("structure") or []
    vector_dir = state_payload.get("vector_dir") if state_payload else ""
    vector_chunks = state_payload.get("vector_chunks", 0) if state_payload else 0
    summary_base = state_payload.get("summary_base", []) if state_payload else []
    processed_timestamp = state_payload.get("processed_timestamp") if state_payload else None
    generated_at = datetime.now(timezone.utc).strftime("%Y-%m-%d %H:%M:%S %Z")
    header_lines = [
        f"# Knowledge Transfer Report – {repo_name}",
        "",
        f"- Source: {repo_url}",
        f"- Generated at: {generated_at}",
        f"- Documentation files: {doc_count}",
        f"- Vector chunks: {vector_chunks}",
    ]
    if processed_timestamp:
        header_lines.append(f"- Last analysis run: {processed_timestamp}")
    overview_section = "\n".join(summary_base) if summary_base else "No high-level summary was captured during analysis."
    llm_summary_section = ""
    if vector_dir and vector_chunks:
        try:
            question = (
                "Provide a detailed knowledge transfer summary of this repository. "
                "Explain its purpose, main components, architecture, key dependencies, "
                "and patterns that would be reusable in other projects. "
                "Focus on actionable insights and how to extend or adapt this codebase."
            )
            llm_summary_section = rag_answer_from_store(Path(vector_dir), question, repo_summary=overview_section)
        except Exception as err:
            llm_summary_section = f"LLM summary unavailable due to error: {err}"
    else:
        llm_summary_section = "Vector store not available; the RAG-based summary was skipped."
    max_items = 80
    structure_snippet = "\n".join(structure[:max_items]) if structure else "No repository structure information was captured."
    doc_paths = [d.get("path", "") for d in docs][:max_items]
    docs_list_section = "\n".join(f"- {p}" for p in doc_paths) if doc_paths else "No documentation files were detected."
    lines: list[str] = []
    lines.extend(header_lines)
    lines.append("")
    lines.append("## 1. High-level Overview")
    lines.append("")
    lines.append(overview_section)
    lines.append("")
    lines.append("## 2. Repository Layout (snapshot)")
    lines.append("")
    lines.append("```")
    lines.append(structure_snippet)
    lines.append("```")
    lines.append("")
    lines.append("## 3. Documentation Files")
    lines.append("")
    lines.append(docs_list_section)
    lines.append("")
    lines.append("## 4. LLM Knowledge Summary")
    lines.append("")
    lines.append(llm_summary_section)
    lines.append("")
    lines.append("## 5. Notes for Future Reuse")
    lines.append("")
    lines.append(
        "Use this report as a starting point when designing new projects. "
        "Focus on reusing architecture patterns, utility modules, and any "
        "documented best practices or workflows."
    )
    report_markdown = "\n".join(lines)
    root = _ensure_knowledge_root()
    slug = _slugify_name(repo_name)
    ts = datetime.now(timezone.utc).strftime("%Y%m%d-%H%M%S")
    report_path = root / f"{slug}-knowledge-transfer-{ts}.md"
    report_path.write_text(report_markdown, encoding="utf-8")
    rel_path = report_path.relative_to(Path("."))
    return f"📄 Knowledge transfer report written to `{rel_path}`."

def _list_knowledge_report_choices() -> list[str]:
    root = _ensure_knowledge_root()
    reports = sorted(root.glob("*.md"))
    return [report.name for report in reports]


def _refresh_lab_reports_dropdown():
    return gr.Dropdown(
        label="Knowledge Transfer report (optional)",
        choices=_list_knowledge_report_choices(),
        value=None,
        interactive=True,
    )

def load_study_deck_from_report(report_name: str | None) -> str:
    if not report_name:
        return "Select a Knowledge Transfer report above to view its study deck-style summary."
    root = _ensure_knowledge_root()
    report_path = root / report_name
    if not report_path.exists():
        return f"Report `{report_name}` was not found in the Knowledge Transfer folder."
    try:
        raw = report_path.read_text(encoding="utf-8", errors="ignore")
    except OSError as err:
        return f"Unable to read report `{report_name}`: {err}"
    max_chars = 6000
    snippet = raw[:max_chars]
    if len(raw) > max_chars:
        snippet = snippet.rstrip() + "\n\n... (truncated)"
    return (
        f"### Study Deck · {report_name}\n\n"
        "Scroll through this condensed report to refresh yourself on the key concepts, "
        "architecture, and reusable patterns for this project.\n\n"
        f"```markdown\n{snippet}\n```"
    )

def _derive_local_repo_root(uploaded: str | list[str] | None) -> Path | None:
    """Given a directory-style file upload, infer the repository root directory.

    Gradio's File component with ``file_count="directory"`` returns a list of
    filepaths under the uploaded folder (or a single filepath). We compute the
    common parent directory and treat that as the repo root.
    """
    if not uploaded:
        return None
    if isinstance(uploaded, str):
        paths = [uploaded]
    else:
        paths = [p for p in uploaded if p]
    if not paths:
        return None
    try:
        common = os.path.commonpath(paths)
    except ValueError:
        return None
    root = Path(common)
    return root if root.exists() and root.is_dir() else None
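
# Sketch of the common-parent inference above, with hypothetical upload paths:
#
#     _derive_local_repo_root([
#         "/tmp/upload/myproj/src/app.py",
#         "/tmp/upload/myproj/README.md",
#     ])
#     # -> Path("/tmp/upload/myproj"), provided that directory exists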

def run_local_repo_ingestion(uploaded_folder):
    """Analyze local repository folder, filtering irrelevant files."""
    repo_root = _derive_local_repo_root(uploaded_folder)
    if not repo_root:
        warning = "⚠️ Upload a project folder before running analysis."
        source_info = "**Source:** Not selected\n**Status:** ⏳ Pending\n**Chunks:** 0 vectors"
        return warning, source_info, {
            "analysis": None,
            "vector_dir": "",
            "vector_chunks": 0,
            "summary_base": [],
        }
    # Pre-check: make sure at least one relevant file survives the ignore
    # filter. analyze_local_repo receives the folder root and performs its
    # own traversal, so the filtered list itself is only used for this check.
    if isinstance(uploaded_folder, list):
        filtered_files = [f for f in uploaded_folder if not _should_ignore_path(Path(f))]
        if not filtered_files:
            warning = "⚠️ No relevant files found after filtering."
            source_info = "**Source:** Local\n**Status:** ⚠️ No files\n**Chunks:** 0 vectors"
            return warning, source_info, {
                "analysis": None,
                "vector_dir": "",
                "vector_chunks": 0,
                "summary_base": [],
            }
    result = analyze_local_repo(str(repo_root))
    if "error" in result:
        error_msg = f"❌ {result['error']}"
        source_info = "**Source:** Local\n**Status:** ❌ Error\n**Chunks:** 0 vectors"
        return error_msg, source_info, {
            "analysis": None,
            "vector_dir": "",
            "vector_chunks": 0,
            "summary_base": [],
        }
    docs = result.get("documentation", [])
    repo_name = result.get("repo_name", repo_root.name)
    timestamp = datetime.now(timezone.utc).strftime("%d %b %Y, %H:%M UTC")
    # Source info for preview panel
    source_info = f"""**Source:** Local Project
**Folder:** {repo_name}
**Status:** ✅ Analyzed
**Documents:** {len(docs)} files
**Analyzed:** {timestamp}"""
    # Document preview content
    preview_sections = []
    for doc in docs[:5]:
        content = (doc.get("content") or "").strip()
        if not content:
            continue
        snippet = content[:600]
        if len(content) > 600:
            snippet = snippet.rstrip() + " ..."
        preview_sections.append(
            f"### 📄 {doc.get('path', 'document')}\n\n{snippet}"
        )
    preview_content = (
        "\n\n---\n\n".join(preview_sections)
        if preview_sections
        else "*No textual documentation snippets were found.*"
    )
    state_payload = {
        "analysis": result,
        "vector_dir": "",
        "vector_chunks": 0,
        "summary_base": [repo_name, str(len(docs))],
        "processed_timestamp": timestamp,
        "indexed": False,
    }
    return preview_content, source_info, state_payload

def index_local_repo(state_payload: dict | None):
    """Index the analyzed local repository for RAG (same logic as GitHub)."""
    return index_github_repo(state_payload)


def bookmark_local_repo(state_payload: dict | None):
    """Bookmark and index the local repository permanently (same logic as GitHub)."""
    return bookmark_github_repo(state_payload)

def _format_bookmark_info(metadata: dict | None) -> str:
    if not metadata:
        return (
            "No bookmarks yet. Process a repository in the *Process New Repository* tab, then bookmark it to enable RAG chat."
        )
    base = (
        f"### {metadata.get('repo_name', 'Saved Repository')}\n"
        f"- URL: {metadata.get('repo_url', 'N/A')}\n"
        f"- Last pulled: {metadata.get('last_pulled_display', '--/--/----')}\n"
        f"- Documentation files: {metadata.get('docs_count', 0)}\n"
        f"- Vector chunks: {metadata.get('vector_chunks', 0)}"
    )
    preview = (metadata.get("summary_preview") or "").strip()
    if not preview:
        return base
    max_len = 600
    if len(preview) > max_len:
        preview_display = preview[:max_len].rstrip() + " ..."
    else:
        preview_display = preview
    return f"{base}\n\n**Preview:**\n\n{preview_display}"

def _refresh_bookmarks(preselect: str | None = None):
    choices, metadata_list = get_dropdown_options()
    value = preselect if preselect and preselect in choices else (choices[0] if choices else None)
    dropdown_update = gr.Dropdown(
        choices=choices,
        value=value,
        interactive=bool(choices),
        label="Bookmarked repositories",
        allow_custom_value=True,
    )
    info = _format_bookmark_info(
        find_metadata_by_label(value, metadata_list) if value else None
    )
    return dropdown_update, metadata_list, info


def load_bookmarks_on_start():
    dropdown_update, metadata_list, info = _refresh_bookmarks()
    status = "Bookmarks loaded." if metadata_list else "No bookmarks saved yet."
    return dropdown_update, metadata_list, info, status


def _build_summary_from_base(base_lines: list[str], final_message: str) -> str:
    if not base_lines:
        return final_message
    return "\n".join(base_lines + ["", final_message])

def bookmark_current_repo(state_payload: dict | None):
    analysis_data = (state_payload or {}).get("analysis") if state_payload else None
    if not analysis_data or not analysis_data.get("documentation"):
        return (
            "⚠️ Run an analysis before bookmarking a repository.",
            gr.Dropdown(choices=[], value=None, interactive=False, label="Bookmarked repositories"),
            [],
            _format_bookmark_info(None),
            _build_summary_from_base(
                (state_payload or {}).get("summary_base", []),
                "⚠️ Bookmark failed because no analysis data is available.",
            ),
            state_payload,
        )
    repo_url = analysis_data.get("repo_url") or analysis_data.get("repo_name")
    vector_dir = state_payload.get("vector_dir") if state_payload else ""
    metadata = bookmark_repo_from_analysis(
        repo_url,
        analysis_data,
        prebuilt_vector_dir=Path(vector_dir) if vector_dir else None,
        prebuilt_chunks=state_payload.get("vector_chunks") if state_payload else None,
    )
    dropdown_update, metadata_list, info = _refresh_bookmarks(preselect=metadata.dropdown_label)
    saved_msg = (
        f"💾 Repo saved on {metadata.last_pulled_display}. Access it via the Bookmarked tab for RAG chat."
    )
    updated_summary = _build_summary_from_base(
        state_payload.get("summary_base", []),
        saved_msg,
    )
    new_state = {
        **(state_payload or {}),
        "summary_base": state_payload.get("summary_base", []),
        "saved": True,
    }
    return saved_msg, dropdown_update, metadata_list, info, updated_summary, new_state

def update_selected_bookmark(label: str, metadata_list: list[dict]):
    metadata = find_metadata_by_label(label, metadata_list or []) if label else None
    return _format_bookmark_info(metadata)


def answer_bookmark_question(label: str, question: str, metadata_list: list[dict]):
    if not label:
        return "Select a bookmarked repository before asking a question."
    if not question.strip():
        return "Enter a question to query your bookmarked repository."
    metadata = find_metadata_by_label(label, metadata_list or [])
    if not metadata:
        return "Bookmark metadata not found. Try refreshing bookmarks."
    if metadata.get("vector_chunks", 0) == 0:
        return "This bookmark has no vector store yet. Re-bookmark the repo to rebuild embeddings."
    summary = (
        f"Repository: {metadata.get('repo_name', label)}\n"
        f"Docs: {metadata.get('docs_count', 0)} | Last pulled: {metadata.get('last_pulled_display', '--/--/----')}"
    )
    answer = rag_answer_from_store(Path(metadata["vector_dir"]), question, repo_summary=summary)
    return answer


def placeholder_action_message(label: str):
    if not label:
        return "Select a bookmarked repository to use this action."
    return f"Additional bookmark actions for **{label}** are coming soon."

def run_experimental_lab(intention: str, report_name: str | None):
    text = (intention or "").strip()
    if not text:
        return "Describe what you want to build in the Experimental Lab to get started."
    root = _ensure_knowledge_root()
    report_markdown = ""
    context_note = ""
    if report_name:
        report_path = root / report_name
        if report_path.exists():
            try:
                raw = report_path.read_text(encoding="utf-8", errors="ignore")
                report_markdown = raw
                snippet = raw[:3000]
                context_note = (
                    f"Using Knowledge Transfer report: `{report_name}` as reference.\n\n"
                    f"Snippet from report (truncated):\n\n```markdown\n{snippet}\n```\n\n"
                )
            except OSError:
                context_note = f"Unable to read Knowledge Transfer report `{report_name}`. Proceeding without embedded context.\n\n"
    build_result = build_experiment_from_report(text, report_markdown)
    code = build_result.get("code", "")
    stdout = build_result.get("stdout", "")
    error = build_result.get("error", "")
    base_intro = (
        "Experimental Lab is a sandbox where future versions of MonkeyMind will use "
        "Knowledge Transfer reports as context to plan and build small Gradio apps.\n\n"
    )
    code_section = "### Generated experiment code\n\n"
    if code:
        code_section += f"```python\n{code}\n```\n\n"
    else:
        code_section += "No code was generated.\n\n"
    results_section = "### Sandbox output\n\n"
    if stdout:
        results_section += f"**Stdout / logs:**\n\n```text\n{stdout}\n```\n\n"
    if error:
        results_section += f"**Error:**\n\n```text\n{error}\n```\n\n"
    if not stdout and not error:
        results_section += "No errors encountered during the sandbox test.\n\n"
    return (
        base_intro
        + context_note
        + f"You wrote:\n\n> {text}\n\n"
        + code_section
        + results_section
    )


def lab_fix_bugs(intention: str, report_name: str | None):
    base = run_experimental_lab(intention, report_name)
    return (
        base
        + "\n\n---\n\n_This Fix bugs action will eventually trigger another build iteration to resolve errors in the generated app. "
        "For now, it simply records another planning pass based on your intention and chosen report._"
    )


def lab_mark_happy(intention: str, report_name: str | None):
    text = (intention or "").strip()
    return (
        "Marking this experiment as complete.\n\n"
        f"Final intention:\n\n> {text or 'N/A'}\n\n"
        "You can now export or reuse this idea elsewhere. Future versions will attach concrete code artifacts here."
    )


def lab_export_project(intention: str, report_name: str | None):
    text = (intention or "").strip()
    return (
        "Export placeholder: a future version will bundle generated code, configuration, and a short README "
        "into a downloadable package.\n\n"
        f"Current experiment description:\n\n> {text or 'N/A'}\n\n"
        f"Reference report: `{report_name or 'none selected'}`."
    )

def answer_chat_question(question: str, github_state, local_state, youtube_state, selected_bookmark, metadata_list):
    """Answer questions using RAG from any indexed source or bookmark."""
    if not question.strip():
        return "Please enter a question."
    # Check if using a bookmark
    if selected_bookmark:
        metadata = find_metadata_by_label(selected_bookmark, metadata_list or [])
        if metadata and metadata.get("vector_chunks", 0) > 0:
            summary = (
                f"Repository: {metadata.get('repo_name', selected_bookmark)}\n"
                f"Last pulled: {metadata.get('last_pulled_display', '--/--/----')}"
            )
            answer = rag_answer_from_store(Path(metadata["vector_dir"]), question, repo_summary=summary)
            return f"**[Bookmark: {selected_bookmark}]**\n\n{answer}"
    # Check current session sources
    for state, label in [
        (github_state, "GitHub"),
        (local_state, "Local"),
        (youtube_state, "YouTube"),
    ]:
        if state and state.get("indexed") and state.get("vector_dir"):
            vector_dir = Path(state["vector_dir"])
            if vector_dir.exists():
                answer = rag_answer_from_store(vector_dir, question)
                return f"**[{label} Source]**\n\n{answer}"
    return "⚠️ No indexed sources available. Please index a repository or select a bookmark first."

def generate_and_download_report(state_payload: dict | None, source_type: str):
    """Generate a markdown report and return the file path for download."""
    analysis_data = (state_payload or {}).get("analysis") if state_payload else None
    if not analysis_data:
        return None
    if source_type == "youtube":
        chapters = analysis_data.get("chapters", "")
        url = analysis_data.get("url", "youtube")
        lang = analysis_data.get("lang", "en")
        study_notes = generate_youtube_study_notes(chapters, url=url)
        generated_at = datetime.now(timezone.utc).strftime("%Y-%m-%d %H:%M:%S %Z")
        lines = [
            "# YouTube Knowledge Transfer Report",
            "",
            f"- Source: {url}",
            f"- Language: {lang}",
            f"- Generated at: {generated_at}",
            "",
            "## 1. Chapter Outline",
            "",
            chapters,
            "",
            "## 2. Study Notes",
            "",
            study_notes,
        ]
    else:
        # GitHub or local repo
        repo_name = analysis_data.get("repo_name", "Project")
        repo_url = analysis_data.get("repo_url", "local")
        docs = analysis_data.get("documentation", [])
        generated_at = datetime.now(timezone.utc).strftime("%Y-%m-%d %H:%M:%S %Z")
        lines = [
            f"# Knowledge Transfer Report – {repo_name}",
            "",
            f"- Source: {repo_url}",
            f"- Generated at: {generated_at}",
            f"- Documentation files: {len(docs)}",
            "",
            "## Documentation Files",
            "",
        ]
        for doc in docs[:50]:
            lines.append(f"- {doc.get('path', 'unknown')}")
    report_markdown = "\n".join(lines)
    root = _ensure_knowledge_root()
    # YouTube analyses carry no repo_name, so fall back to the video URL
    # before the generic "project" slug.
    slug = _slugify_name(analysis_data.get("repo_name") or analysis_data.get("url") or "project")
    ts = datetime.now(timezone.utc).strftime("%Y%m%d-%H%M%S")
    report_path = root / f"{slug}-report-{ts}.md"
    report_path.write_text(report_markdown, encoding="utf-8")
    return str(report_path)
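
# Illustrative only (not wired into the UI): producing a downloadable report
# from a hand-built state payload. All values below are hypothetical.
def _demo_generate_report() -> None:
    fake_state = {
        "analysis": {
            "repo_name": "sample-repo",
            "repo_url": "https://github.com/example/sample-repo",
            "documentation": [{"path": "README.md", "content": "# Sample"}],
        }
    }
    path = generate_and_download_report(fake_state, source_type="github")
    print(path)  # e.g. Knowledge Transfer/sample-repo-report-<UTC timestamp>.md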

def refresh_bookmarks_dropdown():
    """Refresh the bookmarks dropdown."""
    choices, metadata_list = get_dropdown_options()
    return gr.Dropdown(choices=choices, value=None, interactive=True), metadata_list

def build_interface() -> tuple[gr.Blocks, gr.Theme | None, str | None]:
    """Build the Gradio interface with improved UI/UX inspired by modern dashboard design."""
    custom_css = """
    @import url('https://fonts.googleapis.com/css2?family=Outfit:wght@300;400;500;600;700&family=JetBrains+Mono:wght@400;500&display=swap');

    :root {
        --primary: #34d399; /* Mint Green */
        --primary-glow: rgba(52, 211, 153, 0.4);
        --glass-bg: rgba(15, 23, 42, 0.6);
        --glass-border: rgba(255, 255, 255, 0.08);
        --text-main: #f8fafc;
        --text-muted: #94a3b8;
    }

    body {
        background-color: #0f172a;
        color: var(--text-main);
        font-family: 'Outfit', sans-serif !important;
    }

    /* Global container override */
    .gradio-container {
        max-width: 1400px !important;
        background: #0f172a !important;
        background-image:
            radial-gradient(circle at 0% 0%, rgba(52, 211, 153, 0.15) 0%, transparent 50%),
            radial-gradient(circle at 100% 100%, rgba(16, 185, 129, 0.1) 0%, transparent 50%) !important;
        border: none !important;
    }

    /* Header styling */
    .header-container {
        background: rgba(15, 23, 42, 0.8);
        backdrop-filter: blur(12px);
        border-bottom: 1px solid var(--glass-border);
        padding: 20px 24px;
        margin: -16px -16px 24px -16px;
        border-radius: 0;
    }

    /* Card/Panel styling */
    .source-card, .gradio-group, .tabs, .tabitem, .box-container {
        background: var(--glass-bg) !important;
        backdrop-filter: blur(12px);
        border: 1px solid var(--glass-border) !important;
        border-radius: 16px !important;
        box-shadow: 0 4px 20px rgba(0, 0, 0, 0.2);
        padding: 20px !important;
        margin-bottom: 20px !important;
    }

    /* Inputs and Textareas */
    input, textarea, .gr-input, .gr-box, .dropdown-wrap {
        background-color: rgba(30, 41, 59, 0.6) !important;
        border: 1px solid rgba(255, 255, 255, 0.1) !important;
        color: var(--text-main) !important;
        border-radius: 10px !important;
    }

    input:focus, textarea:focus {
        border-color: var(--primary) !important;
        box-shadow: 0 0 0 2px var(--primary-glow) !important;
    }

    /* Buttons */
    button.primary {
        background: linear-gradient(135deg, #34d399 0%, #10b981 100%) !important;
        color: #0f172a !important;
        font-weight: 600 !important;
        border: none !important;
        box-shadow: 0 4px 15px rgba(52, 211, 153, 0.3) !important;
    }

    button.secondary {
        background: rgba(30, 41, 59, 0.8) !important;
        border: 1px solid rgba(255, 255, 255, 0.1) !important;
        color: var(--text-muted) !important;
    }

    button.secondary:hover {
        color: var(--text-main) !important;
        border-color: var(--primary) !important;
    }

    button.stop {
        background: linear-gradient(135deg, #f87171 0%, #ef4444 100%) !important;
        color: white !important;
    }

    /* Status indicators */
    .status-ready {
        background: rgba(16, 185, 129, 0.1);
        color: #34d399;
        padding: 6px 12px;
        border-radius: 20px;
        font-size: 12px;
        border: 1px solid rgba(16, 185, 129, 0.2);
    }

    .status-pending {
        background: rgba(251, 191, 36, 0.1);
        color: #fbbf24;
        padding: 6px 12px;
        border-radius: 20px;
        font-size: 12px;
        border: 1px solid rgba(251, 191, 36, 0.2);
    }

    /* Keep copy/like buttons always visible and styled */
    .message-buttons {
        opacity: 1 !important;
        display: flex !important;
        gap: 4px !important;
    }

    .message-buttons button {
        color: #94a3b8 !important; /* text-muted */
        background: transparent !important;
        border: none !important;
        box-shadow: none !important;
    }

    .message-buttons button:hover {
        color: #34d399 !important; /* primary */
        background: rgba(52, 211, 153, 0.1) !important;
    }

    /* Chat bubbles */
    .chat-assistant {
        background: rgba(30, 41, 59, 0.8) !important;
        border: 1px solid var(--glass-border);
        border-radius: 18px 18px 18px 4px !important;
        color: var(--text-main) !important;
    }

    .chat-user {
        background: linear-gradient(135deg, #34d399 0%, #10b981 100%) !important;
        color: #022c22 !important;
        border-radius: 18px 18px 4px 18px !important;
        font-weight: 500;
    }

    /* Chat message text size and font */
    .message-wrap .message {
        font-size: 0.9rem !important;
        font-family: 'JetBrains Mono', monospace !important;
        line-height: 1.5 !important;
    }

    /* Typography overrides */
    .prose, .prose h1, .prose h2, .prose h3, .prose p, .prose strong {
        color: var(--text-main) !important;
    }

    /* Scrollbar */
    ::-webkit-scrollbar { width: 6px; height: 6px; }
    ::-webkit-scrollbar-track { background: transparent; }
    ::-webkit-scrollbar-thumb { background: #334155; border-radius: 10px; }
    ::-webkit-scrollbar-thumb:hover { background: #475569; }
    """
    app_theme = gr.themes.Soft(
        primary_hue="emerald",
        secondary_hue="slate",
        neutral_hue="slate",
    ).set(
        body_background_fill="#0f172a",
        block_background_fill="#1e293b",
        block_border_color="rgba(255,255,255,0.1)",
        input_background_fill="#0f172a",
        button_primary_background_fill="#34d399",
        button_primary_text_color="#0f172a",
    )

    blocks_kwargs = {"title": "🐒 MonkeyMind - Knowledge Transfer Agent"}
    # Theme and CSS kwargs are only passed on Gradio < 6 (see _is_gradio_v6_or_newer).
    if not IS_GRADIO_V6:
        blocks_kwargs.update(theme=app_theme, css=custom_css)
    with gr.Blocks(**blocks_kwargs) as demo:
        # State variables
        github_state = gr.State({})
        local_state = gr.State({})
        youtube_state = gr.State({})
        bookmarks_metadata = gr.State([])
        chat_history = gr.State([])
        notepad_content = gr.State("")  # For notepad feature
        copied_texts = gr.State(set())  # Track copied texts to prevent duplicates

        # ===== HEADER =====
        with gr.Row(elem_classes=["header-container"]):
            gr.HTML("""
            <div style="display: flex; align-items: center; gap: 16px;">
                <div style="width: 48px; height: 48px; border-radius: 12px; background: linear-gradient(135deg, #34d399 0%, #10b981 100%); display: flex; align-items: center; justify-content: center; box-shadow: 0 0 20px rgba(52, 211, 153, 0.3);">
                    <span style="font-size: 28px;">🐒</span>
                </div>
                <div>
                    <h1 style="margin: 0; font-size: 1.5rem; font-weight: 700; color: #f8fafc; letter-spacing: -0.5px;">
                        MonkeyMind
                    </h1>
                    <div style="display: flex; align-items: center; gap: 8px;">
                        <span style="width: 8px; height: 8px; border-radius: 50%; background: #34d399; box-shadow: 0 0 10px #34d399;"></span>
                        <p style="margin: 0; font-size: 0.8rem; color: #94a3b8; font-family: 'JetBrains Mono', monospace;">AGENT ACTIVE</p>
                    </div>
                </div>
            </div>
            """)

        # ===== APP DESCRIPTION =====
        gr.Markdown("""
        > **🐒 MonkeyMind** is your Knowledge Transfer & RAG Agent. Analyze GitHub repos, local projects, or YouTube videos
        > to build a personal knowledge base. Chat with your sources using AI-powered retrieval.
        >
        > **Quick Start:** Paste a GitHub URL → Click **Analyze** → Click **Index** → Start chatting!
        > Bookmark important sources to access them anytime.
        """)

        # ===== MAIN LAYOUT: 1/3 Left Panel + 2/3 Right Panel =====
        with gr.Row():
            # ===== LEFT PANEL: Data Sources + Bookmarks =====
            with gr.Column(scale=1, min_width=350):
                # Data Sources Section
                gr.Markdown("### 📡 Data Ingestion")
                # Source Type Selector (pill-style tabs)
                source_type = gr.Radio(
                    choices=["🐙 GitHub", "📁 Local", "🎥 YouTube"],
                    value="🐙 GitHub",
                    label="",
                    container=False,
                    interactive=True,
                )
                # Dynamic source input based on selection
                with gr.Group(visible=True) as github_group:
                    gr.Markdown("*Paste a GitHub repo URL and click **Analyze** to extract docs. Then **Index** to enable RAG chat. You can see retrieved contents in the **Preview** tab on the right.*")
                    github_url = gr.Textbox(
                        label="Repository URL",
                        placeholder="https://github.com/username/repo",
                        show_label=True,
                    )
                    github_analyze_btn = gr.Button("🔍 Analyze Repository", variant="secondary")
                    github_index_btn = gr.Button("⚡ Index for RAG", variant="primary")
                    github_status = gr.Markdown("Ready to analyze.", elem_classes=["status-pending"])
                    github_bookmark_btn = gr.Button("📌 Bookmark & Save to Knowledge Base", variant="secondary")
                    gr.Markdown("---")
                    gr.Markdown("**📝 Notepad** *(copy useful info here)*")
                    github_notepad = gr.Textbox(
                        label="",
                        placeholder="Paste or write notes here...",
                        lines=3,
                        container=False,
                        show_copy_button=True,
                    )
                    with gr.Row():
                        github_notepad_download = gr.DownloadButton("📥 Download as .md", variant="secondary", size="sm")
                with gr.Group(visible=False) as local_group:
                    gr.Markdown("*Upload a project folder. Irrelevant files are auto-filtered. You can see retrieved contents in the **Preview** tab on the right.*")
                    local_folder = gr.File(
                        label="Upload Project Folder",
                        file_count="directory",
                        type="filepath",
                    )
                    local_analyze_btn = gr.Button("🔍 Analyze Project", variant="secondary")
                    local_index_btn = gr.Button("⚡ Index for RAG", variant="primary")
                    local_status = gr.Markdown("Ready to analyze.", elem_classes=["status-pending"])
                    local_bookmark_btn = gr.Button("📌 Bookmark & Save to Knowledge Base", variant="secondary")
                    gr.Markdown("---")
                    gr.Markdown("**📝 Notepad** *(copy useful info here)*")
                    local_notepad = gr.Textbox(
                        label="",
                        placeholder="Paste or write notes here...",
                        lines=3,
                        container=False,
                        show_copy_button=True,
                    )
                    with gr.Row():
                        local_notepad_download = gr.DownloadButton("📥 Download as .md", variant="secondary", size="sm")
                with gr.Group(visible=False) as youtube_group:
                    gr.Markdown("*Paste a YouTube video URL to extract and analyze the transcript. You can see retrieved contents in the **Preview** tab on the right.*")
                    youtube_url = gr.Textbox(
                        label="Video URL",
                        placeholder="https://www.youtube.com/watch?v=...",
                    )
                    youtube_analyze_btn = gr.Button("🔍 Analyze Video", variant="secondary")
                    youtube_index_btn = gr.Button("⚡ Index for RAG", variant="primary")
                    youtube_status = gr.Markdown("Ready to analyze.", elem_classes=["status-pending"])
                    youtube_bookmark_btn = gr.Button("📌 Bookmark & Save to Knowledge Base", variant="secondary")
                    gr.Markdown("---")
                    gr.Markdown("**📝 Notepad** *(copy useful info here)*")
                    youtube_notepad = gr.Textbox(
                        label="",
                        placeholder="Paste or write notes here...",
                        lines=3,
                        container=False,
                        show_copy_button=True,
                    )
                    with gr.Row():
                        youtube_notepad_download = gr.DownloadButton("📥 Download as .md", variant="secondary", size="sm")

                # Source type switching logic
                def switch_source(choice):
                    return (
                        gr.Group(visible=("GitHub" in choice)),
                        gr.Group(visible=("Local" in choice)),
                        gr.Group(visible=("YouTube" in choice)),
                    )

                source_type.change(
                    fn=switch_source,
                    inputs=[source_type],
                    outputs=[github_group, local_group, youtube_group],
                )
                gr.Markdown("---")
                # Bookmarks Quick Access Section
                gr.Markdown("### 🧠 Knowledge Base")
                gr.Markdown("*Select sources to use for chat. Multiple selections allowed.*")
                # Use CheckboxGroup for multi-select
                bookmarks_checkboxes = gr.CheckboxGroup(
                    label="Active Sources",
                    choices=[],
                    value=[],
                    interactive=True,
                    info="Check sources to include in chat context",
                )
                # Keep dropdown for compatibility (hidden, used internally)
                bookmarks_dropdown = gr.Dropdown(
                    label="",
                    choices=[],
                    value=None,
                    interactive=True,
                    visible=False,
                )
                with gr.Row():
                    refresh_bookmarks_btn = gr.Button("🔄 Refresh", variant="secondary", size="sm", scale=1)
                    view_all_btn = gr.Button("📋 View All", variant="secondary", size="sm", scale=1)
                # Bookmark info display
                bookmark_info = gr.Markdown(
                    value="*No sources selected. Bookmark repos to add them here.*",
                    elem_classes=["info-box"],
                )

            # ===== RIGHT PANEL: Chat & Preview =====
            with gr.Column(scale=2, min_width=500):
                # Chat vs Preview Toggle
                right_panel_mode = gr.Radio(
                    choices=["💬 Chat & RAG", "📄 Preview"],
                    value="💬 Chat & RAG",
                    label="",
                    container=False,
                )
                # Chat Interface
                with gr.Group(visible=True) as chat_panel:
                    with gr.Group(elem_classes=["box-container"]):
                        gr.Markdown("### 🐒 Knowledge Assistant")
                        gr.Markdown("*Hover over messages to see the copy icon. Use the toggles below to augment with web/wiki search.*")
                        chatbot_kwargs = dict(
                            value=[],
                            height=450,
                            show_label=False,
                            avatar_images=["images/user.png", "images/monkey.png"],
                            elem_classes=["chat-container"],
                            type="messages",
                        )
                        chatbot = gr.Chatbot(**chatbot_kwargs)
                        # Toolbar row: Web Search and Wiki Search toggles (Clear Chat removed)
                        with gr.Row():
                            web_search_toggle = gr.Checkbox(
                                label="🌐 Web Search",
                                value=False,
                                interactive=True,
                            )
                            wiki_search_toggle = gr.Checkbox(
                                label="📖 Wikipedia",
                                value=False,
                                interactive=True,
                            )
                        with gr.Row():
                            question_box = gr.Textbox(
                                label="",
                                placeholder="Ask anything about your indexed sources...",
                                lines=1,
                                scale=5,
                                container=False,
                            )
                            send_btn = gr.Button("Send", variant="primary", scale=1)
                        gr.Examples(
                            examples=[
                                "Summarize the main architecture patterns",
                                "What are the key dependencies?",
                                "Explain the core functionality",
                                "What patterns can I reuse?",
                            ],
                            inputs=question_box,
                            label="Quick Questions",
                        )
                    # ===== EXPERIMENTAL LAB (Collapsible) =====
                    with gr.Group(elem_classes=["box-container"]):
                        gr.Markdown("### 🧪 Experimental Lab")
                        gr.Markdown("Use this lab to prototype small apps based on your knowledge base.")
                        with gr.Accordion("Open Lab", open=False):
                            gr.Markdown("*The agent generates Gradio code and tests it in a sandbox.*")
                            with gr.Row():
                                with gr.Column(scale=1):
                                    gr.Markdown("### 🎯 Build an Experiment")
                                    lab_intention = gr.Textbox(
                                        label="What do you want to build?",
                                        placeholder="e.g., A Gradio app that visualizes patterns from a Knowledge Transfer report.",
                                        lines=3,
                                    )
                                    lab_report_dropdown = gr.Dropdown(
                                        label="Reference Material (bookmarked report)",
                                        choices=_list_knowledge_report_choices(),
                                        value=None,
                                        interactive=True,
                                        info="Select a Knowledge Transfer report as context",
                                    )
                                    with gr.Row():
                                        lab_refresh_reports_btn = gr.Button("🔄 Refresh", variant="secondary", size="sm")
                                        lab_start_btn = gr.Button("▶️ Start Build", variant="primary", size="sm")
                                    gr.Markdown("---")
                                    gr.Markdown("**🔧 Fix Issues**")
                                    lab_fix_instruction = gr.Textbox(
                                        label="",
                                        placeholder="Describe what needs to be fixed (e.g., 'The button click handler is not working')...",
                                        lines=2,
                                        container=False,
                                    )
                                    with gr.Row():
                                        lab_fix_btn = gr.Button("🔧 Apply Fix", variant="secondary", size="sm")
                                        lab_happy_btn = gr.Button("✅ Done", variant="secondary", size="sm")
                                    lab_export_btn = gr.Button("📥 Export Code", variant="primary")
                                    lab_download = gr.File(label="Download", visible=False)
                                with gr.Column(scale=2):
                                    gr.Markdown("### 🔬 Experiment Output")
                                    lab_output = gr.Markdown(
                                        "Describe what you want to build, select a reference report from your bookmarks, then click **Start Build**.\n\n"
                                        "If there are errors, describe the issue in the fix box and click **Apply Fix**."
                                    )
                                    lab_code_display = gr.Code(
                                        label="Generated Code",
                                        language="python",
                                        visible=False,
                                    )

                # Preview Interface
                with gr.Group(visible=False) as preview_panel:
                    gr.Markdown("### 📄 Document Preview")
                    with gr.Row():
                        with gr.Column(scale=1):
                            preview_source_info = gr.Markdown("""
**Source:** Not selected
**Status:** ⏳ Pending
**Chunks:** 0 vectors
""", elem_classes=["info-box"])
                        with gr.Column(scale=1, min_width=100):
                            with gr.Row():
                                preview_copy_btn = gr.Button("📋 Copy", variant="secondary", size="sm", scale=1)
                                preview_download_btn = gr.DownloadButton("📥 Download", variant="secondary", size="sm", scale=1)
                    preview_download_file = gr.File(visible=False)
                    preview_content = gr.Markdown(
                        value="Select a source and analyze it to see the preview here.",
                        elem_classes=["preview-card"],
                    )

                # Panel switching logic
                def switch_panel(choice):
                    return (
                        gr.Group(visible=("Chat" in choice)),
                        gr.Group(visible=("Preview" in choice)),
                    )

                right_panel_mode.change(
                    fn=switch_panel,
                    inputs=[right_panel_mode],
                    outputs=[chat_panel, preview_panel],
                )
                gr.Markdown("---")

        # ===== HIDDEN STATE COMPONENTS FOR DOWNLOADS =====
        github_download = gr.File(label="Download", visible=False)
        local_download = gr.File(label="Download", visible=False)
        youtube_download = gr.File(label="Download", visible=False)

        # ===== EVENT HANDLERS =====
        # GitHub handlers
        github_analyze_btn.click(
            fn=lambda: "⏳ **Analyzing repository...** Please wait.",
            outputs=[github_status],
        ).then(
            fn=run_github_ingestion,
            inputs=[github_url],
            outputs=[preview_content, preview_source_info, github_state],
        ).then(
            fn=lambda: "✅ **Analysis complete!** Click **Index for RAG** to enable chat.",
            outputs=[github_status],
        )

        def index_github_with_status(state):
            status, new_state = index_github_repo(state)
            chunks = new_state.get("vector_chunks", 0) if new_state else 0
            if "✅" in status or chunks > 0:
                return f"✅ **Indexed {chunks} vector chunks.** Ready for RAG queries!", new_state
            return status, new_state

        def index_local_with_status(state):
            status, new_state = index_local_repo(state)
            chunks = new_state.get("vector_chunks", 0) if new_state else 0
            if "✅" in status or chunks > 0:
                return f"✅ **Indexed {chunks} vector chunks.** Ready for RAG queries!", new_state
            return status, new_state

        def index_youtube_with_status(state):
            status, new_state = index_youtube_video(state)
            chunks = new_state.get("vector_chunks", 0) if new_state else 0
            if "✅" in status or chunks > 0:
                return f"✅ **Indexed {chunks} transcript chunks.** Ready for RAG queries!", new_state
            return status, new_state

        github_index_btn.click(
            fn=lambda: "⏳ **Indexing...** Building vector embeddings.",
            outputs=[github_status],
        ).then(
            fn=index_github_with_status,
            inputs=[github_state],
            outputs=[github_status, github_state],
        )

        def bookmark_with_refresh(state):
            status, new_state, _dropdown = bookmark_github_repo(state)
            choices, meta = get_dropdown_options()
            # Propagate warnings from the bookmark step instead of masking them.
            message = status if status.startswith("⚠️") else (
                "📌 **Bookmarked!** Added to Knowledge Base for future chat sessions."
            )
            return (
                message,
                new_state,
                gr.Dropdown(choices=choices, value=None),
                gr.CheckboxGroup(choices=choices, value=[]),
                meta,
            )

        github_bookmark_btn.click(
            fn=bookmark_with_refresh,
            inputs=[github_state],
            outputs=[github_status, github_state, bookmarks_dropdown, bookmarks_checkboxes, bookmarks_metadata],
        )

        # Local handlers
        local_analyze_btn.click(
            fn=lambda: "⏳ **Analyzing project...** Please wait.",
            outputs=[local_status],
        ).then(
            fn=run_local_repo_ingestion,
            inputs=[local_folder],
            outputs=[preview_content, preview_source_info, local_state],
        ).then(
            fn=lambda: "✅ **Analysis complete!** Click **Index for RAG** to enable chat.",
            outputs=[local_status],
        )

        local_index_btn.click(
            fn=lambda: "⏳ **Indexing...** Building vector embeddings.",
            outputs=[local_status],
        ).then(
            fn=index_local_with_status,
            inputs=[local_state],
            outputs=[local_status, local_state],
        )

        def bookmark_local_with_refresh(state):
            status, new_state, _dropdown = bookmark_local_repo(state)
            choices, meta = get_dropdown_options()
            # Propagate warnings from the bookmark step instead of masking them.
            message = status if status.startswith("⚠️") else (
                "📌 **Bookmarked!** Added to Knowledge Base for future chat sessions."
            )
            return (
                message,
                new_state,
                gr.Dropdown(choices=choices, value=None),
                gr.CheckboxGroup(choices=choices, value=[]),
                meta,
            )

        local_bookmark_btn.click(
            fn=bookmark_local_with_refresh,
            inputs=[local_state],
            outputs=[local_status, local_state, bookmarks_dropdown, bookmarks_checkboxes, bookmarks_metadata],
        )
        # YouTube handlers
        youtube_analyze_btn.click(
            fn=lambda: "⏳ **Fetching transcript...** Please wait.",
            outputs=[youtube_status],
        ).then(
            fn=run_youtube_ingestion,
            inputs=[youtube_url],
            outputs=[preview_content, preview_source_info, youtube_state],
        ).then(
            fn=lambda: "✅ **Analysis complete!** Click **Index for RAG** to enable chat.",
            outputs=[youtube_status],
        )

        youtube_index_btn.click(
            fn=lambda: "⏳ **Indexing...** Building vector embeddings.",
            outputs=[youtube_status],
        ).then(
            fn=index_youtube_with_status,
            inputs=[youtube_state],
            outputs=[youtube_status, youtube_state],
        )
        def bookmark_youtube_with_refresh(state):
            _status, new_state, _dropdown = bookmark_youtube_video(state)
            choices, meta = get_dropdown_options()
            return (
                "🔖 **Bookmarked!** Added to Knowledge Base for future chat sessions.",
                new_state,
                gr.Dropdown(choices=choices, value=None),
                gr.CheckboxGroup(choices=choices, value=[]),
                meta,
            )

        youtube_bookmark_btn.click(
            fn=bookmark_youtube_with_refresh,
            inputs=[youtube_state],
            outputs=[youtube_status, youtube_state, bookmarks_dropdown, bookmarks_checkboxes, bookmarks_metadata],
        )
        # Chat handlers
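        # The chatbot is assumed to use Gradio's "messages" format, where
        # history is a list of {"role": ..., "content": ...} dicts rather than
        # (user, bot) tuples; the handler appends one dict per turn.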
        def handle_chat_with_history(question, history, github_s, local_s, youtube_s, selected_sources, meta):
            # Use the first selected source from the checkboxes, or fall back
            # to whatever sources are already indexed in this session.
            bookmark = selected_sources[0] if selected_sources else None
            answer = answer_chat_question(question, github_s, local_s, youtube_s, bookmark, meta)
            history = history or []
            history.append({"role": "user", "content": question})
            history.append({"role": "assistant", "content": answer})
            return history, ""

        send_btn.click(
            fn=handle_chat_with_history,
            inputs=[question_box, chatbot, github_state, local_state, youtube_state, bookmarks_checkboxes, bookmarks_metadata],
            outputs=[chatbot, question_box],
        )
        question_box.submit(
            fn=handle_chat_with_history,
            inputs=[question_box, chatbot, github_state, local_state, youtube_state, bookmarks_checkboxes, bookmarks_metadata],
            outputs=[chatbot, question_box],
        )
        # Chatbot like/dislike handler
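        # gr.LikeData exposes .liked (True for thumbs-up, False for
        # thumbs-down) and .index (the position of the rated message), which
        # is all a future feedback logger should need.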
        def handle_chatbot_like(data: gr.LikeData):
            # Placeholder for future feedback logging.
            print(f"User feedback: {'Liked' if data.liked else 'Disliked'} message index {data.index}")
            return None

        chatbot.like(
            fn=handle_chatbot_like,
            outputs=None,
        )
        # Bookmark handlers: refresh both the dropdown and the checkboxes
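        # Returning fresh gr.Dropdown / gr.CheckboxGroup instances from a
        # handler is Gradio's post-4.x way of updating component properties
        # (here: choices) without replacing the components themselves.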
        def refresh_all_bookmarks():
            choices, meta = get_dropdown_options()
            return (
                gr.Dropdown(choices=choices, value=None),
                gr.CheckboxGroup(choices=choices, value=[]),
                meta,
            )

        refresh_bookmarks_btn.click(
            fn=refresh_all_bookmarks,
            outputs=[bookmarks_dropdown, bookmarks_checkboxes, bookmarks_metadata],
        )
        # View All button: show bookmark details
        def view_all_bookmarks(meta):
            if not meta:
                return "*No bookmarks found. Analyze and bookmark repositories to see them here.*"
            lines = ["**🔖 All Bookmarked Sources:**\n"]
            for m in meta:
                name = m.get("repo_name", "Unknown")
                date = m.get("last_pulled_display", "--")
                chunks = m.get("vector_chunks", 0)
                lines.append(f"- **{name}** · {date} · {chunks} chunks")
            return "\n".join(lines)

        view_all_btn.click(
            fn=view_all_bookmarks,
            inputs=[bookmarks_metadata],
            outputs=[bookmark_info],
        )
        # Update bookmark info when the checkbox selection changes
        def update_checkbox_info(selected, meta):
            if not selected:
                return "*No sources selected. Check sources above to include in chat.*"
            lines = [f"**{len(selected)} source(s) selected:**\n"]
            for label in selected:
                m = find_metadata_by_label(label, meta or [])
                if m:
                    lines.append(f"- {m.get('repo_name', label)} ({m.get('vector_chunks', 0)} chunks)")
            return "\n".join(lines)

        bookmarks_checkboxes.change(
            fn=update_checkbox_info,
            inputs=[bookmarks_checkboxes, bookmarks_metadata],
            outputs=[bookmark_info],
        )
        # Notepad download handlers
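        # Assuming the *_notepad_download components are gr.DownloadButton
        # instances, the click handler writes the notepad text to a temp file
        # and returns its path, which becomes the button's downloadable value.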
        def download_notepad_as_md(content):
            if not content or not content.strip():
                return None
            import tempfile
            with tempfile.NamedTemporaryFile(mode='w', suffix='.md', delete=False, encoding='utf-8') as f:
                f.write(content)
            return f.name

        github_notepad_download.click(
            fn=download_notepad_as_md,
            inputs=[github_notepad],
            outputs=[github_notepad_download],
        )
        local_notepad_download.click(
            fn=download_notepad_as_md,
            inputs=[local_notepad],
            outputs=[local_notepad_download],
        )
        youtube_notepad_download.click(
            fn=download_notepad_as_md,
            inputs=[youtube_notepad],
            outputs=[youtube_notepad_download],
        )
        # Preview copy handler (client-side JS)
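        # Note: navigator.clipboard is only available in secure contexts
        # (HTTPS or localhost); on plain HTTP the call fails in the browser
        # rather than copying.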
        preview_copy_btn.click(
            fn=None,
            inputs=[preview_content],
            js="(content) => { navigator.clipboard.writeText(content); return 'Copied!'; }",
        )

        # Preview download handler (reuses the markdown download helper)
        preview_download_btn.click(
            fn=download_notepad_as_md,
            inputs=[preview_content],
            outputs=[preview_download_btn],
        )
        # Lab handlers with improved output
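        # run_lab_with_code scans the lab result for the first fenced Python
        # block; if one is found, it is surfaced in a dedicated gr.Code panel
        # so the snippet can be copied or exported separately.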
        def run_lab_with_code(intention, report):
            result = run_experimental_lab(intention, report)
            # Extract the first fenced Python block, if present.
            fence = "```python"
            if fence in result:
                code_start = result.find(fence) + len(fence)
                code_end = result.find("```", code_start)
                code = result[code_start:code_end].strip() if code_end > code_start else ""
                return result, gr.Code(value=code, visible=True)
            return result, gr.Code(visible=False)

        lab_start_btn.click(
            fn=run_lab_with_code,
            inputs=[lab_intention, lab_report_dropdown],
            outputs=[lab_output, lab_code_display],
        )

        def fix_lab_with_instruction(intention, report, fix_instruction):
            # Fold the user's fix request into the intention passed downstream.
            combined = f"{intention}\n\nFIX REQUEST: {fix_instruction}" if fix_instruction else intention
            return lab_fix_bugs(combined, report)

        lab_fix_btn.click(
            fn=fix_lab_with_instruction,
            inputs=[lab_intention, lab_report_dropdown, lab_fix_instruction],
            outputs=[lab_output],
        )

        lab_happy_btn.click(
            fn=lab_mark_happy,
            inputs=[lab_intention, lab_report_dropdown],
            outputs=[lab_output],
        )
        # Export lab code to file
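        # The chained .then() below reveals the hidden gr.File component once
        # a path has been written, so the download link only appears after a
        # successful export.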
        def export_lab_code(code_content):
            if not code_content:
                return None
            import tempfile
            with tempfile.NamedTemporaryFile(mode='w', suffix='.py', delete=False, encoding='utf-8') as f:
                f.write(code_content)
            return f.name

        lab_export_btn.click(
            fn=export_lab_code,
            inputs=[lab_code_display],
            outputs=[lab_download],
        ).then(
            fn=lambda: gr.File(visible=True),
            outputs=[lab_download],
        )
        lab_refresh_reports_btn.click(
            fn=_refresh_lab_reports_dropdown,
            outputs=[lab_report_dropdown],
        )
        # Load bookmarks on startup (refresh both the dropdown and the checkboxes)
        demo.load(
            fn=refresh_all_bookmarks,
            outputs=[bookmarks_dropdown, bookmarks_checkboxes, bookmarks_metadata],
        )
    return demo, (app_theme if IS_GRADIO_V6 else None), (custom_css if IS_GRADIO_V6 else None)
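
# The version gate below assumes Gradio 6 accepts theme/css as launch()
# keyword arguments; on older versions they are presumably applied inside
# build_interface() when the Blocks object is constructed.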
if __name__ == "__main__":
    demo, app_theme, custom_css = build_interface()
    launch_kwargs = {"share": False}
    if IS_GRADIO_V6:
        launch_kwargs.update(theme=app_theme, css=custom_css)
    demo.launch(**launch_kwargs)