Joseph Pollack committed on
Commit
8fa2ce6
·
unverified ·
1 Parent(s): a2f220d

attempts fix 403 and settings

Browse files
.pre-commit-config.yaml CHANGED
@@ -14,7 +14,7 @@ repos:
14
  hooks:
15
  - id: mypy
16
  files: ^src/
17
- exclude: ^folder
18
  additional_dependencies:
19
  - pydantic>=2.7
20
  - pydantic-settings>=2.2
 
14
  hooks:
15
  - id: mypy
16
  files: ^src/
17
+ exclude: ^folder|^src/app.py
18
  additional_dependencies:
19
  - pydantic>=2.7
20
  - pydantic-settings>=2.2
dev/__init__.py CHANGED
@@ -1,2 +1 @@
1
  """Development utilities and plugins."""
2
-
 
1
  """Development utilities and plugins."""
 
docs/LICENSE.md CHANGED
@@ -32,3 +32,4 @@ SOFTWARE.
32
 
33
 
34
 
 
 
32
 
33
 
34
 
35
+
pyproject.toml CHANGED
@@ -127,6 +127,7 @@ ignore = [
127
  "PLR0913", # Too many arguments (agents need many params)
128
  "PLR0912", # Too many branches (complex orchestrator logic)
129
  "PLR0911", # Too many return statements (complex agent logic)
 
130
  "PLR2004", # Magic values (statistical constants like p-values)
131
  "PLW0603", # Global statement (singleton pattern for Modal)
132
  "PLC0415", # Lazy imports for optional dependencies
@@ -152,6 +153,7 @@ exclude = [
152
  "^reference_repos/",
153
  "^examples/",
154
  "^folder/",
 
155
  ]
156
 
157
  # ============== PYTEST CONFIG ==============
 
127
  "PLR0913", # Too many arguments (agents need many params)
128
  "PLR0912", # Too many branches (complex orchestrator logic)
129
  "PLR0911", # Too many return statements (complex agent logic)
130
+ "PLR0915", # Too many statements (Gradio UI setup functions)
131
  "PLR2004", # Magic values (statistical constants like p-values)
132
  "PLW0603", # Global statement (singleton pattern for Modal)
133
  "PLC0415", # Lazy imports for optional dependencies
 
153
  "^reference_repos/",
154
  "^examples/",
155
  "^folder/",
156
+ "^src/app.py",
157
  ]
158
 
159
  # ============== PYTEST CONFIG ==============
src/app.py CHANGED
@@ -583,7 +583,6 @@ async def research_agent(
583
  yield chat_msg
584
 
585
  # Optional: Generate audio output if enabled
586
- audio_output_data: tuple[int, np.ndarray[Any, Any]] | None = None # type: ignore[type-arg]
587
  if settings.enable_audio_output and settings.modal_available:
588
  try:
589
  from src.services.tts_modal import get_tts_service
@@ -592,7 +591,7 @@ async def research_agent(
592
  # Get the last message from history for TTS
593
  last_message = history[-1].get("content", "") if history else processed_text
594
  if last_message:
595
- audio_output_data = await tts_service.synthesize_async(
596
  text=last_message,
597
  voice=tts_voice,
598
  speed=tts_speed,
@@ -834,6 +833,48 @@ def create_demo() -> gr.Blocks:
834
  info="Select inference provider (leave empty for auto-select). Sign in to see all available providers.",
835
  )
836
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
837
  # Web Search Provider selection
838
  gr.Markdown("### 🔍 Web Search Provider")
839
 
@@ -1064,41 +1105,6 @@ def create_demo() -> gr.Blocks:
1064
  outputs=[tts_voice_dropdown, tts_speed_slider, audio_output],
1065
  )
1066
 
1067
- # Update model/provider dropdowns when user clicks refresh button
1068
- # Note: Gradio doesn't directly support watching OAuthToken/OAuthProfile changes
1069
- # So we provide a refresh button that users can click after logging in
1070
- def refresh_models_and_providers(
1071
- oauth_token: gr.OAuthToken | None = None,
1072
- oauth_profile: gr.OAuthProfile | None = None,
1073
- ) -> tuple[dict[str, Any], dict[str, Any], str]:
1074
- """Handle refresh button click and update dropdowns."""
1075
- import asyncio
1076
-
1077
- # Run async function in sync context
1078
- loop = asyncio.new_event_loop()
1079
- asyncio.set_event_loop(loop)
1080
- try:
1081
- result = loop.run_until_complete(
1082
- update_model_provider_dropdowns(oauth_token, oauth_profile)
1083
- )
1084
- return result
1085
- finally:
1086
- loop.close()
1087
-
1088
- refresh_models_btn = gr.Button(
1089
- value="🔄 Refresh Available Models",
1090
- visible=True,
1091
- size="sm",
1092
- )
1093
-
1094
- # Note: OAuthToken and OAuthProfile are automatically passed to functions
1095
- # when they are available in the Gradio context
1096
- refresh_models_btn.click(
1097
- fn=refresh_models_and_providers,
1098
- inputs=[], # OAuth components are automatically available in Gradio context
1099
- outputs=[hf_model_dropdown, hf_provider_dropdown, model_provider_status],
1100
- )
1101
-
1102
  # Chat interface with multimodal support
1103
  # Examples are provided but will NOT run at startup (cache_examples=False)
1104
  # Users must log in first before using examples or submitting queries
 
583
  yield chat_msg
584
 
585
  # Optional: Generate audio output if enabled
 
586
  if settings.enable_audio_output and settings.modal_available:
587
  try:
588
  from src.services.tts_modal import get_tts_service
 
591
  # Get the last message from history for TTS
592
  last_message = history[-1].get("content", "") if history else processed_text
593
  if last_message:
594
+ await tts_service.synthesize_async(
595
  text=last_message,
596
  voice=tts_voice,
597
  speed=tts_speed,
 
833
  info="Select inference provider (leave empty for auto-select). Sign in to see all available providers.",
834
  )
835
 
836
+ # Refresh button for updating models/providers after login
837
+ def refresh_models_and_providers(
838
+ request: gr.Request,
839
+ ) -> tuple[dict[str, Any], dict[str, Any], str]:
840
+ """Handle refresh button click and update dropdowns."""
841
+ import asyncio
842
+
843
+ # Extract OAuth token and profile from request
844
+ oauth_token: gr.OAuthToken | None = None
845
+ oauth_profile: gr.OAuthProfile | None = None
846
+
847
+ if request is not None:
848
+ # Try to get OAuth token from request
849
+ if hasattr(request, "oauth_token"):
850
+ oauth_token = request.oauth_token
851
+ if hasattr(request, "oauth_profile"):
852
+ oauth_profile = request.oauth_profile
853
+
854
+ # Run async function in sync context
855
+ loop = asyncio.new_event_loop()
856
+ asyncio.set_event_loop(loop)
857
+ try:
858
+ result = loop.run_until_complete(
859
+ update_model_provider_dropdowns(oauth_token, oauth_profile)
860
+ )
861
+ return result
862
+ finally:
863
+ loop.close()
864
+
865
+ refresh_models_btn = gr.Button(
866
+ value="🔄 Refresh Available Models",
867
+ visible=True,
868
+ size="sm",
869
+ )
870
+
871
+ # Pass request to get OAuth token from Gradio context
872
+ refresh_models_btn.click(
873
+ fn=refresh_models_and_providers,
874
+ inputs=[], # Request is automatically available in Gradio context
875
+ outputs=[hf_model_dropdown, hf_provider_dropdown, model_provider_status],
876
+ )
877
+
878
  # Web Search Provider selection
879
  gr.Markdown("### 🔍 Web Search Provider")
880
 
 
1105
  outputs=[tts_voice_dropdown, tts_speed_slider, audio_output],
1106
  )
1107
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1108
  # Chat interface with multimodal support
1109
  # Examples are provided but will NOT run at startup (cache_examples=False)
1110
  # Users must log in first before using examples or submitting queries
src/orchestrator/graph_orchestrator.py CHANGED
@@ -886,10 +886,11 @@ class GraphOrchestrator:
886
  async def _execute_standard_agent(
887
  self, node: AgentNode, input_data: Any, query: str, context: GraphExecutionContext
888
  ) -> Any:
889
- """Execute standard agent with error handling."""
890
  # Get message history from context (limit to most recent 10 messages for token efficiency)
891
  message_history = context.get_message_history(max_messages=10)
892
 
 
893
  try:
894
  # Pass message_history if available (Pydantic AI agents support this)
895
  if message_history:
@@ -909,13 +910,204 @@ class GraphOrchestrator:
909
  "Failed to accumulate messages from agent result", error=str(e)
910
  )
911
  return result
912
- except Exception:
913
- # Handle validation errors and API errors for planner node
 
 
 
 
 
 
 
 
 
914
  if node.node_id == "planner":
 
 
 
 
 
 
 
 
 
 
 
 
 
915
  return self._create_fallback_plan(query, input_data)
916
- # For other nodes, re-raise the exception
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
917
  raise
918
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
919
  def _create_fallback_plan(self, query: str, input_data: Any) -> Any:
920
  """Create fallback ReportPlan when planner fails."""
921
  from src.utils.models import ReportPlan, ReportPlanSection
 
886
  async def _execute_standard_agent(
887
  self, node: AgentNode, input_data: Any, query: str, context: GraphExecutionContext
888
  ) -> Any:
889
+ """Execute standard agent with error handling and fallback models."""
890
  # Get message history from context (limit to most recent 10 messages for token efficiency)
891
  message_history = context.get_message_history(max_messages=10)
892
 
893
+ # Try with the original agent first
894
  try:
895
  # Pass message_history if available (Pydantic AI agents support this)
896
  if message_history:
 
910
  "Failed to accumulate messages from agent result", error=str(e)
911
  )
912
  return result
913
+ except Exception as e:
914
+ # Check if we should retry with fallback models
915
+ from src.utils.hf_error_handler import (
916
+ extract_error_details,
917
+ should_retry_with_fallback,
918
+ )
919
+
920
+ error_details = extract_error_details(e)
921
+ should_retry = should_retry_with_fallback(e)
922
+
923
+ # Handle validation errors and API errors for planner node (with fallback)
924
  if node.node_id == "planner":
925
+ if should_retry:
926
+ self.logger.warning(
927
+ "Planner failed, trying fallback models",
928
+ original_error=str(e),
929
+ status_code=error_details.get("status_code"),
930
+ )
931
+ # Try fallback models for planner
932
+ fallback_result = await self._try_fallback_models(
933
+ node, input_data, message_history, query, context, e
934
+ )
935
+ if fallback_result is not None:
936
+ return fallback_result
937
+ # If fallback failed or not applicable, use fallback plan
938
  return self._create_fallback_plan(query, input_data)
939
+
940
+ # For other nodes, try fallback models if applicable
941
+ if should_retry:
942
+ self.logger.warning(
943
+ "Agent node failed, trying fallback models",
944
+ node_id=node.node_id,
945
+ original_error=str(e),
946
+ status_code=error_details.get("status_code"),
947
+ )
948
+ fallback_result = await self._try_fallback_models(
949
+ node, input_data, message_history, query, context, e
950
+ )
951
+ if fallback_result is not None:
952
+ return fallback_result
953
+
954
+ # If fallback didn't work or wasn't applicable, re-raise the exception
955
  raise
956
 
957
+ async def _try_fallback_models(
958
+ self,
959
+ node: AgentNode,
960
+ input_data: Any,
961
+ message_history: list[Any],
962
+ query: str,
963
+ context: GraphExecutionContext,
964
+ original_error: Exception,
965
+ ) -> Any | None:
966
+ """Try executing agent with fallback models.
967
+
968
+ Args:
969
+ node: The agent node that failed
970
+ input_data: Input data for the agent
971
+ message_history: Message history for the agent
972
+ query: The research query
973
+ context: Execution context
974
+ original_error: The original error that triggered fallback
975
+
976
+ Returns:
977
+ Agent result if successful, None if all fallbacks failed
978
+ """
979
+ from src.utils.hf_error_handler import extract_error_details, get_fallback_models
980
+
981
+ error_details = extract_error_details(original_error)
982
+ original_model = error_details.get("model_name")
983
+ fallback_models = get_fallback_models(original_model)
984
+
985
+ # Also try models from settings fallback list
986
+ from src.utils.config import settings
987
+
988
+ settings_fallbacks = settings.get_hf_fallback_models_list()
989
+ for model in settings_fallbacks:
990
+ if model not in fallback_models:
991
+ fallback_models.append(model)
992
+
993
+ self.logger.info(
994
+ "Trying fallback models",
995
+ node_id=node.node_id,
996
+ original_model=original_model,
997
+ fallback_count=len(fallback_models),
998
+ )
999
+
1000
+ # Try each fallback model
1001
+ for fallback_model in fallback_models:
1002
+ try:
1003
+ # Recreate agent with fallback model
1004
+ fallback_agent = self._recreate_agent_with_model(node.node_id, fallback_model)
1005
+ if fallback_agent is None:
1006
+ continue
1007
+
1008
+ # Try running with fallback agent
1009
+ if message_history:
1010
+ result = await fallback_agent.run(input_data, message_history=message_history)
1011
+ else:
1012
+ result = await fallback_agent.run(input_data)
1013
+
1014
+ self.logger.info(
1015
+ "Fallback model succeeded",
1016
+ node_id=node.node_id,
1017
+ fallback_model=fallback_model,
1018
+ )
1019
+
1020
+ # Accumulate new messages from agent result if available
1021
+ if hasattr(result, "new_messages"):
1022
+ try:
1023
+ new_messages = result.new_messages()
1024
+ for msg in new_messages:
1025
+ context.add_message(msg)
1026
+ except Exception as e:
1027
+ self.logger.debug(
1028
+ "Failed to accumulate messages from fallback agent result", error=str(e)
1029
+ )
1030
+
1031
+ return result
1032
+
1033
+ except Exception as e:
1034
+ self.logger.warning(
1035
+ "Fallback model failed",
1036
+ node_id=node.node_id,
1037
+ fallback_model=fallback_model,
1038
+ error=str(e),
1039
+ )
1040
+ continue
1041
+
1042
+ # All fallback models failed
1043
+ self.logger.error(
1044
+ "All fallback models failed",
1045
+ node_id=node.node_id,
1046
+ fallback_count=len(fallback_models),
1047
+ )
1048
+ return None
1049
+
1050
+ def _recreate_agent_with_model(self, node_id: str, model_name: str) -> Any | None:
1051
+ """Recreate an agent with a specific model.
1052
+
1053
+ Args:
1054
+ node_id: The node ID (e.g., "thinking", "knowledge_gap")
1055
+ model_name: The model name to use
1056
+
1057
+ Returns:
1058
+ Agent instance or None if recreation failed
1059
+ """
1060
+ try:
1061
+ from pydantic_ai.models.huggingface import HuggingFaceModel
1062
+ from pydantic_ai.providers.huggingface import HuggingFaceProvider
1063
+
1064
+ # Create model with fallback model name
1065
+ hf_provider = HuggingFaceProvider(api_key=self.oauth_token)
1066
+ model = HuggingFaceModel(model_name, provider=hf_provider)
1067
+
1068
+ # Recreate agent based on node_id
1069
+ if node_id == "thinking":
1070
+ from src.agent_factory.agents import create_thinking_agent
1071
+
1072
+ agent_wrapper = create_thinking_agent(model=model, oauth_token=self.oauth_token)
1073
+ return agent_wrapper.agent
1074
+ elif node_id == "knowledge_gap":
1075
+ from src.agent_factory.agents import create_knowledge_gap_agent
1076
+
1077
+ agent_wrapper = create_knowledge_gap_agent( # type: ignore[assignment]
1078
+ model=model, oauth_token=self.oauth_token
1079
+ )
1080
+ return agent_wrapper.agent
1081
+ elif node_id == "tool_selector":
1082
+ from src.agent_factory.agents import create_tool_selector_agent
1083
+
1084
+ agent_wrapper = create_tool_selector_agent( # type: ignore[assignment]
1085
+ model=model, oauth_token=self.oauth_token
1086
+ )
1087
+ return agent_wrapper.agent
1088
+ elif node_id == "planner":
1089
+ from src.agent_factory.agents import create_planner_agent
1090
+
1091
+ agent_wrapper = create_planner_agent(model=model, oauth_token=self.oauth_token) # type: ignore[assignment]
1092
+ return agent_wrapper.agent
1093
+ elif node_id == "writer":
1094
+ from src.agent_factory.agents import create_writer_agent
1095
+
1096
+ agent_wrapper = create_writer_agent(model=model, oauth_token=self.oauth_token) # type: ignore[assignment]
1097
+ return agent_wrapper.agent
1098
+ else:
1099
+ self.logger.warning("Unknown node_id for agent recreation", node_id=node_id)
1100
+ return None
1101
+
1102
+ except Exception as e:
1103
+ self.logger.error(
1104
+ "Failed to recreate agent with fallback model",
1105
+ node_id=node_id,
1106
+ model_name=model_name,
1107
+ error=str(e),
1108
+ )
1109
+ return None
1110
+
1111
  def _create_fallback_plan(self, query: str, input_data: Any) -> Any:
1112
  """Create fallback ReportPlan when planner fails."""
1113
  from src.utils.models import ReportPlan, ReportPlanSection
src/tools/vendored/searchxng_client.py CHANGED
@@ -94,4 +94,3 @@ class SearchXNGClient:
94
  except Exception as e:
95
  logger.error("Unexpected error in SearchXNG search", error=str(e), query=query)
96
  raise SearchError(f"SearchXNG search failed: {e}") from e
97
-
 
94
  except Exception as e:
95
  logger.error("Unexpected error in SearchXNG search", error=str(e), query=query)
96
  raise SearchError(f"SearchXNG search failed: {e}") from e
 
src/tools/vendored/serper_client.py CHANGED
@@ -90,4 +90,3 @@ class SerperClient:
90
  except Exception as e:
91
  logger.error("Unexpected error in Serper search", error=str(e), query=query)
92
  raise SearchError(f"Serper search failed: {e}") from e
93
-
 
90
  except Exception as e:
91
  logger.error("Unexpected error in Serper search", error=str(e), query=query)
92
  raise SearchError(f"Serper search failed: {e}") from e
 
src/tools/vendored/web_search_core.py CHANGED
@@ -199,4 +199,3 @@ def is_valid_url(url: str) -> bool:
199
  if any(ext in url for ext in restricted_extensions):
200
  return False
201
  return True
202
-
 
199
  if any(ext in url for ext in restricted_extensions):
200
  return False
201
  return True
 
src/utils/hf_error_handler.py CHANGED
@@ -197,4 +197,3 @@ def get_fallback_models(original_model: str | None = None) -> list[str]:
197
  fallbacks.remove(original_model)
198
 
199
  return fallbacks
200
-
 
197
  fallbacks.remove(original_model)
198
 
199
  return fallbacks
 
src/utils/markdown.css CHANGED
@@ -21,3 +21,4 @@ body {
21
 
22
 
23
 
 
 
21
 
22
 
23
 
24
+
src/utils/md_to_pdf.py CHANGED
@@ -61,4 +61,3 @@ def md_to_pdf(md_text: str, pdf_file_path: str) -> None:
61
  md2pdf(pdf_file_path, md_text, css_file_path=str(css_path))
62
 
63
  logger.debug("PDF generated successfully", pdf_path=pdf_file_path)
64
-
 
61
  md2pdf(pdf_file_path, md_text, css_file_path=str(css_path))
62
 
63
  logger.debug("PDF generated successfully", pdf_path=pdf_file_path)
 
tests/unit/middleware/test_budget_tracker_phase7.py CHANGED
@@ -167,3 +167,4 @@ class TestIterationTokenTracking:
167
 
168
 
169
 
 
 
167
 
168
 
169
 
170
+
tests/unit/middleware/test_workflow_manager.py CHANGED
@@ -293,3 +293,4 @@ class TestWorkflowManager:
293
 
294
 
295
 
 
 
293
 
294
 
295
 
296
+
tests/unit/utils/test_hf_error_handler.py CHANGED
@@ -236,3 +236,4 @@ class TestGetFallbackModels:
236
 
237
 
238
 
 
 
236
 
237
 
238
 
239
+
tests/unit/utils/test_hf_model_validator.py CHANGED
@@ -413,3 +413,4 @@ class TestValidateOAuthToken:
413
 
414
 
415
 
 
 
413
 
414
 
415
 
416
+