Enhance tool normalization and API integration across modules

- Introduced normalization functions for tool statistics and error counts to ensure consistent schema across all trajectory entries, facilitating compatibility with HuggingFace datasets.
- Updated batch processing to utilize normalized tool stats and error counts, improving data integrity.
- Refactored vision tools and mixture of agents tool to integrate with OpenRouter API, replacing Nous Research API references and updating model configurations.
- Enabled reasoning capabilities in API calls for enhanced response quality across various tools.
- Improved error handling and API key validation for OpenRouter integration.
This commit is contained in:
teknium 2026-01-14 13:40:10 +00:00
parent 66daebe88f
commit 13d360030f
6 changed files with 172 additions and 61 deletions

View file

@@ -24,9 +24,9 @@ Architecture:
2. Aggregator model synthesizes responses into a high-quality output
3. Multiple layers can be used for iterative refinement (future enhancement)
Models Used:
- Reference Models: claude-opus-4-20250514, gemini-2.5-pro, o4-mini, deepseek-r1
- Aggregator Model: claude-opus-4-20250514 (highest capability for synthesis)
Models Used (via OpenRouter):
- Reference Models: anthropic/claude-opus-4.5, google/gemini-3-pro-preview, openai/gpt-5.2-pro, deepseek/deepseek-v3.2
- Aggregator Model: anthropic/claude-opus-4.5 (highest capability for synthesis)
Configuration:
To customize the MoA setup, modify the configuration constants at the top of this file:
@@ -54,23 +54,23 @@ from pathlib import Path
from typing import Dict, Any, List, Optional
from openai import AsyncOpenAI
# Initialize Nous Research API client for MoA processing
nous_client = AsyncOpenAI(
api_key=os.getenv("NOUS_API_KEY"),
base_url="https://inference-api.nousresearch.com/v1"
# Initialize OpenRouter API client for MoA processing
openrouter_client = AsyncOpenAI(
api_key=os.getenv("OPENROUTER_API_KEY"),
base_url="https://openrouter.ai/api/v1"
)
# Configuration for MoA processing
# Reference models - these generate diverse initial responses in parallel
# Reference models - these generate diverse initial responses in parallel (OpenRouter slugs)
REFERENCE_MODELS = [
"claude-opus-4-20250514",
"gemini-2.5-pro",
"gpt-5",
"deepseek-r1"
"anthropic/claude-opus-4.5",
"google/gemini-3-pro-preview",
"openai/gpt-5.2-pro",
"deepseek/deepseek-v3.2"
]
# Aggregator model - synthesizes reference responses into final output
AGGREGATOR_MODEL = "claude-opus-4-20250514" # Use highest capability model for aggregation
AGGREGATOR_MODEL = "anthropic/claude-opus-4.5" # Use highest capability model for aggregation
# Temperature settings optimized for MoA performance
REFERENCE_TEMPERATURE = 0.6 # Balanced creativity for diverse perspectives
@@ -187,7 +187,13 @@ async def _run_reference_model_safe(
# Build parameters for the API call
api_params = {
"model": model,
"messages": [{"role": "user", "content": user_prompt}]
"messages": [{"role": "user", "content": user_prompt}],
"extra_body": {
"reasoning": {
"enabled": True,
"effort": "xhigh"
}
}
}
# GPT models (especially gpt-4o-mini) don't support custom temperature values
@@ -195,7 +201,7 @@ async def _run_reference_model_safe(
if not model.lower().startswith('gpt-'):
api_params["temperature"] = temperature
response = await nous_client.chat.completions.create(**api_params)
response = await openrouter_client.chat.completions.create(**api_params)
content = response.choices[0].message.content.strip()
print(f"{model} responded ({len(content)} characters)")
@@ -248,7 +254,13 @@ async def _run_aggregator_model(
"messages": [
{"role": "system", "content": system_prompt},
{"role": "user", "content": user_prompt}
]
],
"extra_body": {
"reasoning": {
"enabled": True,
"effort": "xhigh"
}
}
}
# GPT models (especially gpt-4o-mini) don't support custom temperature values
@@ -256,7 +268,7 @@ async def _run_aggregator_model(
if not AGGREGATOR_MODEL.lower().startswith('gpt-'):
api_params["temperature"] = temperature
response = await nous_client.chat.completions.create(**api_params)
response = await openrouter_client.chat.completions.create(**api_params)
content = response.choices[0].message.content.strip()
print(f"✅ Aggregation complete ({len(content)} characters)")
@@ -330,8 +342,8 @@ async def mixture_of_agents_tool(
print(f"📝 Query: {user_prompt[:100]}{'...' if len(user_prompt) > 100 else ''}")
# Validate API key availability
if not os.getenv("NOUS_API_KEY"):
raise ValueError("NOUS_API_KEY environment variable not set")
if not os.getenv("OPENROUTER_API_KEY"):
raise ValueError("OPENROUTER_API_KEY environment variable not set")
# Use provided models or defaults
ref_models = reference_models or REFERENCE_MODELS
@@ -439,14 +451,14 @@ async def mixture_of_agents_tool(
return json.dumps(result, indent=2, ensure_ascii=False)
def check_nous_api_key() -> bool:
def check_openrouter_api_key() -> bool:
"""
Check if the Nous Research API key is available in environment variables.
Check if the OpenRouter API key is available in environment variables.
Returns:
bool: True if API key is set, False otherwise
"""
return bool(os.getenv("NOUS_API_KEY"))
return bool(os.getenv("OPENROUTER_API_KEY"))
def check_moa_requirements() -> bool:
@@ -456,7 +468,7 @@ def check_moa_requirements() -> bool:
Returns:
bool: True if requirements are met, False otherwise
"""
return check_nous_api_key()
return check_openrouter_api_key()
def get_debug_session_info() -> Dict[str, Any]:
@@ -522,15 +534,15 @@ if __name__ == "__main__":
print("=" * 50)
# Check if API key is available
api_available = check_nous_api_key()
api_available = check_openrouter_api_key()
if not api_available:
print("NOUS_API_KEY environment variable not set")
print("Please set your API key: export NOUS_API_KEY='your-key-here'")
print("Get API key at: https://inference-api.nousresearch.com/")
print("OPENROUTER_API_KEY environment variable not set")
print("Please set your API key: export OPENROUTER_API_KEY='your-key-here'")
print("Get API key at: https://openrouter.ai/")
exit(1)
else:
print("Nous Research API key found")
print("OpenRouter API key found")
print("🛠️ MoA tools ready for use!")

View file

@@ -3,7 +3,7 @@
Vision Tools Module
This module provides vision analysis tools that work with image URLs.
Uses Gemini Flash via Nous Research API for intelligent image understanding.
Uses Gemini 3 Flash Preview via OpenRouter API for intelligent image understanding.
Available tools:
- vision_analyze_tool: Analyze images from URLs with custom prompts
@@ -38,14 +38,14 @@ from typing import Dict, Any, Optional
from openai import AsyncOpenAI
import httpx # Use httpx for async HTTP requests
# Initialize Nous Research API client for vision processing
nous_client = AsyncOpenAI(
api_key=os.getenv("NOUS_API_KEY"),
base_url="https://inference-api.nousresearch.com/v1"
# Initialize OpenRouter API client for vision processing
openrouter_client = AsyncOpenAI(
api_key=os.getenv("OPENROUTER_API_KEY"),
base_url="https://openrouter.ai/api/v1"
)
# Configuration for vision processing
DEFAULT_VISION_MODEL = "gemini-2.5-flash"
DEFAULT_VISION_MODEL = "google/gemini-3-flash-preview"
# Debug mode configuration
DEBUG_MODE = os.getenv("VISION_TOOLS_DEBUG", "false").lower() == "true"
@@ -220,7 +220,7 @@ async def vision_analyze_tool(
Analyze an image from a URL using vision AI.
This tool downloads images from URLs, converts them to base64, and processes
them using Gemini Flash via Nous Research API. The image is downloaded to a
them using Gemini 3 Flash Preview via OpenRouter API. The image is downloaded to a
temporary location and automatically cleaned up after processing.
The user_prompt parameter is expected to be pre-formatted by the calling
@@ -230,7 +230,7 @@ async def vision_analyze_tool(
Args:
image_url (str): The URL of the image to analyze (must be http:// or https://)
user_prompt (str): The pre-formatted prompt for the vision model
model (str): The vision model to use (default: gemini-2.5-flash)
model (str): The vision model to use (default: google/gemini-3-flash-preview)
Returns:
str: JSON string containing the analysis results with the following structure:
@@ -271,8 +271,8 @@ async def vision_analyze_tool(
raise ValueError("Invalid image URL format. Must start with http:// or https://")
# Check API key availability
if not os.getenv("NOUS_API_KEY"):
raise ValueError("NOUS_API_KEY environment variable not set")
if not os.getenv("OPENROUTER_API_KEY"):
raise ValueError("OPENROUTER_API_KEY environment variable not set")
# Download the image to a temporary location
print(f"⬇️ Downloading image from URL...", flush=True)
@@ -319,12 +319,18 @@ async def vision_analyze_tool(
print(f"🧠 Processing image with {model}...", flush=True)
# Call the vision API
response = await nous_client.chat.completions.create(
# Call the vision API with reasoning enabled
response = await openrouter_client.chat.completions.create(
model=model,
messages=messages,
temperature=0.1, # Low temperature for consistent analysis
max_tokens=2000 # Generous limit for detailed analysis
max_tokens=2000, # Generous limit for detailed analysis
extra_body={
"reasoning": {
"enabled": True,
"effort": "xhigh"
}
}
)
# Extract the analysis
@@ -374,14 +380,14 @@ async def vision_analyze_tool(
print(f"⚠️ Warning: Could not delete temporary file: {cleanup_error}", flush=True)
def check_nous_api_key() -> bool:
def check_openrouter_api_key() -> bool:
"""
Check if the Nous Research API key is available in environment variables.
Check if the OpenRouter API key is available in environment variables.
Returns:
bool: True if API key is set, False otherwise
"""
return bool(os.getenv("NOUS_API_KEY"))
return bool(os.getenv("OPENROUTER_API_KEY"))
def check_vision_requirements() -> bool:
@@ -391,7 +397,7 @@ def check_vision_requirements() -> bool:
Returns:
bool: True if requirements are met, False otherwise
"""
return check_nous_api_key()
return check_openrouter_api_key()
def get_debug_session_info() -> Dict[str, Any]:
@@ -425,15 +431,15 @@ if __name__ == "__main__":
print("=" * 40)
# Check if API key is available
api_available = check_nous_api_key()
api_available = check_openrouter_api_key()
if not api_available:
print("NOUS_API_KEY environment variable not set")
print("Please set your API key: export NOUS_API_KEY='your-key-here'")
print("Get API key at: https://inference-api.nousresearch.com/")
print("OPENROUTER_API_KEY environment variable not set")
print("Please set your API key: export OPENROUTER_API_KEY='your-key-here'")
print("Get API key at: https://openrouter.ai/")
exit(1)
else:
print("Nous Research API key found")
print("OpenRouter API key found")
print("🛠️ Vision tools ready for use!")
print(f"🧠 Using model: {DEFAULT_VISION_MODEL}")

View file

@@ -285,7 +285,13 @@ Create a markdown summary that captures all key information in a well-organized,
{"role": "user", "content": user_prompt}
],
temperature=0.1,
max_tokens=max_tokens
max_tokens=max_tokens,
extra_body={
"reasoning": {
"enabled": True,
"effort": "xhigh"
}
}
)
return response.choices[0].message.content.strip()
except Exception as api_error:
@@ -398,7 +404,13 @@ Create a single, unified markdown summary."""
{"role": "user", "content": synthesis_prompt}
],
temperature=0.1,
max_tokens=4000
max_tokens=4000,
extra_body={
"reasoning": {
"enabled": True,
"effort": "xhigh"
}
}
)
final_summary = response.choices[0].message.content.strip()