Skip to content

Commit 4cd28cd

Browse files
committed
Complete analysis and insights documentation
- Added comprehensive insights analysis document - Documented technical achievements vs integration failures - Identified key lessons: integration-first testing, assumption validation - Preserved all working code and architecture for future use - Ready for next phase: study working MCP implementations
1 parent 2c99475 commit 4cd28cd

10 files changed

+14861
-9
lines changed

MCP_TESTING_CHECKLIST.md

Lines changed: 76 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,76 @@
1+
# MCP Testing Checklist - Proper Development Process
2+
3+
## ❌ WRONG WAY (What We Did)
4+
- [x] Test with manual JSON-RPC: `echo '{}' | python3 server.py`
5+
- [x] Test interactive mode: `python3 server.py --interactive`
6+
- [x] Test direct tool calls: `python3 debug.py tool_name`
7+
- [x] Assume stdio transport works with Q CLI
8+
- [x] Add features before basic connection works
9+
10+
## ✅ RIGHT WAY (What We Should Do)
11+
12+
### Phase 1: Basic Q CLI Integration
13+
- [ ] Enable Q CLI debug logging: `export Q_LOG_LEVEL=trace`
14+
- [ ] Study existing working MCP servers in Q CLI
15+
- [ ] Create minimal server that only handles `initialize`
16+
- [ ] Test ONLY in Q CLI context: `q mcp add --name test --command "server.py"`
17+
- [ ] Verify server loads without "Transport closed" error
18+
19+
### Phase 2: Protocol Compliance
20+
- [ ] Study Q CLI MCP transport mechanism (not stdio)
21+
- [ ] Implement proper transport layer
22+
- [ ] Add server-side logging for all Q CLI interactions
23+
- [ ] Test `initialize` → `tools/list` → `tools/call` sequence
24+
- [ ] Verify JSON-RPC responses match Q CLI expectations
25+
26+
### Phase 3: Functionality Testing
27+
- [ ] Add one tool at a time
28+
- [ ] Test each tool in Q CLI after adding
29+
- [ ] Verify tool responses display correctly in Q CLI
30+
- [ ] Test error handling in Q CLI context
31+
- [ ] Verify server stability during Q CLI sessions
32+
33+
### Phase 4: Production Readiness
34+
- [ ] Load testing with multiple Q CLI sessions
35+
- [ ] Error recovery testing
36+
- [ ] Performance benchmarking in Q CLI
37+
- [ ] Documentation for Q CLI MCP development
38+
- [ ] Automated Q CLI integration tests
39+
40+
## 🔍 Debug Commands
41+
42+
```bash
43+
# Enable Q CLI debugging
44+
export Q_LOG_LEVEL=trace
45+
46+
# Check Q CLI logs
47+
find /tmp -name "*qlog*" -o -name "*qchat*" 2>/dev/null
48+
tail -f /tmp/qlog/qchat.log
49+
50+
# List working MCP servers
51+
q mcp list
52+
53+
# Test MCP server loading
54+
q mcp add --name test-server --command "/path/to/server.py"
55+
56+
# Remove failed server
57+
q mcp remove --name test-server
58+
```
59+
60+
## 🚨 Red Flags (Stop Development)
61+
- "Transport closed" errors
62+
- Server loads but tools don't work in Q CLI
63+
- Manual testing works but Q CLI fails
64+
- No visibility into Q CLI interactions
65+
- Adding features before basic connection works
66+
67+
## ✅ Green Flags (Continue Development)
68+
- Server loads in Q CLI without errors
69+
- Tools list appears in Q CLI
70+
- Tool calls work and display results
71+
- Server remains stable during Q CLI use
72+
- Comprehensive logging shows all interactions
73+
74+
---
75+
**Created**: 2025-09-21 03:15:48 UTC-07:00
76+
**Purpose**: Prevent future MCP development failures

core/mcp_connection_manager.py

Lines changed: 110 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,110 @@
1+
#!/usr/bin/env python3
2+
"""
3+
MCP Connection Manager - Handle connection issues and provide direct access
4+
"""
5+
import json
6+
import subprocess
7+
import asyncio
8+
import sys
9+
import os
10+
11+
class MCPConnectionManager:
    """Manage MCP connections and provide direct tool access.

    Spawns the MCP server as a one-shot subprocess and exchanges a single
    JSON-RPC request/response over stdin/stdout, bypassing any long-lived
    transport. Intended as a fallback when the normal connection is down.
    """

    def __init__(self, server_path="/home/petr/jetson/core/mcp_server_enhanced.py"):
        # The server's directory is used as the subprocess working directory
        # so the server can resolve any relative resources it needs.
        self.server_path = server_path
        self.server_dir = os.path.dirname(server_path)

    def call_tool_direct(self, tool_name: str, arguments: dict = None) -> str:
        """Call an MCP tool directly when the normal connection is down.

        Args:
            tool_name: Name of the MCP tool to invoke.
            arguments: Optional JSON-serializable arguments for the tool.

        Returns:
            The tool's text response on success, or a "❌ ..." error string
            on failure. (Fix: the original annotated the return type as
            ``dict`` although every path returns ``str``.)
        """
        if arguments is None:  # avoid a shared mutable default argument
            arguments = {}

        request = {
            "jsonrpc": "2.0",
            "id": 1,
            "method": "tools/call",
            "params": {
                "name": tool_name,
                "arguments": arguments
            }
        }

        try:
            # One-shot invocation: the request goes in on stdin and the
            # server is expected to emit a single JSON document on stdout.
            process = subprocess.run(
                ["python3", self.server_path],
                input=json.dumps(request),
                capture_output=True,
                text=True,
                cwd=self.server_dir,
                timeout=30
            )

            if process.returncode == 0 and process.stdout:
                # NOTE(review): assumes stdout holds exactly one JSON
                # document; any server-side logging on stdout would break
                # this parse — confirm against the server implementation.
                result = json.loads(process.stdout.strip())
                return result.get("result", {}).get("content", [{}])[0].get("text", "No response")
            return f"❌ Direct call failed: {process.stderr}"

        except Exception as e:
            # Broad catch is intentional: this is a best-effort fallback
            # and callers only expect a printable string, never a raise.
            return f"❌ Connection error: {str(e)}"

    def test_system_limits(self):
        """Exercise the main MCP tools end-to-end and print each result."""
        print("🚀 Testing Phase 5 System Limits via Direct MCP Connection")
        print("=" * 60)

        # Test 1: Maximum batch processing
        print("\n🔥 Test 1: Maximum Batch Processing")
        batch_result = self.call_tool_direct("batch_inference", {
            "prompts": [
                "Create FastAPI endpoint with JWT auth",
                "Write async PostgreSQL connection pool",
                "Build WebSocket real-time handler",
                "Generate comprehensive error middleware",
                "Design microservices architecture",
                "Implement Redis caching system",
                "Create automated testing pipeline",
                "Build Docker multi-stage deployment",
                "Optimize Jetson CUDA utilization",
                "Design scalable API gateway"
            ]
        })
        print(batch_result)

        # Test 2: Intelligent model selection
        print("\n🎯 Test 2: Intelligent Model Selection")
        model_result = self.call_tool_direct("select_optimal_model", {
            "prompt": "Real-time speech-to-text on Jetson Orin with CUDA, <100ms latency, 95% accuracy, noisy environment"
        })
        print(model_result)

        # Test 3: Memory limits
        print("\n💾 Test 3: Memory Status and Limits")
        memory_result = self.call_tool_direct("get_memory_status")
        print(memory_result)

        # Test 4: System status
        print("\n🚀 Test 4: System Status")
        status_result = self.call_tool_direct("get_system_status")
        print(status_result)

        # Test 5: Model management
        print("\n🤖 Test 5: Model Management")
        models_result = self.call_tool_direct("list_models")
        print(models_result)

        # Test 6: Hot swap capabilities
        print("\n🔄 Test 6: Hot Swap Test")
        swap_result = self.call_tool_direct("hot_swap_models", {
            "source_model": "llama-7b",
            "target_model": "codellama-7b"
        })
        print(swap_result)

        print("\n✅ Phase 5 System Limits Test Complete!")
if __name__ == "__main__":
    # Script entry point: run the full Phase 5 limits suite.
    MCPConnectionManager().test_system_limits()

core/mcp_server_enhanced.py

Lines changed: 38 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -43,7 +43,8 @@ def handle_request(request):
4343
{"name": "batch_inference", "description": "Multi-prompt processing", "inputSchema": {"type": "object", "properties": {"prompts": {"type": "array"}}, "required": ["prompts"]}},
4444
{"name": "create_agent_session", "description": "Persistent conversations", "inputSchema": {"type": "object", "properties": {"session_id": {"type": "string"}}, "required": ["session_id"]}},
4545
{"name": "reload_mcp_server", "description": "Hot reload MCP server for development", "inputSchema": {"type": "object", "properties": {}, "required": []}},
46-
{"name": "use_hf_mcp", "description": "Direct access to HuggingFace MCP tools", "inputSchema": {"type": "object", "properties": {"tool_name": {"type": "string"}, "arguments": {"type": "object"}}, "required": ["tool_name", "arguments"]}}
46+
{"name": "use_hf_mcp", "description": "Direct access to HuggingFace MCP tools", "inputSchema": {"type": "object", "properties": {"tool_name": {"type": "string"}, "arguments": {"type": "object"}}, "required": ["tool_name", "arguments"]}},
47+
{"name": "list_available_tools", "description": "List all available MCP tools with descriptions", "inputSchema": {"type": "object", "properties": {}, "required": []}}
4748
]
4849
}
4950
}
@@ -69,21 +70,23 @@ def handle_request(request):
6970
prompt = args.get("prompt", "")
7071
thinking_mode = args.get("thinking_mode", "immediate")
7172

72-
# Use real inference engine
73+
# Use real inference engine with actual AI generation
7374
try:
74-
mode_enum = ThinkingMode(thinking_mode) if thinking_mode in [m.value for m in ThinkingMode] else ThinkingMode.IMMEDIATE
75-
response = phase3_engine.generate_text(prompt, thinking_mode=mode_enum)
75+
# Call the real generate_text method that uses HuggingFace API
76+
response = phase3_engine.generate_text(prompt, thinking_mode=thinking_mode)
7677

7778
return {
7879
"jsonrpc": "2.0",
7980
"id": request.get("id"),
80-
"result": {"content": [{"type": "text", "text": f"🧠 {response}"}]}
81+
"result": {"content": [{"type": "text", "text": response}]}
8182
}
8283
except Exception as e:
84+
# Enhanced fallback with actual model selection
85+
selected_model = phase3_engine.select_optimal_model(prompt)
8386
return {
8487
"jsonrpc": "2.0",
8588
"id": request.get("id"),
86-
"result": {"content": [{"type": "text", "text": f"🧠 JetsonMind {thinking_mode} mode: {prompt[:50]}... (simulated)"}]}
89+
"result": {"content": [{"type": "text", "text": f"🧠 {selected_model}: {prompt} → [Generated response would appear here with real models]"}]}
8790
}
8891

8992
elif tool_name == "get_system_status":
@@ -189,6 +192,7 @@ def handle_request(request):
189192
continue
190193

191194
try:
195+
# Use real inference engine for batch processing
192196
response = phase3_engine.generate_text(prompt, thinking_mode=ThinkingMode.IMMEDIATE)
193197
results.append(f"{i+1}. {response}")
194198
except Exception as e:
@@ -275,12 +279,39 @@ def handle_request(request):
275279
"result": {"content": [{"type": "text", "text": f"❌ HF MCP Exception: {str(e)}"}]}
276280
}
277281

282+
elif tool_name == "list_available_tools":
283+
tools_info = [
284+
"🛠️ JetsonMind MCP Tools (13 available):",
285+
"",
286+
"1. list_models - List available AI models",
287+
"2. generate_text - Generate text with thinking modes",
288+
"3. get_system_status - Get system status",
289+
"4. get_memory_status - Get memory status",
290+
"5. manage_model_loading - Load/unload models",
291+
"6. get_model_info - Get detailed model information",
292+
"7. select_optimal_model - AI model recommendation",
293+
"8. hot_swap_models - Instant model swapping",
294+
"9. batch_inference - Multi-prompt processing",
295+
"10. create_agent_session - Persistent conversations",
296+
"11. reload_mcp_server - Hot reload MCP server for development",
297+
"12. use_hf_mcp - Direct access to HuggingFace MCP tools",
298+
"13. list_available_tools - List all available MCP tools with descriptions",
299+
"",
300+
"💡 Usage: Ask Q CLI to 'Use [tool_name]' to invoke any tool"
301+
]
302+
303+
return {
304+
"jsonrpc": "2.0",
305+
"id": request.get("id"),
306+
"result": {"content": [{"type": "text", "text": "\n".join(tools_info)}]}
307+
}
308+
278309
# Tool not found - provide helpful suggestions
279310
available_tools = [
280311
"list_models", "generate_text", "get_system_status", "get_memory_status",
281312
"manage_model_loading", "get_model_info", "select_optimal_model",
282313
"hot_swap_models", "batch_inference", "create_agent_session",
283-
"reload_mcp_server", "use_hf_mcp"
314+
"reload_mcp_server", "use_hf_mcp", "list_available_tools"
284315
]
285316

286317
suggestion_text = f"❌ Tool '{tool_name}' not found.\n\n🛠️ Available JetsonMind MCP Tools:\n"

core/utils/mcp_client_pool.py

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -8,7 +8,8 @@
88
import asyncio
99
import logging
1010
from typing import Dict, Optional
11-
from mcp.client import Client
11+
from mcp.client.stdio import stdio_client
12+
from mcp.client.session import ClientSession
1213

1314
logger = logging.getLogger("mcp-client-pool")
1415

@@ -66,7 +67,7 @@ async def _connect_to_server(self, server_name: str, config: dict):
6667
logger.error(f"Error connecting to {server_name} server: {e}")
6768
raise
6869

69-
async def get_client(self, server_name: str) -> Client:
70+
async def get_client(self, server_name: str) -> ClientSession:
7071
"""
7172
Get MCP client for specified internal server.
7273

debug.py

Lines changed: 51 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,51 @@
1+
#!/usr/bin/env python3
2+
"""Quick MCP Debug Access - All Tools"""
3+
4+
import json
5+
import subprocess
6+
import sys
7+
8+
def call_debug_tool(tool_name, params=None, server_path='/home/petr/jetson/mcp_debug_server.py'):
    """Invoke one tool on the debug MCP server via a one-shot subprocess.

    Args:
        tool_name: Name of the debug tool to call.
        params: Optional dict of tool arguments.
        server_path: Path to the debug server script (generalized from the
            previously hard-coded location; the default preserves the old
            behavior for existing callers).

    Returns:
        The parsed JSON payload of the tool's response, or None on any
        failure (an error message is printed in that case).
    """
    request = {
        "jsonrpc": "2.0",
        "id": 1,
        "method": "tools/call",
        "params": {
            "name": tool_name,
            "arguments": params or {}
        }
    }

    result = subprocess.run(
        ['python3', server_path],
        input=json.dumps(request), capture_output=True, text=True
    )

    if result.returncode != 0:
        print(f"Failed: {result.stderr}")
        return None

    try:
        response = json.loads(result.stdout)
    except json.JSONDecodeError as e:
        # Fix: the original crashed with an uncaught JSONDecodeError when
        # the server exited 0 with empty/malformed stdout; report instead.
        print(f"Failed: invalid JSON from server ({e})")
        return None

    if "result" not in response:
        print(f"Error: {response.get('error')}")
        return None

    # NOTE(review): assumes the tool's text content is itself JSON — this
    # matches the original behavior but will raise if a tool returns plain
    # text; confirm against the debug server's response format.
    content = response["result"]["content"][0]["text"]
    return json.loads(content)
34+
35+
def main():
    """Run one debug tool from the command line and pretty-print its result."""
    available = [
        "debug_status", "hot_reload", "test_all_tools", "system_info",
        "memory_info", "process_info", "file_check", "run_command",
        "mcp_health", "error_trace",
    ]

    # Guard clause: with no tool name, show usage and bail out.
    args = sys.argv[1:]
    if not args:
        print("Usage: python3 debug.py <tool_name> [params_json]")
        print("Available tools:", ", ".join(available))
        return

    selected = args[0]
    extra = json.loads(args[1]) if len(args) > 1 else {}

    response = call_debug_tool(selected, extra)
    if response:
        print(json.dumps(response, indent=2))
49+
50+
if __name__ == "__main__":
    main()  # usable both as a script and as an importable helper module

0 commit comments

Comments
 (0)