
Feat: Add agent worker And Claude Support #66


Closed
wants to merge 34 commits
Commits
a1422dc
Feat: Add agent-worker
baryhuang Mar 30, 2025
88f6354
update config
baryhuang Mar 31, 2025
786ea96
add shutdown for agent_worker
baryhuang Mar 31, 2025
3db1830
cleanup
baryhuang Mar 31, 2025
bd9a232
add anthropic path
baryhuang Mar 31, 2025
f81653e
cleanup
baryhuang Mar 31, 2025
74206e0
cleanup
baryhuang Mar 31, 2025
4636082
cleanup
baryhuang Mar 31, 2025
e9756dc
cleanup
baryhuang Mar 31, 2025
e06429e
add support for returning images
baryhuang Apr 3, 2025
fd68e9d
add
baryhuang Apr 3, 2025
853771e
cleanup
baryhuang Apr 3, 2025
72ade83
cleanup
baryhuang Apr 3, 2025
76c4780
fix passing of system prompt
baryhuang Apr 3, 2025
6b75133
cleanup
baryhuang Apr 3, 2025
0424e87
cleanup
baryhuang Apr 3, 2025
a8e6e77
initial cleanup of file structure
baryhuang Apr 4, 2025
531698b
initial cleanup of openai vs claude
baryhuang Apr 4, 2025
36fdc10
break handlers into files
baryhuang Apr 4, 2025
8d9296f
cleanup anthropic handler to break down long loop
baryhuang Apr 4, 2025
79c88db
update to use non-beta anthropic api
baryhuang Apr 4, 2025
3390d01
cleanup anthropic chat completion and cleanup
baryhuang Apr 4, 2025
d47aaf8
enabled thinking support for Claude
baryhuang Apr 4, 2025
20ac56a
added basic thinking support for Claude
baryhuang Apr 4, 2025
3617411
add customer logger
baryhuang Apr 4, 2025
59b1c03
Update mcp_bridge/agent_worker/run.py
baryhuang Apr 4, 2025
1d7c771
add script entrypoint for agent runner
SecretiveShell Apr 4, 2025
8df7ab0
add more logs and fix the process tool loop with thinking blocks
baryhuang Apr 5, 2025
62029a6
switch to use Claude beta api with latest computer-use
baryhuang Apr 5, 2025
9669d40
added support for calling AWS Bedrock
baryhuang Apr 6, 2025
99d1dda
cleanup logggin
baryhuang Apr 6, 2025
b4ada00
add rate limit handling
baryhuang Apr 6, 2025
a1c6d42
re organized imports and typing
baryhuang Apr 6, 2025
f77af61
Update mcp_bridge/anthropic_clients/genericClient.py
baryhuang Apr 6, 2025
9 changes: 8 additions & 1 deletion .gitignore
@@ -165,4 +165,11 @@ cython_debug/
## custom
commands.md
compose.yml
config.json
config.json

screenshots/*
.DS_Store

.cursor
agent_worker_task.json
logs
7 changes: 7 additions & 0 deletions agent_worker_task.json.example
@@ -0,0 +1,7 @@
{
  "task": "Hi Olivia, tell me what's on your computer screen. You should include a response of 'the task has been completed' when the task is complete. Don't ask for what to do next.",
  "model": "claude-3-7-sonnet-20250219",
  "system_prompt": "You should include a response of 'the task has been completed' when the task is complete.\n\n You should include a response of 'the task has been completed' when you found yourself stuck in a loop with no progress.",
  "verbose": true,
  "max_iterations": 10
}
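
For orientation, a minimal sketch of how a task file in this shape could drive the AgentWorker defined in the next file. The constructor arguments mirror agent_worker.py below; the loading code itself is illustrative and is not the PR's actual entrypoint (mcp_bridge/agent_worker/run.py, which is not shown in this diff), and the verbose flag is ignored here.

# Illustrative only: load the example task file and run the worker.
# The real entrypoint added by this PR (mcp_bridge/agent_worker/run.py) is not
# shown here; only the AgentWorker API from agent_worker.py below is assumed.
import asyncio
import json

from mcp_bridge.agent_worker.agent_worker import AgentWorker

async def main() -> None:
    with open("agent_worker_task.json") as f:
        config = json.load(f)

    worker = AgentWorker(
        task=config["task"],
        model=config["model"],
        system_prompt=config.get("system_prompt"),
        max_iterations=config.get("max_iterations", 10),
    )
    try:
        await worker.run_agent_loop()
    finally:
        # Note: shutdown() as written below calls force_exit(0), which ends the process.
        await worker.shutdown()

if __name__ == "__main__":
    asyncio.run(main())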
168 changes: 168 additions & 0 deletions mcp_bridge/agent_worker/agent_worker.py
@@ -0,0 +1,168 @@
#!/usr/bin/env python
"""Agent worker module that provides standalone command-line agent execution"""

import asyncio
import os
from typing import Dict, List, Optional, Tuple

from loguru import logger

from mcp_bridge.agent_worker.utils import is_anthropic_model
from mcp_bridge.agent_worker.anthropic_handler import process_with_anthropic
from mcp_bridge.agent_worker.openai_handler import process_with_openai
from mcp_bridge.agent_worker.customer_logs import get_logger, CustomerMessageLogger
from mcp_bridge.mcp_clients.McpClientManager import ClientManager
from mcp_bridge.utils import force_exit
from lmos_openai_types import (
    ChatCompletionRequestMessage,
    ChatCompletionRequestSystemMessage,
    ChatCompletionRequestUserMessage,
)

class AgentWorker:
    """A standalone worker that processes tasks using MCP clients and LLM completions"""

    def __init__(
        self,
        task: str,
        model: str = "anthropic.claude-3-haiku-20240307-v1:0",
        system_prompt: Optional[str] = None,
        max_iterations: int = 10,
        session_id: Optional[str] = None,
    ):
        self.task = task
        self.model = model
        self.system_prompt = system_prompt or "You are a helpful assistant that completes tasks using available tools. Use the tools provided to you to help complete the user's task."
        self.messages: List[ChatCompletionRequestMessage] = []
        self.max_iterations = max_iterations
        self.thinking_blocks: List[Dict[str, object]] = []
        self.session_id = session_id
        # Initialize customer message logger
        self.customer_logger: CustomerMessageLogger = get_logger(initialize=True, session_id=self.session_id)
        self.customer_logger.log_system_event("initialization", {
            "task": task,
            "model": model,
            "max_iterations": max_iterations
        })

    async def initialize(self) -> None:
        """Initialize the MCP clients"""
        logger.info("Initializing MCP clients...")
        # Start the ClientManager to load all available MCP clients
        await ClientManager.initialize()

        # Wait a moment for clients to start up
        logger.info("Waiting for MCP clients to initialize...")
        await asyncio.sleep(2)

        # Check that at least one client is ready
        max_attempts = 3
        for attempt in range(max_attempts):
            clients = ClientManager.get_clients()
            ready_clients = [name for name, client in clients if client.session is not None]

            if ready_clients:
                logger.info(f"MCP clients ready: {', '.join(ready_clients)}")
                # Log available clients to customer log
                self.customer_logger.log_system_event("clients_ready", {
                    "clients": ready_clients
                })
                break

            logger.warning(f"No MCP clients ready yet, waiting (attempt {attempt+1}/{max_attempts})...")
            await asyncio.sleep(2)

        # Initialize the conversation with system and user messages
        self.messages = [
            ChatCompletionRequestSystemMessage(
                role="system",
                content=self.system_prompt
            ),
            ChatCompletionRequestUserMessage(
                role="user",
                content=self.task
            )
        ]

        # Log initial messages to customer log
        self.customer_logger.log_message("system", self.system_prompt)
        self.customer_logger.log_message("user", self.task)

    async def shutdown(self) -> None:
        """Shutdown all MCP clients"""
        logger.info("Shutting down MCP clients...")
        # Log shutdown event
        self.customer_logger.log_system_event("shutdown", {
            "summary": self.customer_logger.get_summary()
        })
        # Exit the program
        force_exit(0)

Comment on lines +98 to +100

Copilot AI Apr 10, 2025


Using force_exit here immediately terminates the process, which may bypass important cleanup steps; consider implementing a more graceful shutdown mechanism.

Suggested change
-        # Exit the program
-        force_exit(0)
+        # Stop the event loop
+        loop = asyncio.get_event_loop()
+        loop.stop()
+        loop.close()

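A cooperative alternative to both force_exit and stopping the event loop from inside a running coroutine might look roughly like the sketch below: finish client cleanup, cancel leftover tasks, and let the caller's asyncio.run() tear the loop down once run_agent_loop() returns. This is only a sketch, not part of the PR; ClientManager's cleanup API is not shown in this diff, so that step is left as a hypothetical placeholder comment.

    async def shutdown(self) -> None:
        """Sketch of a cooperative shutdown (illustrative; assumes the caller owns the event loop)"""
        logger.info("Shutting down MCP clients...")
        self.customer_logger.log_system_event("shutdown", {
            "summary": self.customer_logger.get_summary()
        })
        # Hypothetical: if ClientManager exposes an async cleanup method, await it here
        # (e.g. `await ClientManager.shutdown()`) instead of terminating the process.
        # Cancel any remaining background tasks so the caller's asyncio.run() can
        # close the loop cleanly after run_agent_loop() returns.
        for pending in asyncio.all_tasks():
            if pending is not asyncio.current_task():
                pending.cancel()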

    async def run_agent_loop(self) -> List[ChatCompletionRequestMessage]:
        """Run the agent loop to process the task until completion"""
        await self.initialize()
        logger.info("Starting agent loop...")
        self.customer_logger.log_system_event("agent_loop_start", {})

        # Keep running until the task is complete
        for iteration in range(self.max_iterations):
            logger.info(f"Agent iteration {iteration+1}/{self.max_iterations}")
            self.customer_logger.log_system_event("iteration_start", {
                "iteration": iteration + 1,
                "max_iterations": self.max_iterations
            })

            # Process with either Anthropic or OpenAI API based on model name
            task_complete = False
            if is_anthropic_model(self.model):
                # Use Anthropic processing
                _, updated_messages, thinking_blocks, task_complete = await process_with_anthropic(
                    messages=self.messages,
                    model=self.model,
                    system_prompt=self.system_prompt,
                    thinking_blocks=self.thinking_blocks,
                    customer_logger=self.customer_logger
                )
                self.messages = updated_messages

                # Check for duplicate thinking blocks before adding
                # Thinking blocks are dicts whose "signature" value is used for deduplication
                existing_signatures = {block.get("signature") for block in self.thinking_blocks
                                       if block.get("signature")}
                unique_blocks = [block for block in thinking_blocks
                                 if not block.get("signature") or block.get("signature") not in existing_signatures]
                self.thinking_blocks.extend(unique_blocks)

                # Log thinking blocks to customer log
                for block in unique_blocks:
                    if block.get("thinking"):
                        self.customer_logger.log_thinking(
                            block["thinking"],
                            block.get("signature")
                        )
            else:
                # Use OpenAI processing
                updated_messages, task_complete = await process_with_openai(
                    messages=self.messages,
                    model=self.model,
                    customer_logger=self.customer_logger
                )
                self.messages = updated_messages

            # If task is complete, return the messages
            if task_complete:
                self.customer_logger.log_system_event("task_complete", {
                    "iteration": iteration + 1,
                    "summary": self.customer_logger.get_summary()
                })
                return self.messages

        # If we reached max iterations without completion
        logger.warning(f"Reached maximum iterations ({self.max_iterations}) without task completion")
        self.customer_logger.log_system_event("max_iterations_reached", {
            "max_iterations": self.max_iterations,
            "summary": self.customer_logger.get_summary()
        })

        # Return final messages for inspection
        return self.messages
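
The handler modules imported at the top of this file (anthropic_handler.py and openai_handler.py) are not included in this hunk. From the call sites in run_agent_loop above, their interfaces appear to be roughly the stubs below; the shapes are inferred from usage, and the name of the ignored first element returned by process_with_anthropic is a guess.

# Inferred interface sketch, not copied from the PR: signatures reconstructed from
# how the handlers are called in run_agent_loop().
from typing import Dict, List, Tuple

from lmos_openai_types import ChatCompletionRequestMessage
from mcp_bridge.agent_worker.customer_logs import CustomerMessageLogger

async def process_with_anthropic(
    messages: List[ChatCompletionRequestMessage],
    model: str,
    system_prompt: str,
    thinking_blocks: List[Dict[str, object]],
    customer_logger: CustomerMessageLogger,
) -> Tuple[object, List[ChatCompletionRequestMessage], List[Dict[str, object]], bool]:
    """Returns (raw_response, updated_messages, new_thinking_blocks, task_complete)."""
    ...

async def process_with_openai(
    messages: List[ChatCompletionRequestMessage],
    model: str,
    customer_logger: CustomerMessageLogger,
) -> Tuple[List[ChatCompletionRequestMessage], bool]:
    """Returns (updated_messages, task_complete)."""
    ...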