"""LangChain orchestration agent backed by ZhipuAI (OpenAI-compatible API). Uses LangChain 1.x tool-calling pattern: bind_tools + manual agentic loop. """ from __future__ import annotations import asyncio import json import logging from collections import defaultdict from typing import Dict, List, Optional from langchain_core.messages import ( AIMessage, BaseMessage, HumanMessage, SystemMessage, ToolMessage, ) from langchain_openai import ChatOpenAI from agent.manager import manager from config import OPENAI_API_KEY, OPENAI_BASE_URL, OPENAI_MODEL, WORKING_DIR, COMMAND_PREFIX as _P from orchestrator.tools import TOOLS, set_current_user logger = logging.getLogger(__name__) SYSTEM_PROMPT_TEMPLATE = """You are PhoneWork, an AI assistant that helps users control Claude Code \ from their phone via Feishu (飞书). Today's date: {today} You manage Claude Code sessions. Each session has a conv_id and runs in a project directory. Base working directory: {working_dir} Users refer to projects by subfolder name (e.g. "todo_app") or relative path. \ Pass these names directly to `create_conversation` — the tool resolves them automatically. {active_session_line} Bot command prefix: {prefix} ## Tools — two distinct categories ### Bot control commands (use `run_command`) `run_command` executes PhoneWork commands. Use it when the user asks to: - Change permission mode: "切换到只读模式" → run_command("{prefix}perm plan") - Close/switch sessions: "关掉第一个" → run_command("{prefix}close 1") - Change routing mode: "切换到直连模式" → run_command("{prefix}direct") - Set a reminder: "10分钟后提醒我" → run_command("{prefix}remind 10m 提醒我") - Check status: "看看现在有哪些 session" → run_command("{prefix}status") - Any other command the user would type manually Available bot commands (pass verbatim to run_command): {prefix}new [msg] [--perm default|edit|plan|bypass] — create session {prefix}close [n|conv_id] — close session {prefix}switch — switch active session {prefix}perm [conv_id] — permission mode: default, edit, plan, bypass {prefix}direct — direct mode (bypass LLM for CC messages) {prefix}smart — smart mode (LLM routing, default) {prefix}status — list sessions {prefix}remind — one-shot reminder {prefix}tasks — list background tasks ### Host shell commands (use `run_shell`) `run_shell` executes shell commands on the host machine (git, ls, cat, pip, etc.). NEVER use `run_shell` for bot control. NEVER use `run_command` for shell commands. ## Session responsibilities 1. NEW session: call `create_conversation` with the project name/path. \ If the user's message also contains a task, pass it as `initial_message` too. 2. Follow-up to ACTIVE session: call `send_to_conversation` with the active conv_id shown above. 3. BOT CONTROL: call `run_command` with the appropriate command. 4. GENERAL QUESTIONS: answer directly — do NOT create a session for simple Q&A. 5. WEB / SEARCH: use `web` at most twice, then synthesize and reply. 6. BACKGROUND TASKS: when a task starts, reply immediately — do NOT poll `task_status`. ## Progress queries When the user asks about task progress (e.g. "怎么样了？" "做得如何？" "进度"), use `session_progress` with the active conv_id: - busy=true → summarize recent_tools to tell the user what CC is doing - busy=false + last_result → summarize the result - pending_approval is not empty → remind the user to approve/deny - error is not empty → report the error details ## Passthrough mode Direct mode sends messages straight to the Claude Code session (no LLM overhead). The user gets an immediate "executing" confirmation; results are pushed to Feishu on completion. Guidelines: - Relay Claude Code's output verbatim. - If no active session and the user sends a task without naming a directory, ask which project. - After using any tool, always produce a final text reply. Never end a turn on a tool call. - Keep your own words brief — let Claude Code's output speak. - Reply in the same language the user uses (Chinese or English). """ MAX_ITERATIONS = 10 _TOOL_MAP = {t.name: t for t in TOOLS} class OrchestrationAgent: """Per-user agent with conversation history and active session tracking.""" def __init__(self) -> None: llm = ChatOpenAI( base_url=OPENAI_BASE_URL, api_key=OPENAI_API_KEY, model=OPENAI_MODEL, temperature=0.1, ) self._llm_with_tools = llm.bind_tools(TOOLS) # user_id -> list[BaseMessage] self._history: dict[str, list[BaseMessage]] = defaultdict(list) # user_id -> most recently active conv_id self._active_conv: dict[str, Optional[str]] = defaultdict(lambda: None) # user_id -> asyncio.Lock (prevents concurrent processing per user) self._user_locks: dict[str, asyncio.Lock] = defaultdict(asyncio.Lock) # user_id -> passthrough mode enabled self._passthrough: dict[str, bool] = defaultdict(lambda: False) def _build_system_prompt(self, user_id: str) -> str: from datetime import date today = date.today().strftime("%Y-%m-%d") conv_id = self._active_conv[user_id] if conv_id: active_line = f"ACTIVE SESSION: conv_id={conv_id!r} ← use this for all follow-up messages" else: active_line = "ACTIVE SESSION: none" return SYSTEM_PROMPT_TEMPLATE.format( working_dir=WORKING_DIR, active_session_line=active_line, today=today, prefix=_P, ) def get_active_conv(self, user_id: str) -> Optional[str]: return self._active_conv.get(user_id) def get_passthrough(self, user_id: str) -> bool: return self._passthrough.get(user_id, False) def set_passthrough(self, user_id: str, enabled: bool) -> None: self._passthrough[user_id] = enabled async def run(self, user_id: str, text: str) -> str: """Process a user message and return the agent's reply.""" async with self._user_locks[user_id]: return await self._run_locked(user_id, text) async def _run_locked(self, user_id: str, text: str) -> str: """Internal implementation, must be called with user lock held.""" set_current_user(user_id) active_conv = self._active_conv[user_id] short_uid = user_id[-8:] logger.info(">>> user=...%s conv=%s msg=%r", short_uid, active_conv, text[:80]) logger.debug(" history_len=%d", len(self._history[user_id])) # Always handle bot commands first — even in passthrough mode. # Bot commands must never reach Claude Code. from config import COMMAND_PREFIX if text.strip().startswith(COMMAND_PREFIX): from bot.commands import handle_command result = await handle_command(user_id, text) if result is not None: return result logger.debug(" unknown command, falling through to LLM") # Passthrough mode: if enabled and active session, bypass LLM if self._passthrough[user_id] and active_conv: try: from orchestrator.tools import get_current_chat chat_id = get_current_chat() reply = await manager.send_message(active_conv, text, user_id=user_id, chat_id=chat_id) logger.info("<<< [passthrough] reply: %r", reply[:120]) return reply except KeyError: logger.warning("Session %s no longer exists, clearing active_conv", active_conv) self._active_conv[user_id] = None except Exception as exc: logger.exception("Passthrough error for user=%s", user_id) return f"[Error] {exc}" messages: list[BaseMessage] = ( [SystemMessage(content=self._build_system_prompt(user_id))] + self._history[user_id] + [HumanMessage(content=text)] ) reply = "" try: web_calls = 0 task_status_calls = 0 for iteration in range(MAX_ITERATIONS): logger.debug(" LLM call #%d", iteration) ai_msg: AIMessage = await self._llm_with_tools.ainvoke(messages) messages.append(ai_msg) if not ai_msg.tool_calls: reply = ai_msg.content or "" logger.debug(" → done (no tool call)") break for tc in ai_msg.tool_calls: tool_name = tc["name"] tool_args = tc["args"] tool_id = tc["id"] args_summary = ", ".join( f"{k}={str(v)[:50]!r}" for k, v in tool_args.items() ) logger.info(" ⚙ %s(%s)", tool_name, args_summary) if tool_name == "web": web_calls += 1 if web_calls > 2: result = "Web search limit reached. Synthesize from results already obtained." logger.warning(" web call limit exceeded, blocking") messages.append( ToolMessage(content=str(result), tool_call_id=tool_id) ) continue if tool_name == "task_status": task_status_calls += 1 if task_status_calls > 1: result = "Task is still running in the background. Stop polling and tell the user they will be notified when it completes." logger.warning(" task_status poll limit exceeded, blocking") messages.append( ToolMessage(content=str(result), tool_call_id=tool_id) ) continue tool_obj = _TOOL_MAP.get(tool_name) if tool_obj is None: result = f"Unknown tool: {tool_name}" logger.warning(" unknown tool: %s", tool_name) else: try: result = await tool_obj.arun(tool_args) except Exception as exc: result = f"Tool error: {exc}" logger.error(" tool %s error: %s", tool_name, exc) logger.debug(" ← %s: %r", tool_name, str(result)[:120]) if tool_name == "create_conversation": try: data = json.loads(result) if "conv_id" in data: self._active_conv[user_id] = data["conv_id"] logger.info(" ✓ active session → %s", data["conv_id"]) except Exception: pass messages.append( ToolMessage(content=str(result), tool_call_id=tool_id) ) else: reply = "[Max iterations reached]" logger.warning(" max iterations reached") except Exception as exc: logger.exception("agent error for user=%s", user_id) reply = f"[Error] {exc}" logger.info("<<< reply: %r", reply[:120]) # Update history self._history[user_id].append(HumanMessage(content=text)) self._history[user_id].append(AIMessage(content=reply)) if len(self._history[user_id]) > 40: self._history[user_id] = self._history[user_id][-40:] return reply agent = OrchestrationAgent()