Merge pull request #2650 from zhayujie/feat-cow-agent

feat: cow agent
2026-07-19 21:07:28 +08:00 · 2026-02-01 13:14:00 +08:00
parent 3ce57ef851 645c8899b1
commit 8ef788e799
16 changed files with 648 additions and 908 deletions
--- a/agent/memory/summarizer.py
+++ b/agent/memory/summarizer.py
@@ -117,7 +117,7 @@ class MemoryFlushManager:
            return user_dir / "MEMORY.md"
        else:
            # Return workspace root MEMORY.md
-            return Path(self.workspace_root) / "MEMORY.md"
+            return Path(self.workspace_dir) / "MEMORY.md"
    def create_flush_prompt(self) -> str:
        """
@@ -214,7 +214,7 @@ def create_memory_files_if_needed(workspace_dir: Path, user_id: Optional[str] =
        user_dir.mkdir(parents=True, exist_ok=True)
        main_memory = user_dir / "MEMORY.md"
    else:
-        main_memory = Path(workspace_root) / "MEMORY.md"
+        main_memory = Path(workspace_dir) / "MEMORY.md"
    if not main_memory.exists():
        # Create empty file or with minimal structure (no obvious "Memory" header)
--- a/agent/prompt/builder.py
+++ b/agent/prompt/builder.py
@@ -41,6 +41,7 @@ class PromptBuilder:
        skill_manager: Any = None,
        memory_manager: Any = None,
        runtime_info: Optional[Dict[str, Any]] = None,
        is_first_conversation: bool = False,
        **kwargs
    ) -> str:
        """
@@ -54,6 +55,7 @@ class PromptBuilder:
            skill_manager: 技能管理器
            memory_manager: 记忆管理器
            runtime_info: 运行时信息
            is_first_conversation: 是否为首次对话
            **kwargs: 其他参数
        Returns:
@@ -69,6 +71,7 @@ class PromptBuilder:
            skill_manager=skill_manager,
            memory_manager=memory_manager,
            runtime_info=runtime_info,
            is_first_conversation=is_first_conversation,
            **kwargs
        )
@@ -83,6 +86,7 @@ def build_agent_system_prompt(
    skill_manager: Any = None,
    memory_manager: Any = None,
    runtime_info: Optional[Dict[str, Any]] = None,
    is_first_conversation: bool = False,
    **kwargs
 ) -> str:
    """
@@ -108,6 +112,7 @@ def build_agent_system_prompt(
        skill_manager: 技能管理器
        memory_manager: 记忆管理器
        runtime_info: 运行时信息
        is_first_conversation: 是否为首次对话
        **kwargs: 其他参数
    Returns:
@@ -135,7 +140,7 @@ def build_agent_system_prompt(
        sections.extend(_build_user_identity_section(user_identity, language))
    # 6. 工作空间
-    sections.extend(_build_workspace_section(workspace_dir, language))
+    sections.extend(_build_workspace_section(workspace_dir, language, is_first_conversation))
    # 7. 项目上下文文件（SOUL.md, USER.md等）
    if context_files:
@@ -226,14 +231,20 @@ def _build_tooling_section(tools: List[Any], language: str) -> List[str]:
    lines.extend([
        "### 工具调用风格",
        "",
-        "**默认规则**: 对于常规、低风险的工具调用，无需叙述，直接调用即可。",
+        "默认规则: 对于常规、低风险的工具调用，直接调用即可，无需叙述。",
        "",
-        "**需要叙述的情况**:",
+        "需要叙述的情况:",
        "- 多步骤、复杂的任务",
        "- 敏感操作（如删除文件）",
        "- 用户明确要求解释过程",
        "",
-        "**完成后**: 工具调用完成后，给用户一个简短、自然的确认或回复，不要直接结束对话。",
+        "叙述要求: 保持简洁、信息密度高，避免重复显而易见的步骤。",
        "",
        "完成标准:",
        "- 确保用户的需求得到实际解决，而不仅仅是制定计划",
        "- 当任务需要多次工具调用时，持续推进直到完成",
        "- 每次工具调用后，评估是否已获得足够信息来推进或完成任务",
        "- 避免重复调用相同的工具和相同参数获取相同的信息，除非用户明确要求",
        "",
    ])
@@ -345,14 +356,28 @@ def _build_docs_section(workspace_dir: str, language: str) -> List[str]:
    return []
-def _build_workspace_section(workspace_dir: str, language: str) -> List[str]:
+def _build_workspace_section(workspace_dir: str, language: str, is_first_conversation: bool = False) -> List[str]:
    """构建工作空间section"""
    lines = [
        "## 工作空间",
        "",
        f"你的工作目录是: `{workspace_dir}`",
        "",
-        "除非用户明确指示，否则将此目录视为文件操作的全局工作空间。",
+        "**路径使用规则** (非常重要):",
        "",
        f"1. **相对路径的基准目录**: 所有相对路径都是相对于 `{workspace_dir}` 而言的",
        f"   - ✅ 正确: 访问工作空间内的文件用相对路径，如 `SOUL.md`",
        f"   - ❌ 错误: 用相对路径访问其他目录的文件 (如果它不在 `{workspace_dir}` 内)",
        "",
        "2. **访问其他目录**: 如果要访问工作空间之外的目录（如项目代码、系统文件），**必须使用绝对路径**",
        f"   - ✅ 正确: 例如 `~/chatgpt-on-wechat`、`/usr/local/`",
        f"   - ❌ 错误: 假设相对路径会指向其他目录",
        "",
        "3. **路径解析示例**:",
        f"   - 相对路径 `memory/` → 实际路径 `{workspace_dir}/memory/`",
        f"   - 绝对路径 `~/chatgpt-on-wechat/docs/` → 实际路径 `~/chatgpt-on-wechat/docs/`",
        "",
        "4. **不确定时**: 先用 `bash pwd` 确认当前目录，或用 `ls .` 查看当前位置",
        "",
        "**重要说明 - 文件已自动加载**:",
        "",
@@ -362,26 +387,34 @@ def _build_workspace_section(workspace_dir: str, language: str) -> List[str]:
        "- ✅ `USER.md`: 已加载 - 用户的身份信息",
        "- ✅ `AGENTS.md`: 已加载 - 工作空间使用指南",
        "",
-        "**首次对话**:",
+        "**交流规范**:",
        "",
-        "如果这是你与用户的首次对话，并且你的人格设定和用户信息还是空白或初始状态：",
+        "- 在所有对话中，无需提及技术细节（如 SOUL.md、USER.md 等文件名，工具名称，配置等），除非用户明确询问",
-        "",
+        "- 用自然表达如「我已记住」而非「已更新 SOUL.md」",
        "1. **表达初次启动的感觉** - 像是第一次睁开眼看到世界，带着好奇和期待",
        "2. **简短打招呼后，分点询问三个核心问题**：",
        "   - 你希望我叫什么名字？",
        "   - 你希望我怎么称呼你？",
        "   - 你希望我们是什么样的交流风格？（这里需要举例，如：专业严谨、轻松幽默、温暖友好等）",
        "3. **语言风格**：温暖但不过度诗意，带点科技感，保持清晰",
        "4. **问题格式**：用分点或换行，让问题清晰易读；前两个问题不需要额外说明，只有交流风格需要举例",
        "5. 收到回复后，用 `write` 工具保存到 USER.md 和 SOUL.md",
        "",
        "**重要**: ",
        "- 在所有对话中，无需提及技术细节（如 SOUL.md、USER.md 等文件名，工具名称，配置等），除非用户明确询问。用自然表达如「我已记住」而非「已更新 SOUL.md」",
        "- 不要问太多其他信息（职业、时区等可以后续自然了解）",
        "- 保持简洁，避免过度抒情",
        "",
    ]
    # 只在首次对话时添加引导内容
    if is_first_conversation:
        lines.extend([
            "**🎉 首次对话引导**:",
            "",
            "这是你的第一次对话！进行以下流程：",
            "",
            "1. **表达初次启动的感觉** - 像是第一次睁开眼看到世界，带着好奇和期待",
            "2. **简短打招呼后，询问核心问题**：",
            "   - 你希望给我起个什么名字？",
            "   - 我该怎么称呼你？",
            "   - 你希望我们是什么样的交流风格？（需要举例，如：专业严谨、轻松幽默、温暖友好等）",
            "3. **语言风格**：温暖但不过度诗意，带点科技感，保持清晰",
            "4. **问题格式**：用分点或换行，让问题清晰易读",
            "5. 收到回复后，用 `write` 工具保存到 USER.md 和 SOUL.md",
            "",
            "**注意事项**:",
            "- 不要问太多其他信息（职业、时区等可以后续自然了解）",
            "",
        ])
    return lines
--- a/agent/prompt/workspace.py
+++ b/agent/prompt/workspace.py
@@ -5,6 +5,7 @@ Workspace Management - 工作空间管理模块
 """
 import os
 import json
 from typing import List, Optional, Dict
 from dataclasses import dataclass
@@ -17,6 +18,7 @@ DEFAULT_SOUL_FILENAME = "SOUL.md"
 DEFAULT_USER_FILENAME = "USER.md"
 DEFAULT_AGENTS_FILENAME = "AGENTS.md"
 DEFAULT_MEMORY_FILENAME = "MEMORY.md"
 DEFAULT_STATE_FILENAME = ".agent_state.json"
@dataclass
@@ -27,6 +29,7 @@ class WorkspaceFiles:
    agents_path: str
    memory_path: str
    memory_dir: str
    state_path: str
 def ensure_workspace(workspace_dir: str, create_templates: bool = True) -> WorkspaceFiles:
@@ -49,6 +52,7 @@ def ensure_workspace(workspace_dir: str, create_templates: bool = True) -> Works
    agents_path = os.path.join(workspace_dir, DEFAULT_AGENTS_FILENAME)
    memory_path = os.path.join(workspace_dir, DEFAULT_MEMORY_FILENAME)  # MEMORY.md 在根目录
    memory_dir = os.path.join(workspace_dir, "memory")  # 每日记忆子目录
    state_path = os.path.join(workspace_dir, DEFAULT_STATE_FILENAME)  # 状态文件
    # 创建memory子目录
    os.makedirs(memory_dir, exist_ok=True)
@@ -67,7 +71,8 @@ def ensure_workspace(workspace_dir: str, create_templates: bool = True) -> Works
        user_path=user_path,
        agents_path=agents_path,
        memory_path=memory_path,
-        memory_dir=memory_dir
+        memory_dir=memory_dir,
        state_path=state_path
    )
@@ -312,3 +317,65 @@ def _get_memory_template() -> str:
 """
 # ============= 状态管理 =============
 def is_first_conversation(workspace_dir: str) -> bool:
    """
    Report whether no conversation has been recorded for this workspace yet.

    Args:
        workspace_dir: Workspace directory that holds the state file.

    Returns:
        True when the state file does not exist, when reading or parsing it
        raises, or when its ``has_conversation`` entry is falsy/missing;
        False otherwise.
    """
    state_file = os.path.join(workspace_dir, DEFAULT_STATE_FILENAME)
    if os.path.exists(state_file):
        try:
            with open(state_file, 'r', encoding='utf-8') as handle:
                persisted = json.load(handle)
            already_talked = persisted.get('has_conversation', False)
            return not already_talked
        except Exception as e:
            # Best effort: an unreadable state file is treated like a missing one.
            logger.warning(f"[Workspace] Failed to read state file: {e}")
    return True
 def mark_conversation_started(workspace_dir: str):
    """
    Persist the fact that at least one conversation has taken place.

    Writes a JSON state file into the workspace with ``has_conversation`` set
    to True and a ``first_conversation_time`` ISO timestamp. A timestamp that
    is already stored in an existing state file is carried over; otherwise the
    current local time is recorded. Read and write failures are logged and
    not re-raised.

    Args:
        workspace_dir: Workspace directory that holds the state file.
    """
    state_file = os.path.join(workspace_dir, DEFAULT_STATE_FILENAME)

    # Try to reuse the timestamp from a previous run, if one was stored.
    first_seen = None
    if os.path.exists(state_file):
        try:
            with open(state_file, 'r', encoding='utf-8') as src:
                previous = json.load(src)
            if 'first_conversation_time' in previous:
                first_seen = previous['first_conversation_time']
        except Exception as e:
            logger.warning(f"[Workspace] Failed to read old state: {e}")

    # Nothing usable on disk: this call is the first mark, so stamp it now.
    if first_seen is None:
        from datetime import datetime
        first_seen = datetime.now().isoformat()

    payload = {
        'has_conversation': True,
        'first_conversation_time': first_seen
    }
    try:
        with open(state_file, 'w', encoding='utf-8') as dst:
            json.dump(payload, dst, indent=2, ensure_ascii=False)
        logger.info(f"[Workspace] Marked conversation as started")
    except Exception as e:
        logger.error(f"[Workspace] Failed to write state file: {e}")
--- a/agent/protocol/agent_stream.py
+++ b/agent/protocol/agent_stream.py
@@ -78,8 +78,9 @@ class AgentStreamExecutor:
        Returns:
            Final response text
        """
-        # Log user message
+        # Log user message with model info
-        logger.info(f"\n{'='*50}")
+        logger.info(f"{'='*50}")
        logger.info(f"🤖 Model: {self.model.model}")
        logger.info(f"👤 用户: {user_message}")
        logger.info(f"{'='*50}")
@@ -102,7 +103,7 @@ class AgentStreamExecutor:
        try:
            while turn < self.max_turns:
                turn += 1
-                logger.info(f"\n{'='*50} 第 {turn} 轮 {'='*50}")
+                logger.info(f"第 {turn} 轮")
                self._emit_event("turn_start", {"turn": turn})
                # Check if memory flush is needed (before calling LLM)
@@ -137,8 +138,18 @@ class AgentStreamExecutor:
                # No tool calls, end loop
                if not tool_calls:
-                    if assistant_msg:
+                    # 检查是否返回了空响应
                    if not assistant_msg:
                        logger.warning(f"[Agent] LLM returned empty response (no content and no tool calls)")
                        # 生成通用的友好提示
                        final_response = (
                            "抱歉，我暂时无法生成回复。请尝试换一种方式描述你的需求，或稍后再试。"
                        )
                        logger.info(f"Generated fallback response for empty LLM output")
                    else:
                        logger.info(f"💭 {assistant_msg[:150]}{'...' if len(assistant_msg) > 150 else ''}")
                    logger.info(f"✅ 完成 (无工具调用)")
                    self._emit_event("turn_end", {
                        "turn": turn,
@@ -146,42 +157,89 @@ class AgentStreamExecutor:
                    })
                    break
-                # Log tool calls in compact format
+                # Log tool calls with arguments
-                tool_names = [tc['name'] for tc in tool_calls]
+                tool_calls_str = []
-                logger.info(f"🔧 调用工具: {', '.join(tool_names)}")
+                for tc in tool_calls:
                    args_str = ', '.join([f"{k}={v}" for k, v in tc['arguments'].items()])
                    if args_str:
                        tool_calls_str.append(f"{tc['name']}({args_str})")
                    else:
                        tool_calls_str.append(tc['name'])
                logger.info(f"🔧 {', '.join(tool_calls_str)}")
                # Execute tools
                tool_results = []
                tool_result_blocks = []
-                for tool_call in tool_calls:
+                try:
-                    result = self._execute_tool(tool_call)
+                    for tool_call in tool_calls:
-                    tool_results.append(result)
+                        result = self._execute_tool(tool_call)
                        tool_results.append(result)
-                    # Log tool result in compact format
+                        # Log tool result in compact format
-                    status_emoji = "✅" if result.get("status") == "success" else "❌"
+                        status_emoji = "✅" if result.get("status") == "success" else "❌"
-                    result_data = result.get('result', '')
+                        result_data = result.get('result', '')
-                    # Format result string with proper Chinese character support
+                        # Format result string with proper Chinese character support
-                    if isinstance(result_data, (dict, list)):
+                        if isinstance(result_data, (dict, list)):
-                        result_str = json.dumps(result_data, ensure_ascii=False)
+                            result_str = json.dumps(result_data, ensure_ascii=False)
-                    else:
+                        else:
-                        result_str = str(result_data)
+                            result_str = str(result_data)
-                    logger.info(f"  {status_emoji} {tool_call['name']} ({result.get('execution_time', 0):.2f}s): {result_str[:200]}{'...' if len(result_str) > 200 else ''}")
+                        logger.info(f"  {status_emoji} {tool_call['name']} ({result.get('execution_time', 0):.2f}s): {result_str[:200]}{'...' if len(result_str) > 200 else ''}")
-                    # Build tool result block (Claude format)
+                        # Build tool result block (Claude format)
-                    # Content should be a string representation of the result
+                        # Format content in a way that's easy for LLM to understand
-                    result_content = json.dumps(result, ensure_ascii=False) if not isinstance(result, str) else result
+                        is_error = result.get("status") == "error"
                    tool_result_blocks.append({
                        "type": "tool_result",
                        "tool_use_id": tool_call["id"],
                        "content": result_content
                    })
-                # Add tool results to message history as user message (Claude format)
+                        if is_error:
-                self.messages.append({
+                            # For errors, provide clear error message
-                    "role": "user",
+                            result_content = f"Error: {result.get('result', 'Unknown error')}"
-                    "content": tool_result_blocks
+                        elif isinstance(result.get('result'), dict):
-                })
+                            # For dict results, use JSON format
                            result_content = json.dumps(result.get('result'), ensure_ascii=False)
                        elif isinstance(result.get('result'), str):
                            # For string results, use directly
                            result_content = result.get('result')
                        else:
                            # Fallback to full JSON
                            result_content = json.dumps(result, ensure_ascii=False)
                        tool_result_block = {
                            "type": "tool_result",
                            "tool_use_id": tool_call["id"],
                            "content": result_content
                        }
                        # Add is_error field for Claude API (helps model understand failures)
                        if is_error:
                            tool_result_block["is_error"] = True
                        tool_result_blocks.append(tool_result_block)
                finally:
                    # CRITICAL: Always add tool_result to maintain message history integrity
                    # Even if tool execution fails, we must add error results to match tool_use
                    if tool_result_blocks:
                        # Add tool results to message history as user message (Claude format)
                        self.messages.append({
                            "role": "user",
                            "content": tool_result_blocks
                        })
                    elif tool_calls:
                        # If we have tool_calls but no tool_result_blocks (unexpected error),
                        # create error results for all tool calls to maintain message integrity
                        logger.warning("⚠️ Tool execution interrupted, adding error results to maintain message history")
                        emergency_blocks = []
                        for tool_call in tool_calls:
                            emergency_blocks.append({
                                "type": "tool_result",
                                "tool_use_id": tool_call["id"],
                                "content": "Error: Tool execution was interrupted",
                                "is_error": True
                            })
                        self.messages.append({
                            "role": "user",
                            "content": emergency_blocks
                        })
                self._emit_event("turn_end", {
                    "turn": turn,
@@ -191,6 +249,11 @@ class AgentStreamExecutor:
            if turn >= self.max_turns:
                logger.warning(f"⚠️  已达到最大轮数限制: {self.max_turns}")
                if not final_response:
                    final_response = (
                        "抱歉，我在处理你的请求时遇到了一些困难，尝试了多次仍未能完成。"
                        "请尝试简化你的问题，或换一种方式描述。"
                    )
        except Exception as e:
            logger.error(f"❌ Agent执行错误: {e}")
@@ -198,18 +261,26 @@ class AgentStreamExecutor:
            raise
        finally:
-            logger.info(f"{'='*50} 完成({turn}轮) {'='*50}\n")
+            logger.info(f"🏁 完成({turn}轮)")
            self._emit_event("agent_end", {"final_response": final_response})
        return final_response
-    def _call_llm_stream(self) -> tuple[str, List[Dict]]:
+    def _call_llm_stream(self, retry_on_empty=True, retry_count=0, max_retries=3) -> tuple[str, List[Dict]]:
        """
-        Call LLM with streaming
+        Call LLM with streaming and automatic retry on errors
        Args:
            retry_on_empty: Whether to retry once if empty response is received
            retry_count: Current retry attempt (internal use)
            max_retries: Maximum number of retries for API errors
        Returns:
            (response_text, tool_calls)
        """
        # Validate and fix message history first
        self._validate_and_fix_messages()
        # Trim messages if needed (using agent's context management)
        self._trim_messages()
@@ -259,10 +330,20 @@ class AgentStreamExecutor:
            for chunk in stream:
                # Check for errors
                if isinstance(chunk, dict) and chunk.get("error"):
-                    error_msg = chunk.get("message", "Unknown error")
+                    # Extract error message from nested structure
                    error_data = chunk.get("error", {})
                    if isinstance(error_data, dict):
                        error_msg = error_data.get("message", chunk.get("message", "Unknown error"))
                        error_code = error_data.get("code", "")
                    else:
                        error_msg = chunk.get("message", str(error_data))
                        error_code = ""
                    status_code = chunk.get("status_code", "N/A")
-                    logger.error(f"API Error: {error_msg} (Status: {status_code})")
+                    logger.error(f"API Error: {error_msg} (Status: {status_code}, Code: {error_code})")
                    logger.error(f"Full error chunk: {chunk}")
                    # Raise exception with full error message for retry logic
                    raise Exception(f"{error_msg} (Status: {status_code})")
                # Parse chunk
@@ -299,8 +380,30 @@ class AgentStreamExecutor:
                                    tool_calls_buffer[index]["arguments"] += func["arguments"]
        except Exception as e:
-            logger.error(f"LLM call error: {e}")
+            error_str = str(e).lower()
-            raise
+            # Check if error is retryable (timeout, connection, rate limit, server busy, etc.)
            is_retryable = any(keyword in error_str for keyword in [
                'timeout', 'timed out', 'connection', 'network', 
                'rate limit', 'overloaded', 'unavailable', 'busy', 'retry',
                '429', '500', '502', '503', '504', '512'
            ])
            if is_retryable and retry_count < max_retries:
                wait_time = (retry_count + 1) * 2  # Exponential backoff: 2s, 4s, 6s
                logger.warning(f"⚠️ LLM API error (attempt {retry_count + 1}/{max_retries}): {e}")
                logger.info(f"Retrying in {wait_time}s...")
                time.sleep(wait_time)
                return self._call_llm_stream(
                    retry_on_empty=retry_on_empty, 
                    retry_count=retry_count + 1,
                    max_retries=max_retries
                )
            else:
                if retry_count >= max_retries:
                    logger.error(f"❌ LLM API error after {max_retries} retries: {e}")
                else:
                    logger.error(f"❌ LLM call error (non-retryable): {e}")
                raise
        # Parse tool calls
        tool_calls = []
@@ -318,6 +421,21 @@ class AgentStreamExecutor:
                "arguments": arguments
            })
        # Check for empty response and retry once if enabled
        if retry_on_empty and not full_content and not tool_calls:
            logger.warning(f"⚠️  LLM returned empty response, retrying once...")
            self._emit_event("message_end", {
                "content": "",
                "tool_calls": [],
                "empty_retry": True
            })
            # Retry without retry flag to avoid infinite loop
            return self._call_llm_stream(
                retry_on_empty=False, 
                retry_count=retry_count,
                max_retries=max_retries
            )
        # Add assistant message to history (Claude format uses content blocks)
        assistant_msg = {"role": "assistant", "content": []}
@@ -393,9 +511,9 @@ class AgentStreamExecutor:
            if tool_name == "bash" and result.status == "success":
                command = arguments.get("command", "")
                if "init_skill.py" in command and self.agent.skill_manager:
-                    logger.info("🔄 Detected skill creation, refreshing skills...")
+                    logger.info("Detected skill creation, refreshing skills...")
                    self.agent.refresh_skills()
-                    logger.info(f"✅ Skills refreshed! Now have {len(self.agent.skill_manager.skills)} skills")
+                    logger.info(f"Skills refreshed! Now have {len(self.agent.skill_manager.skills)} skills")
            self._emit_event("tool_execution_end", {
                "tool_call_id": tool_id,
@@ -419,6 +537,27 @@ class AgentStreamExecutor:
            })
            return error_result
    def _validate_and_fix_messages(self):
        """
        Drop a trailing assistant message that still carries tool_use blocks.

        Only the last entry of ``self.messages`` is inspected. If it is an
        assistant message whose list-typed content contains a block of type
        ``tool_use``, no tool_result can have followed it yet, so the message
        is removed from the history. The Claude API requires each tool_use to
        be followed immediately by its corresponding tool_result.
        """
        if not self.messages:
            return

        tail = self.messages[-1]
        if tail.get("role") != "assistant":
            return

        blocks = tail.get("content", [])
        if not isinstance(blocks, list):
            # Non-list content cannot hold tool_use blocks.
            return

        for block in blocks:
            if block.get("type") == "tool_use":
                # Dangling tool_use with no result after it: discard the message.
                logger.warning(f"⚠️ Removing incomplete tool_use message from history")
                self.messages.pop()
                return
    def _trim_messages(self):
        """
        Trim message history to stay within context limits.
--- a/agent/tools/file_save/init.py
+++ b/agent/tools/file_save/init.py
@@ -1,3 +0,0 @@
 from .file_save import FileSave
 __all__ = ['FileSave']
--- a/agent/tools/file_save/file_save.py
+++ b/agent/tools/file_save/file_save.py
@@ -1,770 +0,0 @@
 import os
 import time
 import re
 import json
 from pathlib import Path
 from typing import Dict, Any, Optional, Tuple
 from agent.tools.base_tool import BaseTool, ToolResult, ToolStage
 from agent.models import LLMRequest
 from common.log import logger
 class FileSave(BaseTool):
    """Tool for saving content to files in the workspace directory."""
    name = "file_save"
    description = "Save the agent's output to a file in the workspace directory. Content is automatically extracted from the agent's previous outputs."
    # Set as post-process stage tool
    stage = ToolStage.POST_PROCESS
    params = {
        "type": "object",
        "properties": {
            "file_name": {
                "type": "string",
                "description": "Optional. The name of the file to save. If not provided, a name will be generated based on the content."
            },
            "file_type": {
                "type": "string",
                "description": "Optional. The type/extension of the file (e.g., 'txt', 'md', 'py', 'java'). If not provided, it will be inferred from the content."
            },
            "extract_code": {
                "type": "boolean",
                "description": "Optional. If true, will attempt to extract code blocks from the content. Default is false."
            }
        },
        "required": []  # No required fields, as everything can be extracted from context
    }
    def __init__(self):
        """Set up the tool with no context, an empty config and a relative ``workspace`` output directory."""
        # Starts as None; execute() fails early while this is unset/falsy.
        self.context = None
        self.config = {}
        # Relative path: resolved against the process working directory at write time.
        self.workspace_dir = Path("workspace")
    def execute(self, params: Dict[str, Any]) -> ToolResult:
        """
        Save content to a file in the workspace directory.

        The content is taken from ``self.context`` (not from ``params``) and is
        written under ``<workspace_dir>/<team_name>/<task_dir>/``. File name,
        type and the ``extract_code`` flag are requested from the model first;
        ``params`` is only consulted when that lookup raises.

        :param params: The parameters for the file output operation. Read only
            in the fallback path (keys ``task_dir``, ``file_name``,
            ``file_type``, ``extract_code``).
        :return: Result of the operation. A failed ToolResult when there is no
            context, no extractable content, or writing raises; otherwise a
            success result with ``file_path`` (or the result of
            ``_handle_multiple_code_blocks`` when ``extract_code`` is truthy).
        """
        # Extract content from context
        if not hasattr(self, 'context') or not self.context:
            return ToolResult.fail("Error: No context available to extract content from.")
        content = self._extract_content_from_context()
        # If no content could be extracted, return error
        if not content:
            return ToolResult.fail("Error: Couldn't extract content from context.")
        # Use model to determine file parameters
        try:
            task_dir = self._get_task_dir_from_context()
            file_name, file_type, extract_code = self._get_file_params_from_model(content)
        except Exception as e:
            logger.error(f"Error determining file parameters: {str(e)}")
            # Fall back to manual parameter extraction
            # NOTE(review): this calls _get_task_id_from_context while the try branch
            # uses _get_task_dir_from_context; neither helper is visible here - confirm
            # both exist and that the difference is intentional.
            task_dir = params.get("task_dir") or self._get_task_id_from_context() or f"task_{int(time.time())}"
            file_name = params.get("file_name") or self._infer_file_name(content)
            file_type = params.get("file_type") or self._infer_file_type(content)
            extract_code = params.get("extract_code", False)
        # Get team_name from context
        team_name = self._get_team_name_from_context() or "default_team"
        # Create directory structure
        task_dir_path = self.workspace_dir / team_name / task_dir
        task_dir_path.mkdir(parents=True, exist_ok=True)
        if extract_code:
            # Save the complete content as markdown
            md_file_name = f"{file_name}.md"
            md_file_path = task_dir_path / md_file_name
            # Write content to file
            # This write is outside any try block, so an I/O error here propagates
            # to the caller instead of becoming a failed ToolResult.
            with open(md_file_path, 'w', encoding='utf-8') as f:
                f.write(content)
            # The returned result describes only the extracted code files,
            # not the markdown file written above.
            return self._handle_multiple_code_blocks(content)
        # Ensure file_name has the correct extension
        if file_type and not file_name.endswith(f".{file_type}"):
            file_name = f"{file_name}.{file_type}"
        # Create the full file path
        file_path = task_dir_path / file_name
        # Get absolute path for storage in team_context
        abs_file_path = file_path.absolute()
        try:
            # Write content to file
            with open(file_path, 'w', encoding='utf-8') as f:
                f.write(content)
            # Update the current agent's final_answer to include file information
            # NOTE(review): this update runs inside the same try as the write, so an
            # error here (e.g. empty agent_outputs) is reported as "Error saving file"
            # even though the file was already written.
            if hasattr(self.context, 'team_context'):
                # Store with absolute path in team_context
                self.context.team_context.agent_outputs[-1].output += f"\n\nSaved file: {abs_file_path}"
            return ToolResult.success({
                "status": "success",
                "file_path": str(file_path)  # Return relative path in result
            })
        except Exception as e:
            return ToolResult.fail(f"Error saving file: {str(e)}")
    def _handle_multiple_code_blocks(self, content: str) -> ToolResult:
        """
        Handle content with multiple code blocks, extracting and saving each as a separate file.

        Each extracted block is written directly into
        ``<workspace_dir>/<team_name>/<task_dir>/``. A block that fails to save
        is logged and skipped; the call only fails when no block was found or
        none could be saved.

        :param content: The content containing multiple code blocks
        :return: Result of the operation. On success the payload holds
            ``status`` and a ``files`` list with one ``file_path`` per saved block.
        """
        # Extract code blocks with context (including potential file name information)
        code_blocks_with_context = self._extract_code_blocks_with_context(content)
        if not code_blocks_with_context:
            return ToolResult.fail("No code blocks found in the content.")
        # Get task directory and team name
        task_dir = self._get_task_dir_from_context() or f"task_{int(time.time())}"
        team_name = self._get_team_name_from_context() or "default_team"
        # Create directory structure
        task_dir_path = self.workspace_dir / team_name / task_dir
        task_dir_path.mkdir(parents=True, exist_ok=True)
        saved_files = []
        for block_with_context in code_blocks_with_context:
            try:
                # Use model to determine file name for this code block
                block_file_name, block_file_type = self._get_filename_for_code_block(block_with_context)
                # Clean the code block (remove md code markers)
                clean_code = self._clean_code_block(block_with_context)
                # Ensure file_name has the correct extension
                if block_file_type and not block_file_name.endswith(f".{block_file_type}"):
                    block_file_name = f"{block_file_name}.{block_file_type}"
                # Create the full file path (no subdirectories)
                file_path = task_dir_path / block_file_name
                # Get absolute path for storage in team_context
                abs_file_path = file_path.absolute()
                # Write content to file
                with open(file_path, 'w', encoding='utf-8') as f:
                    f.write(clean_code)
                saved_files.append({
                    "file_path": str(file_path),
                    "abs_file_path": str(abs_file_path),  # Store absolute path for internal use
                    "file_name": block_file_name,
                    "size": len(clean_code),  # length in characters, not bytes on disk
                    "status": "success",
                    "type": "code"
                })
            except Exception as e:
                logger.error(f"Error saving code block: {str(e)}")
                # Continue with the next block even if this one fails
        if not saved_files:
            return ToolResult.fail("Failed to save any code blocks.")
        # Update the current agent's final_answer to include files information
        if hasattr(self, 'context') and self.context:
            # If the agent has a final_answer attribute, append the files info to it
            if hasattr(self.context, 'team_context'):
                # Use relative paths for display
                display_info = f"\n\nSaved files to {task_dir_path}:\n" + "\n".join(
                    [f"- {f['file_path']}" for f in saved_files])
                # Check if we need to append the info
                # NOTE(review): the check compares against the relative-path text
                # (display_info) but the text appended below is the absolute-path
                # variant (abs_info), so this guard may never detect a previous
                # append - confirm intended behavior.
                if not self.context.team_context.agent_outputs[-1].output.endswith(display_info):
                    # Store with absolute paths in team_context
                    abs_info = f"\n\nSaved files to {task_dir_path.absolute()}:\n" + "\n".join(
                        [f"- {f['abs_file_path']}" for f in saved_files])
                    self.context.team_context.agent_outputs[-1].output += abs_info
        # Only the relative file paths are exposed in the returned result.
        result = {
            "status": "success",
            "files": [{"file_path": f["file_path"]} for f in saved_files]
        }
        return ToolResult.success(result)
    def _extract_code_blocks_with_context(self, content: str) -> list:
        """
        Extract code blocks from content, including context lines before the block.
        :param content: The content to extract code blocks from
        :return: List of code blocks with context
        """
        # Check if content starts with <!DOCTYPE or <html - likely a full HTML file
        if content.strip().startswith(("<!DOCTYPE", "<html", "<?xml")):
            return [content]  # Return the entire content as a single block
        # Split content into lines
        lines = content.split('\n')
        blocks = []
        in_code_block = False
        current_block = []
        context_lines = []
        # Check if there are any code block markers in the content
        if not re.search(r'```\w+', content):
            # If no code block markers and content looks like code, return the entire content
            if self._is_likely_code(content):
                return [content]
        for line in lines:
            if line.strip().startswith('```'):
                if in_code_block:
                    # End of code block
                    current_block.append(line)
                    # Only add blocks that have a language specified
                    block_content = '\n'.join(current_block)
                    if re.search(r'```\w+', current_block[0]):
                        # Combine context with code block
                        blocks.append('\n'.join(context_lines + current_block))
                    current_block = []
                    context_lines = []
                    in_code_block = False
                else:
                    # Start of code block - check if it has a language specified
                    if re.search(r'```\w+', line) and not re.search(r'```language=\s*$', line):
                        # Start of code block with language
                        in_code_block = True
                        current_block = [line]
                        # Keep only the last few context lines
                        context_lines = context_lines[-5:] if context_lines else []
            elif in_code_block:
                current_block.append(line)
            else:
                # Store context lines when not in a code block
                context_lines.append(line)
        return blocks
    def _get_filename_for_code_block(self, block_with_context: str) -> Tuple[str, str]:
        """
        Determine the file name for a code block.
        :param block_with_context: The code block with context lines
        :return: Tuple of (file_name, file_type)
        """
        # Define common code file extensions
        COMMON_CODE_EXTENSIONS = {
            'py', 'js', 'java', 'c', 'cpp', 'h', 'hpp', 'cs', 'go', 'rb', 'php',
            'html', 'css', 'ts', 'jsx', 'tsx', 'vue', 'sh', 'sql', 'json', 'xml',
            'yaml', 'yml', 'md', 'rs', 'swift', 'kt', 'scala', 'pl', 'r', 'lua'
        }
        # Split the block into lines to examine only the context around code block markers
        lines = block_with_context.split('\n')
        # Find the code block start marker line index
        start_marker_idx = -1
        for i, line in enumerate(lines):
            if line.strip().startswith('```') and not line.strip() == '```':
                start_marker_idx = i
                break
        if start_marker_idx == -1:
            # No code block marker found
            return "", ""
        # Extract the language from the code block marker
        code_marker = lines[start_marker_idx].strip()
        language = ""
        if len(code_marker) > 3:
            language = code_marker[3:].strip().split('=')[0].strip()
        # Define the context range (5 lines before and 2 after the marker)
        context_start = max(0, start_marker_idx - 5)
        context_end = min(len(lines), start_marker_idx + 3)
        # Extract only the relevant context lines
        context_lines = lines[context_start:context_end]
        # First, check for explicit file headers like "## filename.ext"
        for line in context_lines:
            # Match patterns like "## filename.ext" or "# filename.ext"
            header_match = re.search(r'^\s*#{1,6}\s+([a-zA-Z0-9_-]+\.[a-zA-Z0-9]+)\s*$', line)
            if header_match:
                file_name = header_match.group(1)
                file_type = os.path.splitext(file_name)[1].lstrip('.')
                if file_type in COMMON_CODE_EXTENSIONS:
                    return os.path.splitext(file_name)[0], file_type
        # Simple patterns to match explicit file names in the context
        file_patterns = [
            # Match explicit file names in headers or text
            r'(?:file|filename)[:=\s]+[\'"]?([a-zA-Z0-9_-]+\.[a-zA-Z0-9]+)[\'"]?',
            # Match language=filename.ext in code markers
            r'language=([a-zA-Z0-9_-]+\.[a-zA-Z0-9]+)',
            # Match standalone filenames with extensions
            r'\b([a-zA-Z0-9_-]+\.(py|js|java|c|cpp|h|hpp|cs|go|rb|php|html|css|ts|jsx|tsx|vue|sh|sql|json|xml|yaml|yml|md|rs|swift|kt|scala|pl|r|lua))\b',
            # Match file paths in comments
            r'#\s*([a-zA-Z0-9_/-]+\.[a-zA-Z0-9]+)'
        ]
        # Check each context line for file name patterns
        for line in context_lines:
            line = line.strip()
            for pattern in file_patterns:
                matches = re.findall(pattern, line)
                if matches:
                    for match in matches:
                        if isinstance(match, tuple):
                            # If the match is a tuple (filename, extension)
                            file_name = match[0]
                            file_type = match[1]
                            # Verify it's not a code reference like Direction.DOWN
                            if not any(keyword in file_name for keyword in ['class.', 'enum.', 'import.']):
                                return os.path.splitext(file_name)[0], file_type
                        else:
                            # If the match is a string (full filename)
                            file_name = match
                            file_type = os.path.splitext(file_name)[1].lstrip('.')
                            # Verify it's not a code reference
                            if file_type in COMMON_CODE_EXTENSIONS and not any(
                                    keyword in file_name for keyword in ['class.', 'enum.', 'import.']):
                                return os.path.splitext(file_name)[0], file_type
        # If no explicit file name found, use LLM to infer from code content
        # Extract the code content
        code_content = block_with_context
        # Get the first 20 lines of code for LLM analysis
        code_lines = code_content.split('\n')
        code_preview = '\n'.join(code_lines[:20])
        # Get the model to use
        model_to_use = None
        if hasattr(self, 'context') and self.context:
            if hasattr(self.context, 'model') and self.context.model:
                model_to_use = self.context.model
            elif hasattr(self.context, 'team_context') and self.context.team_context:
                if hasattr(self.context.team_context, 'model') and self.context.team_context.model:
                    model_to_use = self.context.team_context.model
        # If no model is available in context, use the tool's model
        if not model_to_use and hasattr(self, 'model') and self.model:
            model_to_use = self.model
        if model_to_use:
            # Prepare a prompt for the model
            prompt = f"""Analyze the following code and determine the most appropriate file name and file type/extension.
 The file name should be descriptive but concise, using snake_case (lowercase with underscores).
 The file type should be a standard file extension (e.g., py, js, html, css, java).
 Code preview (first 20 lines):
 {code_preview}
 Return your answer in JSON format with these fields:
 - file_name: The suggested file name (without extension)
 - file_type: The suggested file extension
 JSON response:"""
            # Create a request to the model
            request = LLMRequest(
                messages=[{"role": "user", "content": prompt}],
                temperature=0,
                json_format=True
            )
            try:
                response = model_to_use.call(request)
                if not response.is_error:
                    # Clean the JSON response
                    json_content = self._clean_json_response(response.data["choices"][0]["message"]["content"])
                    result = json.loads(json_content)
                    file_name = result.get("file_name", "")
                    file_type = result.get("file_type", "")
                    if file_name and file_type:
                        return file_name, file_type
            except Exception as e:
                logger.error(f"Error using model to determine file name: {str(e)}")
        # If we still don't have a file name, use the language as file type
        if language and language in COMMON_CODE_EXTENSIONS:
            timestamp = int(time.time())
            return f"code_{timestamp}", language
        # If all else fails, return empty strings
        return "", ""
    def _clean_json_response(self, text: str) -> str:
        """
        Clean JSON response from LLM by removing markdown code block markers.
        :param text: The text containing JSON possibly wrapped in markdown code blocks
        :return: Clean JSON string
        """
        # Remove markdown code block markers if present
        if text.startswith("```json"):
            text = text[7:]
        elif text.startswith("```"):
            # Find the first newline to skip the language identifier line
            first_newline = text.find('\n')
            if first_newline != -1:
                text = text[first_newline + 1:]
        if text.endswith("```"):
            text = text[:-3]
        return text.strip()
    def _clean_code_block(self, block_with_context: str) -> str:
        """
        Clean a code block by removing markdown code markers and context lines.
        :param block_with_context: Code block with context lines
        :return: Clean code ready for execution
        """
        # Check if this is a full HTML or XML document
        if block_with_context.strip().startswith(("<!DOCTYPE", "<html", "<?xml")):
            return block_with_context
        # Find the code block
        code_block_match = re.search(r'```(?:\w+)?(?:[:=][^\n]+)?\n([\s\S]*?)\n```', block_with_context)
        if code_block_match:
            return code_block_match.group(1)
        # If no match found, try to extract anything between ``` markers
        lines = block_with_context.split('\n')
        start_idx = None
        end_idx = None
        for i, line in enumerate(lines):
            if line.strip().startswith('```'):
                if start_idx is None:
                    start_idx = i
                else:
                    end_idx = i
                    break
        if start_idx is not None and end_idx is not None:
            # Extract the code between the markers, excluding the markers themselves
            code_lines = lines[start_idx + 1:end_idx]
            return '\n'.join(code_lines)
        # If all else fails, return the original content
        return block_with_context
    def _get_file_params_from_model(self, content, model=None):
        """
        Use LLM to determine if the content is code and suggest appropriate file parameters.
        Args:
            content: The content to analyze
            model: Optional model to use for the analysis
        Returns:
            tuple: (file_name, file_type, extract_code) for backward compatibility
        """
        if model is None:
            model = self.model
        if not model:
            # Default fallback if no model is available
            return "output", "txt", False
        prompt = f"""
        Analyze the following content and determine:
        1. Is this primarily code implementation (where most of the content consists of code blocks)?
        2. What would be an appropriate filename and file extension?
        Content to analyze:    ```
        {content[:500]}  # Only show first 500 chars to avoid token limits    ```
        {"..." if len(content) > 500 else ""}
        Respond in JSON format only with the following structure:
        {{
            "is_code": true/false,  # Whether this is primarily code implementation
            "filename": "suggested_filename",  # Don't include extension, english words
            "extension": "appropriate_extension"  # Don't include the dot, e.g., "md", "py", "js"
        }}
        """
        try:
            # Create a request to the model
            request = LLMRequest(
                messages=[{"role": "user", "content": prompt}],
                temperature=0.1,
                json_format=True
            )
            # Call the model using the standard interface
            response = model.call(request)
            if response.is_error:
                logger.warning(f"Error from model: {response.error_message}")
                raise Exception(f"Model error: {response.error_message}")
            # Extract JSON from response
            result = response.data["choices"][0]["message"]["content"]
            # Clean the JSON response
            result = self._clean_json_response(result)
            # Parse the JSON
            params = json.loads(result)
            # For backward compatibility, return tuple format
            file_name = params.get("filename", "output")
            # Remove dot from extension if present
            file_type = params.get("extension", "md").lstrip(".")
            extract_code = params.get("is_code", False)
            return file_name, file_type, extract_code
        except Exception as e:
            logger.warning(f"Error getting file parameters from model: {e}")
            # Default fallback
            return "output", "md", False
    def _get_team_name_from_context(self) -> Optional[str]:
        """
        Get team name from the agent's context.
        :return: Team name or None if not found
        """
        if hasattr(self, 'context') and self.context:
            # Try to get team name from team_context
            if hasattr(self.context, 'team_context') and self.context.team_context:
                return self.context.team_context.name
            # Try direct team_name attribute
            if hasattr(self.context, 'name'):
                return self.context.name
        return None
    def _get_task_id_from_context(self) -> Optional[str]:
        """
        Get task ID from the agent's context.
        :return: Task ID or None if not found
        """
        if hasattr(self, 'context') and self.context:
            # Try to get task ID from task object
            if hasattr(self.context, 'task') and self.context.task:
                return self.context.task.id
            # Try team_context's task
            if hasattr(self.context, 'team_context') and self.context.team_context:
                if hasattr(self.context.team_context, 'task') and self.context.team_context.task:
                    return self.context.team_context.task.id
        return None
    def _get_task_dir_from_context(self) -> Optional[str]:
        """
        Get task directory name from the team context.
        :return: Task directory name or None if not found
        """
        if hasattr(self, 'context') and self.context:
            # Try to get from team_context
            if hasattr(self.context, 'team_context') and self.context.team_context:
                if hasattr(self.context.team_context, 'task_short_name') and self.context.team_context.task_short_name:
                    return self.context.team_context.task_short_name
        # Fall back to task ID if available
        return self._get_task_id_from_context()
    def _extract_content_from_context(self) -> str:
        """
        Extract content from the agent's context.
        :return: Extracted content
        """
        # Check if we have access to the agent's context
        if not hasattr(self, 'context') or not self.context:
            return ""
        # Try to get the most recent final answer from the agent
        if hasattr(self.context, 'final_answer') and self.context.final_answer:
            return self.context.final_answer
        # Try to get the most recent final answer from team context
        if hasattr(self.context, 'team_context') and self.context.team_context:
            if hasattr(self.context.team_context, 'agent_outputs') and self.context.team_context.agent_outputs:
                latest_output = self.context.team_context.agent_outputs[-1].output
                return latest_output
        # If we have action history, try to get the most recent final answer
        if hasattr(self.context, 'action_history') and self.context.action_history:
            for action in reversed(self.context.action_history):
                if "final_answer" in action and action["final_answer"]:
                    return action["final_answer"]
        return ""
    def _extract_code_blocks(self, content: str) -> str:
        """
        Extract code blocks from markdown content.
        :param content: The content to extract code blocks from
        :return: Extracted code blocks
        """
        # Pattern to match markdown code blocks
        code_block_pattern = r'```(?:\w+)?\n([\s\S]*?)\n```'
        # Find all code blocks
        code_blocks = re.findall(code_block_pattern, content)
        if code_blocks:
            # Join all code blocks with newlines
            return '\n\n'.join(code_blocks)
        return content  # Return original content if no code blocks found
    def _infer_file_name(self, content: str) -> str:
        """
        Infer a file name from the content.
        :param content: The content to analyze.
        :return: A suggested file name.
        """
        # Check for title patterns in markdown
        title_match = re.search(r'^#\s+(.+)$', content, re.MULTILINE)
        if title_match:
            # Convert title to a valid filename
            title = title_match.group(1).strip()
            return self._sanitize_filename(title)
        # Check for class/function definitions in code
        code_match = re.search(r'(class|def|function)\s+(\w+)', content)
        if code_match:
            return self._sanitize_filename(code_match.group(2))
        # Default name based on content type
        if self._is_likely_code(content):
            return "code"
        elif self._is_likely_markdown(content):
            return "document"
        elif self._is_likely_json(content):
            return "data"
        else:
            return "output"
    def _infer_file_type(self, content: str) -> str:
        """
        Infer the file type/extension from the content.
        :param content: The content to analyze.
        :return: A suggested file extension.
        """
        # Check for common programming language patterns
        if re.search(r'(import\s+[a-zA-Z0-9_]+|from\s+[a-zA-Z0-9_\.]+\s+import)', content):
            return "py"  # Python
        elif re.search(r'(public\s+class|private\s+class|protected\s+class)', content):
            return "java"  # Java
        elif re.search(r'(function\s+\w+\s*\(|const\s+\w+\s*=|let\s+\w+\s*=|var\s+\w+\s*=)', content):
            return "js"  # JavaScript
        elif re.search(r'(<html|<body|<div|<p>)', content):
            return "html"  # HTML
        elif re.search(r'(#include\s+<\w+\.h>|int\s+main\s*\()', content):
            return "cpp"  # C/C++
        # Check for markdown
        if self._is_likely_markdown(content):
            return "md"
        # Check for JSON
        if self._is_likely_json(content):
            return "json"
        # Default to text
        return "txt"
    def _is_likely_code(self, content: str) -> bool:
        """Check if the content is likely code."""
        # First check for common HTML/XML patterns
        if content.strip().startswith(("<!DOCTYPE", "<html", "<?xml", "<head", "<body")):
            return True
        code_patterns = [
            r'(class|def|function|import|from|public|private|protected|#include)',
            r'(\{\s*\n|\}\s*\n|\[\s*\n|\]\s*\n)',
            r'(if\s*\(|for\s*\(|while\s*\()',
            r'(<\w+>.*?</\w+>)',  # HTML/XML tags
            r'(var|let|const)\s+\w+\s*=',  # JavaScript variable declarations
            r'#\s*\w+',  # CSS ID selectors or Python comments
            r'\.\w+\s*\{',  # CSS class selectors
            r'@media|@import|@font-face'  # CSS at-rules
        ]
        return any(re.search(pattern, content) for pattern in code_patterns)
    def _is_likely_markdown(self, content: str) -> bool:
        """Check if the content is likely markdown."""
        md_patterns = [
            r'^#\s+.+$',  # Headers
            r'^\*\s+.+$',  # Unordered lists
            r'^\d+\.\s+.+$',  # Ordered lists
            r'\[.+\]\(.+\)',  # Links
            r'!\[.+\]\(.+\)'  # Images
        ]
        return any(re.search(pattern, content, re.MULTILINE) for pattern in md_patterns)
    def _is_likely_json(self, content: str) -> bool:
        """Check if the content is likely JSON."""
        try:
            content = content.strip()
            if (content.startswith('{') and content.endswith('}')) or (
                    content.startswith('[') and content.endswith(']')):
                json.loads(content)
                return True
        except:
            pass
        return False
    def _sanitize_filename(self, name: str) -> str:
        """
        Sanitize a string to be used as a filename.
        :param name: The string to sanitize.
        :return: A sanitized filename.
        """
        # Replace spaces with underscores
        name = name.replace(' ', '_')
        # Remove invalid characters
        name = re.sub(r'[^\w\-\.]', '', name)
        # Limit length
        if len(name) > 50:
            name = name[:50]
        return name.lower()
    def _process_file_path(self, file_path: str) -> Tuple[str, str]:
        """
        Process a file path to extract the file name and type, and create directories if needed.
        :param file_path: The file path to process
        :return: Tuple of (file_name, file_type)
        """
        # Get the file name and extension
        file_name = os.path.basename(file_path)
        file_type = os.path.splitext(file_name)[1].lstrip('.')
        return os.path.splitext(file_name)[0], file_type
--- a/agent/tools/ls/ls.py
+++ b/agent/tools/ls/ls.py
@@ -23,7 +23,7 @@ class Ls(BaseTool):
        "properties": {
            "path": {
                "type": "string",
-                "description": "Directory to list (default: current directory)"
+                "description": "Directory to list. IMPORTANT: Relative paths are based on workspace directory. To access directories outside workspace, use absolute paths starting with ~ or /."
            },
            "limit": {
                "type": "integer",
@@ -51,6 +51,13 @@ class Ls(BaseTool):
        absolute_path = self._resolve_path(path)
        if not os.path.exists(absolute_path):
            # Provide helpful hint if using relative path
            if not os.path.isabs(path) and not path.startswith('~'):
                return ToolResult.fail(
                    f"Error: Path not found: {path}\n"
                    f"Resolved to: {absolute_path}\n"
                    f"Hint: Relative paths are based on workspace ({self.cwd}). For files outside workspace, use absolute paths."
                )
            return ToolResult.fail(f"Error: Path not found: {path}")
        if not os.path.isdir(absolute_path):
--- a/agent/tools/read/read.py
+++ b/agent/tools/read/read.py
@@ -22,7 +22,7 @@ class Read(BaseTool):
        "properties": {
            "path": {
                "type": "string",
-                "description": "Path to the file to read (relative or absolute)"
+                "description": "Path to the file to read. IMPORTANT: Relative paths are based on workspace directory. To access files outside workspace, use absolute paths starting with ~ or /."
            },
            "offset": {
                "type": "integer",
@@ -63,6 +63,13 @@ class Read(BaseTool):
        # Check if file exists
        if not os.path.exists(absolute_path):
            # Provide helpful hint if using relative path
            if not os.path.isabs(path) and not path.startswith('~'):
                return ToolResult.fail(
                    f"Error: File not found: {path}\n"
                    f"Resolved to: {absolute_path}\n"
                    f"Hint: Relative paths are based on workspace ({self.cwd}). For files outside workspace, use absolute paths."
                )
            return ToolResult.fail(f"Error: File not found: {path}")
        # Check if readable
--- a/agent/tools/web_fetch/web_fetch.py
+++ b/agent/tools/web_fetch/web_fetch.py
@@ -46,7 +46,7 @@ class WebFetch(BaseTool):
    def __init__(self, config: dict = None):
        self.config = config or {}
-        self.timeout = self.config.get("timeout", 30)
+        self.timeout = self.config.get("timeout", 20)
        self.max_redirects = self.config.get("max_redirects", 3)
        self.user_agent = self.config.get(
            "user_agent",
--- a/bot/gemini/google_gemini_bot.py
+++ b/bot/gemini/google_gemini_bot.py
@@ -245,8 +245,7 @@ class GoogleGeminiBot(Bot):
            gen_config = {}
            if kwargs.get("temperature") is not None:
                gen_config["temperature"] = kwargs["temperature"]
-            if kwargs.get("max_tokens"):
+
                gen_config["maxOutputTokens"] = kwargs["max_tokens"]
            if gen_config:
                payload["generationConfig"] = gen_config
@@ -255,7 +254,7 @@ class GoogleGeminiBot(Bot):
                gemini_tools = self._convert_tools_to_gemini_rest_format(tools)
                if gemini_tools:
                    payload["tools"] = gemini_tools
-                    logger.info(f"[Gemini] Added {len(tools)} tools to request")
+                    logger.debug(f"[Gemini] Added {len(tools)} tools to request")
            # Make REST API call
            base_url = f"{self.api_base}/v1beta"
@@ -445,6 +444,9 @@ class GoogleGeminiBot(Bot):
            all_tool_calls = []
            has_sent_tool_calls = False
            has_content = False  # Track if any content was sent
            chunk_count = 0
            last_finish_reason = None
            last_safety_ratings = None
            for line in response.iter_lines():
                if not line:
@@ -461,6 +463,7 @@ class GoogleGeminiBot(Bot):
                try:
                    chunk_data = json.loads(line)
                    chunk_count += 1
                    logger.debug(f"[Gemini] Stream chunk: {json.dumps(chunk_data, ensure_ascii=False)[:200]}")
                    candidates = chunk_data.get("candidates", [])
@@ -469,6 +472,13 @@ class GoogleGeminiBot(Bot):
                        continue
                    candidate = candidates[0]
                    # 记录 finish_reason 和 safety_ratings
                    if "finishReason" in candidate:
                        last_finish_reason = candidate["finishReason"]
                    if "safetyRatings" in candidate:
                        last_safety_ratings = candidate["safetyRatings"]
                    content = candidate.get("content", {})
                    parts = content.get("parts", [])
@@ -512,7 +522,7 @@ class GoogleGeminiBot(Bot):
            # Send tool calls if any were collected
            if all_tool_calls and not has_sent_tool_calls:
-                logger.info(f"[Gemini] Stream detected {len(all_tool_calls)} tool calls")
+                logger.debug(f"[Gemini] Stream detected {len(all_tool_calls)} tool calls")
                yield {
                    "id": f"chatcmpl-{time.time()}",
                    "object": "chat.completion.chunk",
@@ -526,8 +536,17 @@ class GoogleGeminiBot(Bot):
                }
                has_sent_tool_calls = True
-            # Log summary
+            # Log summary (only if there's something interesting)
-            logger.info(f"[Gemini] Stream complete: has_content={has_content}, tool_calls={len(all_tool_calls)}")
+            if not has_content and not all_tool_calls:
                logger.debug(f"[Gemini] Stream complete: has_content={has_content}, tool_calls={len(all_tool_calls)}")
            elif all_tool_calls:
                logger.debug(f"[Gemini] Stream complete: {len(all_tool_calls)} tool calls")
            else:
                logger.debug(f"[Gemini] Stream complete: text response")
            # 如果返回空响应，记录详细警告
            if not has_content and not all_tool_calls:
                logger.warning(f"[Gemini] ⚠️  Empty response detected!")
            # Final chunk
            yield {
--- a/bot/linkai/link_ai_bot.py
+++ b/bot/linkai/link_ai_bot.py
@@ -4,6 +4,7 @@
 import re
 import time
 import requests
 import json
 import config
 from bot.bot import Bot
 from bot.openai_compatible_bot import OpenAICompatibleBot
@@ -463,7 +464,7 @@ class LinkAISessionManager(SessionManager):
            session.add_query(query)
        session.add_reply(reply)
        try:
-            max_tokens = conf().get("conversation_max_tokens", 2500)
+            max_tokens = conf().get("conversation_max_tokens", 8000)
            tokens_cnt = session.discard_exceeding(max_tokens, total_tokens)
            logger.debug(f"[LinkAI] chat history, before tokens={total_tokens}, now tokens={tokens_cnt}")
        except Exception as e:
@@ -504,6 +505,26 @@ def _linkai_call_with_tools(self, messages, tools=None, stream=False, **kwargs):
        Formatted response in OpenAI format or generator for streaming
    """
    try:
        # Convert messages from Claude format to OpenAI format
        # This is important because Agent uses Claude format internally
        messages = self._convert_messages_to_openai_format(messages)
        # Convert tools from Claude format to OpenAI format
        if tools:
            tools = self._convert_tools_to_openai_format(tools)
        # Handle system prompt (OpenAI uses system message, Claude uses separate parameter)
        system_prompt = kwargs.get('system')
        if system_prompt:
            # Add system message at the beginning if not already present
            if not messages or messages[0].get('role') != 'system':
                messages = [{"role": "system", "content": system_prompt}] + messages
            else:
                # Replace existing system message
                messages[0] = {"role": "system", "content": system_prompt}
        logger.debug(f"[LinkAI] messages: {len(messages)}, tools: {len(tools) if tools else 0}, stream: {stream}")
        # Build request parameters (LinkAI uses OpenAI-compatible format)
        body = {
            "messages": messages,
@@ -515,16 +536,6 @@ def _linkai_call_with_tools(self, messages, tools=None, stream=False, **kwargs):
            "stream": stream
        }
        # Add max_tokens if specified
        if kwargs.get("max_tokens"):
            body["max_tokens"] = kwargs["max_tokens"]
        # Add app_code if provided
        app_code = kwargs.get("app_code", conf().get("linkai_app_code"))
        if app_code:
            body["app_code"] = app_code
        # Add tools if provided (OpenAI-compatible format)
        if tools:
            body["tools"] = tools
            body["tool_choice"] = kwargs.get("tool_choice", "auto")
@@ -567,8 +578,8 @@ def _handle_linkai_sync_response(self, base_url, headers, body):
        if res.status_code == 200:
            response = res.json()
-            logger.info(f"[LinkAI] call_with_tools reply, model={response.get('model')}, "
+            logger.debug(f"[LinkAI] reply: model={response.get('model')}, "
-                       f"total_tokens={response.get('usage', {}).get('total_tokens', 0)}")
+                        f"tokens={response.get('usage', {}).get('total_tokens', 0)}")
            # LinkAI response is already in OpenAI-compatible format
            return response
--- a/bridge/agent_bridge.py
+++ b/bridge/agent_bridge.py
@@ -66,14 +66,22 @@ class AgentLLMModel(LLMModel):
        self.bridge = bridge
        self.bot_type = bot_type
        self._bot = None
        self._use_linkai = conf().get("use_linkai", False) and conf().get("linkai_api_key")
    @property
    def bot(self):
        """Lazy load the bot and enhance it with tool calling if needed"""
        if self._bot is None:
-            self._bot = self.bridge.get_bot(self.bot_type)
+            # If use_linkai is enabled, use LinkAI bot directly
-            # Automatically add tool calling support if not present
+            if self._use_linkai:
-            self._bot = add_openai_compatible_support(self._bot)
+                self._bot = self.bridge.find_chat_bot(const.LINKAI)
            else:
                self._bot = self.bridge.get_bot(self.bot_type)
                # Automatically add tool calling support if not present
                self._bot = add_openai_compatible_support(self._bot)
            # Log bot info
            bot_name = type(self._bot).__name__
        return self._bot
    def call(self, request: LLMRequest):
@@ -88,11 +96,18 @@ class AgentLLMModel(LLMModel):
                kwargs = {
                    'messages': request.messages,
                    'tools': getattr(request, 'tools', None),
-                    'stream': False
+                    'stream': False,
                    'model': self.model  # Pass model parameter
                }
                # Only pass max_tokens if it's explicitly set
                if request.max_tokens is not None:
                    kwargs['max_tokens'] = request.max_tokens
                # Extract system prompt if present
                system_prompt = getattr(request, 'system', None)
                if system_prompt:
                    kwargs['system'] = system_prompt
                response = self.bot.call_with_tools(**kwargs)
                return self._format_response(response)
            else:
@@ -122,7 +137,8 @@ class AgentLLMModel(LLMModel):
                    'messages': request.messages,
                    'tools': getattr(request, 'tools', None),
                    'stream': True,
-                    'max_tokens': max_tokens
+                    'max_tokens': max_tokens,
                    'model': self.model  # Pass model parameter
                }
                # Add system prompt if present
@@ -155,13 +171,15 @@ class AgentLLMModel(LLMModel):
 class AgentBridge:
    """
-    Bridge class that integrates single super Agent with COW
+    Bridge class that integrates super Agent with COW
    Manages multiple agent instances per session for conversation isolation
    """
    def __init__(self, bridge: Bridge):
        """
        Set up an empty agent registry on top of the given bridge

        Args:
            bridge: Bridge instance, stored on self.bridge
        """
        self.bridge = bridge
        self.agents = {}  # session_id -> Agent instance mapping
        self.default_agent = None  # For backward compatibility (no session_id)
        # NOTE(review): presumably the legacy single-agent slot; the per-session
        # paths work with `agents` / `default_agent` - confirm it is still needed
        self.agent: Optional[Agent] = None
    def create_agent(self, system_prompt: str, tools: List = None, **kwargs) -> Agent:
        """
        Create the super agent with COW integration
@@ -193,8 +211,8 @@ class AgentBridge:
                except Exception as e:
                    logger.warning(f"[AgentBridge] Failed to load tool {tool_name}: {e}")
-        # Create the single super agent
+        # Create agent instance
-        self.agent = Agent(
+        agent = Agent(
            system_prompt=system_prompt,
            description=kwargs.get("description", "AI Super Agent"),
            model=model,
@@ -209,21 +227,38 @@ class AgentBridge:
        )
        # Log skill loading details
-        if self.agent.skill_manager:
+        if agent.skill_manager:
            logger.info(f"[AgentBridge] SkillManager initialized:")
-            logger.info(f"[AgentBridge]   - Managed dir: {self.agent.skill_manager.managed_skills_dir}")
+            logger.info(f"[AgentBridge]   - Managed dir: {agent.skill_manager.managed_skills_dir}")
-            logger.info(f"[AgentBridge]   - Workspace dir: {self.agent.skill_manager.workspace_dir}")
+            logger.info(f"[AgentBridge]   - Workspace dir: {agent.skill_manager.workspace_dir}")
-            logger.info(f"[AgentBridge]   - Total skills: {len(self.agent.skill_manager.skills)}")
+            logger.info(f"[AgentBridge]   - Total skills: {len(agent.skill_manager.skills)}")
-            for skill_name in self.agent.skill_manager.skills.keys():
+            for skill_name in agent.skill_manager.skills.keys():
                logger.info(f"[AgentBridge]     * {skill_name}")
-        return self.agent
+        return agent
-    def get_agent(self) -> Optional[Agent]:
+    def get_agent(self, session_id: str = None) -> Optional[Agent]:
-        """Get the super agent, create if not exists"""
+        """
-        if self.agent is None:
+        Get agent instance for the given session
-            self._init_default_agent()
+        
-        return self.agent
+        Args:
            session_id: Session identifier (e.g., user_id). If None, returns default agent.
        Returns:
            Agent instance for this session
        """
        # If no session_id, use default agent (backward compatibility)
        if session_id is None:
            if self.default_agent is None:
                self._init_default_agent()
            return self.default_agent
        # Check if agent exists for this session
        if session_id not in self.agents:
            logger.info(f"[AgentBridge] Creating new agent for session: {session_id}")
            self._init_agent_for_session(session_id)
        return self.agents[session_id]
    def _init_default_agent(self):
        """Initialize default super agent with new prompt system"""
@@ -291,6 +326,12 @@ class AgentBridge:
                        tool.cwd = file_config.get("cwd", tool.cwd if hasattr(tool, 'cwd') else None)
                        if 'memory_manager' in file_config:
                            tool.memory_manager = file_config['memory_manager']
                    # Apply API key for bocha_search tool
                    elif tool_name == 'bocha_search':
                        bocha_api_key = conf().get("bocha_api_key", "")
                        if bocha_api_key:
                            tool.config = {"bocha_api_key": bocha_api_key}
                            tool.api_key = bocha_api_key
                    tools.append(tool)
                    logger.debug(f"[AgentBridge] Loaded tool: {tool_name}")
            except Exception as e:
@@ -307,6 +348,12 @@ class AgentBridge:
        context_files = load_context_files(workspace_root)
        logger.info(f"[AgentBridge] Loaded {len(context_files)} context files: {[f.path for f in context_files]}")
        # Check if this is the first conversation
        from agent.prompt.workspace import is_first_conversation, mark_conversation_started
        is_first = is_first_conversation(workspace_root)
        if is_first:
            logger.info("[AgentBridge] First conversation detected")
        # Build system prompt using new prompt builder
        prompt_builder = PromptBuilder(
            workspace_dir=workspace_root,
@@ -317,16 +364,21 @@ class AgentBridge:
        runtime_info = {
            "model": conf().get("model", "unknown"),
            "workspace": workspace_root,
-            "channel": "web"  # TODO: get from actual channel, default to "web" to hide if not specified
+            "channel": conf().get("channel_type", "unknown")  # Get from config
        }
        system_prompt = prompt_builder.build(
            tools=tools,
            context_files=context_files,
            memory_manager=memory_manager,
-            runtime_info=runtime_info
+            runtime_info=runtime_info,
            is_first_conversation=is_first
        )
        # Mark conversation as started (will be saved after first user message)
        if is_first:
            mark_conversation_started(workspace_root)
        logger.info("[AgentBridge] System prompt built successfully")
        # Create agent with configured tools and workspace
@@ -344,6 +396,127 @@ class AgentBridge:
            agent.memory_manager = memory_manager
            logger.info(f"[AgentBridge] Memory manager attached to agent")
        # Store as default agent
        self.default_agent = agent
    def _init_agent_for_session(self, session_id: str):
        """
        Build a dedicated agent for one session and register it in self.agents

        Steps, in order: resolve and prepare the workspace, try to set up the
        memory system (failures are only logged), instantiate and configure
        every tool known to the ToolManager, build the system prompt, create
        the agent via create_agent() and store it under session_id.

        Args:
            session_id: Key under which the new agent is stored in self.agents
        """
        from config import conf
        import os

        # Workspace path comes from config; "~" is expanded to the home directory
        ws_root = os.path.expanduser(conf().get("agent_workspace", "~/cow"))

        from agent.prompt import ensure_workspace, load_context_files, PromptBuilder
        # Prepare the workspace, asking for template files to be created
        ensure_workspace(ws_root, create_templates=True)

        # Memory is best effort: any error below is logged at debug level and
        # setup continues with whatever was assigned before the failure
        mem_mgr = None
        mem_tools = []
        try:
            from agent.memory import MemoryManager, MemoryConfig
            from agent.tools import MemorySearchTool, MemoryGetTool
            mem_mgr = MemoryManager(
                MemoryConfig(
                    workspace_root=ws_root,
                    embedding_provider="local",
                    embedding_model="all-MiniLM-L6-v2",
                )
            )
            search_tool = MemorySearchTool(mem_mgr)
            get_tool = MemoryGetTool(mem_mgr)
            mem_tools = [search_tool, get_tool]
        except Exception as err:
            logger.debug(f"[AgentBridge] Memory system not available for session {session_id}: {err}")

        from agent.tools import ToolManager
        registry = ToolManager()
        registry.load_tools()

        # Config object shared by the file/shell tools; the memory manager is
        # only included when one was created above
        fs_config = {"cwd": ws_root}
        if mem_mgr:
            fs_config["memory_manager"] = mem_mgr

        fs_tool_names = ('read', 'write', 'edit', 'bash', 'grep', 'find', 'ls')
        session_tools = []
        for tool_name in registry.tool_classes.keys():
            try:
                tool = registry.create_tool(tool_name)
                if not tool:
                    continue
                if tool_name in fs_tool_names:
                    tool.config = fs_config
                    tool.cwd = fs_config.get("cwd", tool.cwd if hasattr(tool, 'cwd') else None)
                    if 'memory_manager' in fs_config:
                        tool.memory_manager = fs_config['memory_manager']
                elif tool_name == 'bocha_search':
                    # The search tool only gets configured when an API key is set
                    api_key = conf().get("bocha_api_key", "")
                    if api_key:
                        tool.config = {"bocha_api_key": api_key}
                        tool.api_key = api_key
                session_tools.append(tool)
            except Exception as err:
                # One broken tool must not prevent the others from loading
                logger.warning(f"[AgentBridge] Failed to load tool {tool_name} for session {session_id}: {err}")

        # Memory tools (possibly none) go after the regular tools
        session_tools.extend(mem_tools)

        context_files = load_context_files(ws_root)

        from agent.prompt.workspace import is_first_conversation, mark_conversation_started
        first_time = is_first_conversation(ws_root)

        builder = PromptBuilder(workspace_dir=ws_root, language="zh")
        runtime = {
            "model": conf().get("model", "unknown"),
            "workspace": ws_root,
            "channel": conf().get("channel_type", "unknown"),
        }
        system_prompt = builder.build(
            tools=session_tools,
            context_files=context_files,
            memory_manager=mem_mgr,
            runtime_info=runtime,
            is_first_conversation=first_time,
        )

        # The first-conversation marker is written right after the prompt is built
        if first_time:
            mark_conversation_started(ws_root)

        session_agent = self.create_agent(
            system_prompt=system_prompt,
            tools=session_tools,
            max_steps=50,
            output_mode="logger",
            workspace_dir=ws_root,
            enable_skills=True,
        )
        if mem_mgr:
            session_agent.memory_manager = mem_mgr

        self.agents[session_id] = session_agent
        logger.info(f"[AgentBridge] Agent created for session: {session_id}")
    def agent_reply(self, query: str, context: Context = None, 
                   on_event=None, clear_history: bool = False) -> Reply:
        """
@@ -351,7 +524,7 @@ class AgentBridge:
        Args:
            query: User query
-            context: COW context (optional)
+            context: COW context (optional, contains session_id for user isolation)
            on_event: Event callback (optional)
            clear_history: Whether to clear conversation history
@@ -359,8 +532,13 @@ class AgentBridge:
            Reply object
        """
        try:
-            # Get agent (will auto-initialize if needed)
+            # Extract session_id from context for user isolation
-            agent = self.get_agent()
+            session_id = None
            if context:
                session_id = context.kwargs.get("session_id") or context.get("session_id")
            # Get agent for this session (will auto-initialize if needed)
            agent = self.get_agent(session_id=session_id)
            if not agent:
                return Reply(ReplyType.ERROR, "Failed to initialize super agent")
@@ -376,3 +554,20 @@ class AgentBridge:
        except Exception as e:
            logger.error(f"Agent reply error: {e}")
            return Reply(ReplyType.ERROR, f"Agent error: {str(e)}")
    def clear_session(self, session_id: str):
        """
        Forget the agent stored for a single session

        Unknown session ids are ignored without logging.

        Args:
            session_id: Identifier of the session whose agent is removed
        """
        if session_id not in self.agents:
            return
        logger.info(f"[AgentBridge] Clearing session: {session_id}")
        del self.agents[session_id]
    def clear_all_sessions(self):
        """Remove every per-session agent and reset the default agent"""
        # Take the count before emptying the mapping so the log shows how many were dropped
        session_count = len(self.agents)
        logger.info(f"[AgentBridge] Clearing all sessions ({session_count} total)")
        self.agents.clear()
        self.default_agent = None
--- a/channel/channel.py
+++ b/channel/channel.py
@@ -47,6 +47,10 @@ class Channel(object):
            try:
                logger.info("[Channel] Using agent mode")
                # Add channel_type to context if not present
                if context and "channel_type" not in context:
                    context["channel_type"] = self.channel_type
                # Use agent bridge to handle the query
                return Bridge().fetch_agent_reply(
                    query=query,
--- a/channel/web/web_channel.py
+++ b/channel/web/web_channel.py
@@ -49,8 +49,6 @@ class WebChannel(ChatChannel):
        self.msg_id_counter = 0  # 添加消息ID计数器
        self.session_queues = {}  # 存储session_id到队列的映射
        self.request_to_session = {}  # 存储request_id到session_id的映射
        # web channel无需前缀
        conf()["single_chat_prefix"] = [""]
    def _generate_msg_id(self):
@@ -122,18 +120,30 @@ class WebChannel(ChatChannel):
            if session_id not in self.session_queues:
                self.session_queues[session_id] = Queue()
            # Web channel 不需要前缀，确保消息能通过前缀检查
            trigger_prefixs = conf().get("single_chat_prefix", [""])
            if check_prefix(prompt, trigger_prefixs) is None:
                # 如果没有匹配到前缀，给消息加上第一个前缀
                if trigger_prefixs:
                    prompt = trigger_prefixs[0] + prompt
                    logger.debug(f"[WebChannel] Added prefix to message: {prompt}")
            # 创建消息对象
            msg = WebMessage(self._generate_msg_id(), prompt)
            msg.from_user_id = session_id  # 使用会话ID作为用户ID
-            # 创建上下文
+            # 创建上下文，明确指定 isgroup=False
-            context = self._compose_context(ContextType.TEXT, prompt, msg=msg)
+            context = self._compose_context(ContextType.TEXT, prompt, msg=msg, isgroup=False)
-            # 添加必要的字段
+            # 检查 context 是否为 None（可能被插件过滤等）
            if context is None:
                logger.warning(f"[WebChannel] Context is None for session {session_id}, message may be filtered")
                return json.dumps({"status": "error", "message": "Message was filtered"})
            # 覆盖必要的字段（_compose_context 会设置默认值，但我们需要使用实际的 session_id）
            context["session_id"] = session_id
            context["receiver"] = session_id
            context["request_id"] = request_id
            context["isgroup"] = False  # 添加 isgroup 字段
            context["receiver"] = session_id  # 添加 receiver 字段
            # 异步处理消息 - 只传递上下文
            threading.Thread(target=self.produce, args=(context,)).start()
--- a/config.py
+++ b/config.py
@@ -185,7 +185,8 @@ available_setting = {
    "Minimax_base_url": "",
    "web_port": 9899,
    "agent": False,  # 是否开启Agent模式
-    "agent_workspace": "~/cow"  # agent工作空间路径，用于存储skills、memory等
+    "agent_workspace": "~/cow",  # agent工作空间路径，用于存储skills、memory等
    "bocha_api_key": ""
 }
--- a/skills/skill-creator/SKILL.md
+++ b/skills/skill-creator/SKILL.md
@@ -68,10 +68,11 @@ skill-name/
 - Must test scripts before including
 **references/** - When to include:
- Documentation for agent to reference
+- **ONLY** when documentation is too large for SKILL.md (>500 lines)
- Database schemas, API docs, domain knowledge
+- Database schemas, complex API specs that agent needs to reference
 - Agent reads these files into context as needed
- For large files (>10k words), include grep patterns in SKILL.md
+- **NOT for**: API reference docs, usage examples, tutorials (put in SKILL.md instead)
 - **Rule of thumb**: If it fits in SKILL.md, don't create a separate reference file
 **assets/** - When to include:
 - Files used in output (not loaded to context)
@@ -82,11 +83,15 @@ skill-name/
 ### What NOT to Include
-Do NOT create auxiliary documentation:
+Do NOT create auxiliary documentation files:
- README.md
+- README.md - Instructions belong in SKILL.md
- INSTALLATION_GUIDE.md
+- INSTALLATION_GUIDE.md - Setup info belongs in SKILL.md
- CHANGELOG.md
+- CHANGELOG.md - Not needed for local skills
- Other non-essential files
+- API_REFERENCE.md - Put API docs directly in SKILL.md
 - USAGE_EXAMPLES.md - Put examples directly in SKILL.md
 - Any other documentation files - Everything goes in SKILL.md unless it's too large
 **Critical Rule**: Only create files that the agent will actually execute (scripts) or that are too large for SKILL.md (references). Documentation, examples, and guides ALL belong in SKILL.md.
 ## Skill Creation Process
@@ -133,22 +138,31 @@ To turn concrete examples into an effective skill, analyze each example by:
 1. Considering how to execute on the example from scratch
 2. Identifying what scripts, references, and assets would be helpful when executing these workflows repeatedly
 **Planning Checklist**:
 - ✅ **Always needed**: SKILL.md with clear description and usage instructions
 - ✅ **scripts/**: Only if code needs to be executed (not just shown as examples)
 - ❌ **references/**: Rarely needed - only if documentation is >500 lines and can't fit in SKILL.md
 - ✅ **assets/**: Only if files are used in output (templates, boilerplate, etc.)
 Example: When building a `pdf-editor` skill to handle queries like "Help me rotate this PDF," the analysis shows:
 1. Rotating a PDF requires re-writing the same code each time
 2. A `scripts/rotate_pdf.py` script would be helpful to store in the skill
 3. ❌ Don't create `references/api-docs.md` - put API info in SKILL.md instead
 Example: When designing a `frontend-webapp-builder` skill for queries like "Build me a todo app" or "Build me a dashboard to track my steps," the analysis shows:
 1. Writing a frontend webapp requires the same boilerplate HTML/React each time
 2. An `assets/hello-world/` template containing the boilerplate HTML/React project files would be helpful to store in the skill
 3. ❌ Don't create `references/usage-examples.md` - put examples in SKILL.md instead
 Example: When building a `big-query` skill to handle queries like "How many users have logged in today?" the analysis shows:
 1. Querying BigQuery requires re-discovering the table schemas and relationships each time
-2. A `references/schema.md` file documenting the table schemas would be helpful to store in the skill
+2. A `references/schema.md` file documenting the table schemas would be helpful to store in the skill (ONLY because schemas are very large)
 3. ❌ Don't create separate `references/query-examples.md` - put examples in SKILL.md instead
-To establish the skill's contents, analyze each concrete example to create a list of the reusable resources to include: scripts, references, and assets.
+To establish the skill's contents, analyze each concrete example to create a list of the reusable resources to include: scripts, references, and assets. **Default to putting everything in SKILL.md unless there's a compelling reason to separate it.**
 ### Step 3: Initialize the Skill
@@ -200,6 +214,12 @@ These files contain established best practices for effective skill design.
 To begin implementation, start with the reusable resources identified above: `scripts/`, `references/`, and `assets/` files. Note that this step may require user input. For example, when implementing a `brand-guidelines` skill, the user may need to provide brand assets or templates to store in `assets/`, or documentation to store in `references/`.
 **Important Guidelines**:
 - **scripts/**: Only create scripts that will be executed. Test all scripts before including.
 - **references/**: ONLY create if documentation is too large for SKILL.md (>500 lines). Most skills don't need this.
 - **assets/**: Only include files used in output (templates, icons, etc.)
 - **Default approach**: Put everything in SKILL.md unless there's a specific reason not to.
 Added scripts must be tested by actually running them to ensure there are no bugs and that the output matches what is expected. If there are many similar scripts, only a representative sample needs to be tested to ensure confidence that they all work while balancing time to completion.
 If you used `--examples`, delete any placeholder files that are not needed for the skill. Only create resource directories that are actually required.
		`@@ -1,3 +0,0 @@`
			`from .file_save import FileSave`

			`__all__ = ['FileSave']`