修改skill目录

This commit is contained in:
朱潮 2026-04-18 23:39:47 +08:00
commit 2911c67771
228 changed files with 1580 additions and 28 deletions

View File

@ -1,7 +1,8 @@
# Skill 功能
> 负责范围:技能包管理服务 - 核心实现
> 最后更新2026-04-16
> 最后更新2026-04-18
## 当前状态
@ -22,6 +23,10 @@ Skill 系统支持两种来源:官方 skills (`./skills/`) 和用户 skills (`
- 2026-04-16: 为 `auto-daily-summary` 和 `competitor-news-intel` 新增 Python CLI 脚本 MVP,统一采用 `argparse + JSON stdout` 模式
- 2026-04-16: 新增 6 个纯 `SKILL.md` 型业务 skill:`market-academic-insight`、`financial-report-generator`、`contract-document-generator`、`sales-decision-report`、`auto-daily-summary`、`competitor-news-intel`
- 2026-04-18: `create_robot_project` 改为自动加载 `skills/autoload/{SKILLS_SUBDIR}` 下所有 skill并跳过已显式传入的同名 skill
- 2026-04-18: `/api/v1/skill/list` 的官方库改为同时读取 `skills/common` 和 `skills/{SKILLS_SUBDIR}`,并按目录顺序去重
- 2026-04-18: `_extract_skills_to_robot` 改为通过环境变量 `SKILLS_SUBDIR` 选择官方 skills 子目录,默认使用 `skills/common`
- 2025-02-11: 初始化 skill 功能 memory
## Gotchas(开发必读)
@ -32,6 +37,9 @@ Skill 系统支持两种来源:官方 skills (`./skills/`) 和用户 skills (`
- ⚠️ `auto-daily-summary` 需要特别注意中文分句、action 边界截断、risk 窗口裁剪,否则容易把整句/整段吞进去
- ⚠️ `competitor-news-intel` 的 payload 校验应按命令拆分collect/analyze/run不要共用一套最小校验
- ⚠️ `competitor-news-intel``collect/run` 依赖 `BAIDU_API_KEY`;无该环境变量时应返回稳定错误 JSON不要静默降级
- ⚠️ `_extract_skills_to_robot` 只会从 `skills/{SKILLS_SUBDIR}` 读取官方 skills默认是 `common`
- ⚠️ 执行脚本必须使用绝对路径
- ⚠️ MCP 配置优先级Skill MCP > 默认 MCP > 用户参数
- ⚠️ 上传大小限制50MBZIP解压后最大 500MB

View File

@ -10,7 +10,7 @@ from typing import List, Optional
from dataclasses import dataclass
from fastapi import APIRouter, HTTPException, Query, UploadFile, File, Form
from pydantic import BaseModel
from utils.settings import SKILLS_DIR
from utils.settings import SKILLS_DIR, SKILLS_SUBDIR
import aiofiles
logger = logging.getLogger('app')
@ -427,27 +427,39 @@ def get_official_skills(base_dir: str) -> List[SkillItem]:
List of SkillItem objects
"""
skills = []
skill_names = set()
# Use SKILLS_DIR from settings, relative to base_dir
if os.path.isabs(SKILLS_DIR):
official_skills_dir = SKILLS_DIR
skills_root_dir = SKILLS_DIR
else:
official_skills_dir = os.path.join(base_dir, SKILLS_DIR)
skills_root_dir = os.path.join(base_dir, SKILLS_DIR)
if not os.path.exists(official_skills_dir):
logger.warning(f"Official skills directory not found: {official_skills_dir}")
return skills
official_skills_dirs = [
os.path.join(skills_root_dir, "common"),
os.path.join(skills_root_dir, SKILLS_SUBDIR),
]
for skill_name in os.listdir(official_skills_dir):
skill_path = os.path.join(official_skills_dir, skill_name)
if os.path.isdir(skill_path):
metadata = get_skill_metadata_legacy(skill_path)
if metadata:
skills.append(SkillItem(
name=metadata['name'],
description=metadata['description'],
user_skill=False
))
logger.debug(f"Found official skill: {metadata['name']}")
for official_skills_dir in official_skills_dirs:
if not os.path.exists(official_skills_dir):
logger.warning(f"Official skills directory not found: {official_skills_dir}")
continue
for skill_name in os.listdir(official_skills_dir):
if skill_name in skill_names:
continue
skill_path = os.path.join(official_skills_dir, skill_name)
if os.path.isdir(skill_path):
metadata = get_skill_metadata_legacy(skill_path)
if metadata:
skills.append(SkillItem(
name=metadata['name'],
description=metadata['description'],
user_skill=False
))
skill_names.add(skill_name)
logger.debug(f"Found official skill: {metadata['name']} from {official_skills_dir}")
return skills
@ -498,7 +510,7 @@ async def list_skills(
SkillListResponse containing all skills
Notes:
- Official skills are read from the /skills directory
- Official skills are read from /skills/common and /skills/{SKILLS_SUBDIR}
- User skills are read from /projects/uploads/{bot_id}/skills directory
- User skills are marked with user_skill: true
"""

View File

@ -0,0 +1,22 @@
{
"name": "rag-retrieve",
"description": "Provides RAG and table RAG retrieval tools through a PrePrompt hook and MCP server.",
"hooks": {
"PrePrompt": [
{
"type": "command",
"command": "python hooks/pre_prompt.py"
}
]
},
"mcpServers": {
"rag_retrieve": {
"transport": "stdio",
"command": "python",
"args": [
"./rag_retrieve_server.py",
"{bot_id}"
]
}
}
}

View File

@ -0,0 +1,99 @@
# RAG Retrieve
An example autoload skill that demonstrates how to integrate `rag-retrieve` and `table-rag-retrieve` through Claude Plugins hooks and an MCP server.
## Overview
This skill uses a `PrePrompt` hook to inject retrieval guidance into the prompt, and starts an MCP server that exposes retrieval capabilities for the current bot.
### PrePrompt Hook
Runs when the system prompt is loaded and injects retrieval policy content.
- File: `hooks/pre_prompt.py`
- Purpose: load retrieval instructions and add them to the prompt context
### MCP Server
Provides retrieval tools over stdio for the current `bot_id`.
- File: `rag_retrieve_server.py`
- Purpose: expose `rag-retrieve` and related retrieval tools to the agent
## Directory Structure
```text
rag-retrieve/
├── README.md # Skill documentation
├── .claude-plugin/
│ └── plugin.json # Hook and MCP server configuration
├── hooks/
│ ├── pre_prompt.py # PrePrompt hook script
│ └── retrieval-policy.md # Retrieval policy injected into the prompt
├── mcp_common.py # Shared MCP utilities
├── rag_retrieve_server.py # MCP server entrypoint
└── rag_retrieve_tools.json # Tool definitions
```
## `plugin.json` Format
```json
{
"name": "rag-retrieve",
"description": "rag-retrieve and table-rag-retrieve",
"hooks": {
"PrePrompt": [
{
"type": "command",
"command": "python hooks/pre_prompt.py"
}
]
},
"mcpServers": {
"rag_retrieve": {
"transport": "stdio",
"command": "python",
"args": [
"./skills_autoload/rag-retrieve/rag_retrieve_server.py",
"{bot_id}"
]
}
}
}
```
## Hook Script Behavior
The hook script runs as a subprocess, receives input through environment variables, and writes the injected content to stdout.
### Available Environment Variables
| Environment Variable | Description | Applies To |
|----------------------|-------------|------------|
| `ASSISTANT_ID` | Bot ID | All hooks |
| `USER_IDENTIFIER` | User identifier | All hooks |
| `SESSION_ID` | Session ID | All hooks |
| `LANGUAGE` | Language code | All hooks |
| `HOOK_TYPE` | Hook type | All hooks |
### PrePrompt Example
```python
#!/usr/bin/env python3
import os
import sys
def main():
user_identifier = os.environ.get('USER_IDENTIFIER', '')
bot_id = os.environ.get('ASSISTANT_ID', '')
print(f"## Retrieval Context\n\nUser: {user_identifier}\nBot: {bot_id}")
return 0
if __name__ == '__main__':
sys.exit(main())
```
## Example Use Cases
1. **Prompt-time retrieval guidance**: inject retrieval rules before the model starts reasoning
2. **Bot-specific retrieval setup**: start the MCP server with the current `bot_id`
3. **Unified retrieval access**: expose RAG and table RAG tools through a single skill

View File

@ -0,0 +1,55 @@
# Retrieval Policy
### 1. Retrieval Order and Tool Selection
- Follow this section for source choice, tool choice, query rewrite, `top_k`, fallback, result handling, and citations.
- Use this default retrieval order and execute it sequentially: skill-enabled knowledge retrieval tools > `rag_retrieve` / `table_rag_retrieve`.
- Do NOT answer from model knowledge first.
- Do NOT bypass the retrieval flow and inspect local filesystem documents on your own.
- Do NOT use local filesystem retrieval as a fallback knowledge source.
- Local filesystem documents are not a recommended retrieval source here because file formats are inconsistent and have not been normalized or parsed for reliable knowledge lookup.
- Knowledge must be retrieved through the supported knowledge tools only: skill-enabled retrieval scripts, `table_rag_retrieve`, and `rag_retrieve`.
- When a suitable skill-enabled knowledge retrieval tool is available, use it first.
- If no suitable skill-enabled retrieval tool is available, or if its result is insufficient, continue with `rag_retrieve` or `table_rag_retrieve`.
- Use `table_rag_retrieve` first for values, prices, quantities, inventory, specifications, rankings, comparisons, summaries, extraction, lists, tables, name lookup, historical coverage, mixed questions, and unclear cases.
- Use `rag_retrieve` first only for clearly pure concept, definition, workflow, policy, or explanation questions without structured data needs.
- After each retrieval step, evaluate sufficiency before moving to the next source. Do NOT run these retrieval sources in parallel.
### 2. Query Preparation
- Do NOT pass the raw user question unless it already works well for retrieval.
- Rewrite for recall: extract entity, time scope, attributes, and intent.
- Add useful variants: synonyms, aliases, abbreviations, related titles, historical names, and category terms.
- Expand list-style, extraction, overview, historical, roster, timeline, and archive queries more aggressively.
- Preserve meaning. Do NOT introduce unrelated topics.
### 3. Retrieval Breadth (`top_k`)
- Apply `top_k` only to `rag_retrieve`. Use the smallest sufficient value, then expand only if coverage is insufficient.
- Use `30` for simple fact lookup.
- Use `50` for moderate synthesis, comparison, summarization, or disambiguation.
- Use `100` for broad recall, such as comprehensive analysis, scattered knowledge, multiple entities or periods, or list / catalog / timeline / roster / overview requests.
- Raise `top_k` when keyword branches are many or results are too few, repetitive, incomplete, sparse, or too narrow.
- Use this expansion order: `30 -> 50 -> 100`. If unsure, use `100`.
### 4. Result Evaluation
- Treat results as insufficient if they are empty, start with `Error:`, say `no excel files found`, are off-topic, miss the core entity or scope, or provide no usable evidence.
- Also treat results as insufficient when they cover only part of the request, or when full-list, historical, comparison, or mixed data + explanation requests return only partial or truncated coverage.
### 5. Fallback and Sequential Retry
- If the first retrieval result is insufficient, call the next supported retrieval source in the default order before replying.
- `table_rag_retrieve` now performs an internal fallback to `rag_retrieve` when it returns `no excel files found`, but this does NOT change the higher-level retrieval order.
- If `table_rag_retrieve` is insufficient or empty, continue with `rag_retrieve`.
- If `rag_retrieve` is insufficient or empty, continue with `table_rag_retrieve`.
- Say no relevant information was found only after all applicable skill-enabled retrieval tools, `rag_retrieve`, and `table_rag_retrieve` have been tried and still do not provide enough evidence.
- Do NOT reply that no relevant information was found before the supported knowledge retrieval flow has been exhausted.
### 6. Table RAG Result Handling
- Follow all `[INSTRUCTION]` and `[EXTRA_INSTRUCTION]` content in `table_rag_retrieve` results.
- If results are truncated, explicitly tell the user total matches (`N+M`), displayed count (`N`), and omitted count (`M`).
- Cite data sources using filenames from `file_ref_table`.
### 7. Citation Requirements for Retrieved Knowledge
- When using knowledge from `rag_retrieve` or `table_rag_retrieve`, you MUST generate `<CITATION ... />` tags.
- Follow the citation format returned by each tool.
- Place citations immediately after the paragraph or bullet list that uses the knowledge.
- Do NOT collect citations at the end.
- Use 1-2 citations per paragraph or bullet list when possible.
- If learned knowledge is used, include at least 1 `<CITATION ... />`.

View File

@ -0,0 +1,80 @@
# Retrieval Policy
## 0. Task Classification
Classify the request before acting:
- **Knowledge retrieval** (facts, summaries, comparisons, prices, lists, timelines, extraction, etc.): follow this policy strictly.
- **Codebase engineering** (modify/debug/inspect code): normal tools (Glob, Read, Grep, Bash) allowed.
- **Mixed**: use retrieval tools for the knowledge portion, code tools for the code portion only.
- **Uncertain**: default to knowledge retrieval.
## 1. Critical Enforcement
For knowledge retrieval tasks, **this policy overrides generic codebase exploration behavior**.
- **Prohibited tools**: `Glob`, `Read`, `LS`, Bash (`ls`, `find`, `cat`, `head`, `tail`, `grep`, etc.) — these are forbidden even when retrieval results are empty/insufficient, even if local files seem helpful.
- **Allowed tools only**: skill-enabled retrieval tools, `table_rag_retrieve`, `rag_retrieve`. No other source for factual answering.
- Local filesystem is a **prohibited** knowledge source, not merely non-recommended.
- Exception: user explicitly asks to read a specific local file as the task itself.
## 2. Retrieval Order and Tool Selection
Execute **sequentially, one at a time**. Do NOT run in parallel. Do NOT probe filesystem first.
1. **Skill-enabled retrieval tools** (use first when available)
2. **`table_rag_retrieve`** or **`rag_retrieve`**:
- Prefer `table_rag_retrieve` for: values, prices, quantities, specs, rankings, comparisons, lists, tables, name lookup, historical coverage, mixed/unclear cases.
- Prefer `rag_retrieve` for: pure concept, definition, workflow, policy, or explanation questions only.
- Do NOT answer from model knowledge first.
- After each step, evaluate sufficiency before proceeding.
## 3. Query Preparation
- Do NOT pass raw user question unless it already works well for retrieval.
- Rewrite for recall: extract entity, time scope, attributes, intent. Add synonyms, aliases, abbreviations, historical names, category terms.
- Expand list/extraction/overview/timeline queries more aggressively. Preserve meaning.
## 4. Retrieval Breadth (`top_k`)
- Apply `top_k` only to `rag_retrieve`. Use smallest sufficient value, expand if insufficient.
- `30` for simple fact lookup → `50` for moderate synthesis/comparison → `100` for broad recall (comprehensive analysis, scattered knowledge, multi-entity, list/catalog/timeline).
- Expansion order: `30 → 50 → 100`. If unsure, use `100`.
## 5. Result Evaluation
Treat as insufficient if: empty, `Error:`, `no excel files found`, off-topic, missing core entity/scope, no usable evidence, partial coverage, or truncated results.
## 6. Fallback and Sequential Retry
On insufficient results, follow this sequence:
1. Rewrite query, retry same tool (once)
2. Switch to next retrieval source in default order
3. For `rag_retrieve`, expand `top_k`: `30 → 50 → 100`
4. `table_rag_retrieve` insufficient → try `rag_retrieve`; `rag_retrieve` insufficient → try `table_rag_retrieve`
- `table_rag_retrieve` internally falls back to `rag_retrieve` on `no excel files found`, but this does NOT change the higher-level order.
- Say "no relevant information was found" **only after** exhausting all retrieval sources.
- Do NOT switch to local filesystem inspection at any point.
## 7. Table RAG Result Handling
- Follow all `[INSTRUCTION]` and `[EXTRA_INSTRUCTION]` in results.
- If truncated: tell user total (`N+M`), displayed (`N`), omitted (`M`).
- Cite sources using filenames from `file_ref_table`.
## 8. Citation Requirements
- MUST generate `<CITATION ... />` tags when using retrieval results.
- Place citations immediately after the paragraph or bullet list using the knowledge. Do NOT collect at end.
- 1-2 citations per paragraph/bullet. At least 1 citation when using retrieved knowledge.
## 9. Pre-Reply Self-Check
Before replying to a knowledge retrieval task, verify:
- Used only whitelisted retrieval tools — no local filesystem inspection?
- Exhausted retrieval flow before concluding "not found"?
- Citations placed immediately after each relevant paragraph?
If any answer is "no", correct the process first.

View File

@ -0,0 +1,351 @@
#!/usr/bin/env python3
"""
RAG retrieval MCP server.

Calls the local RAG backend API to perform document retrieval and exposes
the results as MCP tools (``rag_retrieve`` / ``table_rag_retrieve``) over
stdio for the current bot.
"""
import asyncio
import hashlib
import json
import re
import sys
import os
from typing import Any, Dict, List
# Fail fast when the third-party HTTP client is missing. The hint MUST go to
# stderr: this process speaks JSON-RPC over stdout (MCP stdio transport), so
# any non-JSON text printed to stdout would corrupt the protocol stream.
try:
    import requests
except ImportError:
    print("Error: requests module is required. Please install it with: pip install requests", file=sys.stderr)
    sys.exit(1)
from mcp_common import (
create_error_response,
create_success_response,
create_initialize_response,
create_ping_response,
create_tools_list_response,
load_tools_from_json,
handle_mcp_streaming
)
# Backend endpoint and shared secret used to derive per-bot auth tokens.
# NOTE(review): defaults point at the dev environment — confirm before prod use.
BACKEND_HOST: str = os.getenv("BACKEND_HOST", "https://api-dev.gptbase.ai")
MASTERKEY: str = os.getenv("MASTERKEY", "master")
# Citation instruction prefixes injected into tool results
# Prepended to document-retrieval results so the model emits <CITATION /> tags
# immediately after each paragraph that uses the retrieved knowledge.
DOCUMENT_CITATION_INSTRUCTIONS = """<CITATION_INSTRUCTIONS>
When using the retrieved knowledge below, you MUST add XML citation tags for factual claims.
## Document Knowledge
Format: `<CITATION file="file_uuid" filename="name.pdf" page=3 />`
- Use `file` attribute with the UUID from document markers
- Use `filename` attribute with the actual filename from document markers
- Use `page` attribute (singular) with the page number
- `page` MUST be 0-based and must match the `pages:` values shown in the learned knowledge context
## Web Page Knowledge
Format: `<CITATION url="https://example.com/page" />`
- Use `url` attribute with the web page URL from the source metadata
- Do not use `file`, `filename`, or `page` attributes for web sources
- If content is grounded in a web source, prefer a web citation with `url` over a file citation
## Placement Rules
- Citations MUST appear IMMEDIATELY AFTER the paragraph or bullet list that uses the knowledge
- NEVER collect all citations and place them at the end of your response
- Limit to 1-2 citations per paragraph/bullet list
- If your answer uses learned knowledge, you MUST generate at least 1 `<CITATION ... />` in the response
</CITATION_INSTRUCTIONS>
"""
# Prepended to table-retrieval results; table citations reference file/sheet/rows
# decoded from the internal `__src` markers (e.g. F1S2R5).
TABLE_CITATION_INSTRUCTIONS = """<CITATION_INSTRUCTIONS>
When using the retrieved table knowledge below, you MUST add XML citation tags for factual claims.
Format: `<CITATION file="file_id" filename="name.xlsx" sheet=1 rows=[2, 4] />`
- Parse `__src`: `F1S2R5` = file_ref F1, sheet 2, row 5
- Look up file_id in `file_ref_table`
- Combine same-sheet rows into one citation: `rows=[2, 4, 6]`
- MANDATORY: Create SEPARATE citation for EACH (file, sheet) combination
- NEVER put <CITATION> on the same line as a bullet point or table row
- Citations MUST be on separate lines AFTER the complete list/table
- NEVER include the `__src` column in your response - it is internal metadata only
- Citations MUST appear IMMEDIATELY AFTER the paragraph or bullet list that uses the knowledge
- NEVER collect all citations and place them at the end of your response
</CITATION_INSTRUCTIONS>
"""
def rag_retrieve(query: str, top_k: int = 100) -> Dict[str, Any]:
    """Call the backend RAG retrieval API and return an MCP tool result.

    Args:
        query: Retrieval query text.
        top_k: Number of top results to request from the backend.

    Returns:
        An MCP-style result dict: ``{"content": [{"type": "text", "text": ...}]}``.
        Failures are reported as text starting with ``"Error:"`` instead of
        raising, so the MCP layer always receives a well-formed tool result.
    """
    try:
        # bot_id is supplied as the first CLI argument (see plugin.json).
        bot_id = sys.argv[1] if len(sys.argv) > 1 else ""
        if not bot_id:
            # Bug fix: the original guarded `if not url:` AFTER building the
            # URL with an f-string, which can never be falsy. The meaningful
            # precondition is that a bot_id was passed on the command line.
            return {
                "content": [
                    {
                        "type": "text",
                        "text": "Error: bot_id not provided. Please provide bot_id as command line argument."
                    }
                ]
            }
        url = f"{BACKEND_HOST}/v1/rag_retrieve/{bot_id}"
        # Derive the auth token as md5("{masterkey}:{bot_id}"), matching the
        # backend's expected scheme.
        token_input = f"{MASTERKEY}:{bot_id}"
        auth_token = hashlib.md5(token_input.encode()).hexdigest()
        headers = {
            "content-type": "application/json",
            "authorization": f"Bearer {auth_token}"
        }
        data = {
            "query": query,
            "top_k": top_k
        }
        # Send the retrieval request.
        response = requests.post(url, json=data, headers=headers, timeout=30)
        if response.status_code != 200:
            return {
                "content": [
                    {
                        "type": "text",
                        "text": f"Error: RAG API returned status code {response.status_code}. Response: {response.text}"
                    }
                ]
            }
        # Parse the JSON response body.
        try:
            response_data = response.json()
        except json.JSONDecodeError as e:
            return {
                "content": [
                    {
                        "type": "text",
                        "text": f"Error: Failed to parse API response as JSON. Error: {str(e)}, Raw response: {response.text}"
                    }
                ]
            }
        # The backend returns the rendered knowledge in a "markdown" field;
        # prefix it with the citation instructions for the model.
        if "markdown" in response_data:
            markdown_content = response_data["markdown"]
            return {
                "content": [
                    {
                        "type": "text",
                        "text": DOCUMENT_CITATION_INSTRUCTIONS + markdown_content
                    }
                ]
            }
        return {
            "content": [
                {
                    "type": "text",
                    "text": f"Error: 'markdown' field not found in API response. Response: {json.dumps(response_data, indent=2, ensure_ascii=False)}"
                }
            ]
        }
    except requests.exceptions.RequestException as e:
        return {
            "content": [
                {
                    "type": "text",
                    "text": f"Error: Failed to connect to RAG API. {str(e)}"
                }
            ]
        }
    except Exception as e:
        return {
            "content": [
                {
                    "type": "text",
                    "text": f"Error: {str(e)}"
                }
            ]
        }
def table_rag_retrieve(query: str) -> Dict[str, Any]:
    """Call the Table RAG retrieval API and return an MCP tool result.

    When the backend reports that no spreadsheet files exist for this bot,
    transparently falls back to :func:`rag_retrieve` and prefixes the result
    with a note. Failures are returned as "Error: ..." text payloads rather
    than raised, so the MCP layer always receives a well-formed result.
    """
    def _text(message: str) -> Dict[str, Any]:
        # Wrap a plain string as an MCP tool-result payload.
        return {"content": [{"type": "text", "text": message}]}

    try:
        bot_id = sys.argv[1] if len(sys.argv) > 1 else ""
        url = f"{BACKEND_HOST}/v1/table_rag_retrieve/{bot_id}"
        # Auth token derived from the shared master key and bot id.
        auth_token = hashlib.md5(f"{MASTERKEY}:{bot_id}".encode()).hexdigest()
        headers = {
            "content-type": "application/json",
            "authorization": f"Bearer {auth_token}",
        }
        response = requests.post(url, json={"query": query}, headers=headers, timeout=300)
        if response.status_code != 200:
            return _text(f"Error: Table RAG API returned status code {response.status_code}. Response: {response.text}")
        try:
            payload = response.json()
        except json.JSONDecodeError as e:
            return _text(f"Error: Failed to parse API response as JSON. Error: {str(e)}, Raw response: {response.text}")
        if "markdown" not in payload:
            return _text(f"Error: 'markdown' field not found in API response. Response: {json.dumps(payload, indent=2, ensure_ascii=False)}")
        markdown = payload["markdown"]
        if re.search(r"^no excel files found", markdown, re.IGNORECASE):
            # No spreadsheet data on the backend: fall back to plain RAG and
            # prepend a note so the agent knows which source produced it.
            fallback = rag_retrieve(query)
            blocks = fallback.get("content", [])
            if blocks and blocks[0].get("type") == "text":
                blocks[0]["text"] = "No table_rag_retrieve results were found. The content below is the fallback result from rag_retrieve\n\n" + blocks[0]["text"]
            return fallback
        return _text(TABLE_CITATION_INSTRUCTIONS + markdown)
    except requests.exceptions.RequestException as e:
        return _text(f"Error: Failed to connect to Table RAG API. {str(e)}")
    except Exception as e:
        return _text(f"Error: {str(e)}")
async def handle_request(request: Dict[str, Any]) -> Dict[str, Any]:
    """Dispatch one MCP JSON-RPC request to the matching handler.

    Supports ``initialize``, ``ping``, ``tools/list`` and ``tools/call``;
    anything else yields a -32601 error response. Unexpected exceptions are
    converted into a -32603 internal-error response.
    """
    try:
        request_id = request.get("id")
        method = request.get("method")
        params = request.get("params", {})
        if method == "initialize":
            return create_initialize_response(request_id, "rag-retrieve")
        if method == "ping":
            return create_ping_response(request_id)
        if method == "tools/list":
            # Tool definitions live in a JSON file next to this script;
            # fall back to a minimal built-in definition if it is missing.
            tools = load_tools_from_json("rag_retrieve_tools.json")
            if not tools:
                tools = [
                    {
                        "name": "rag_retrieve",
                        "description": "调用RAG检索API根据查询内容检索相关文档。返回包含相关内容的markdown格式结果。",
                        "inputSchema": {
                            "type": "object",
                            "properties": {
                                "query": {
                                    "type": "string",
                                    "description": "检索查询内容"
                                }
                            },
                            "required": ["query"]
                        }
                    }
                ]
            return create_tools_list_response(request_id, tools)
        if method == "tools/call":
            tool_name = params.get("name")
            arguments = params.get("arguments", {})
            if tool_name == "rag_retrieve":
                query = arguments.get("query", "")
                if not query:
                    return create_error_response(request_id, -32602, "Missing required parameter: query")
                return {
                    "jsonrpc": "2.0",
                    "id": request_id,
                    "result": rag_retrieve(query, arguments.get("top_k", 100)),
                }
            if tool_name == "table_rag_retrieve":
                query = arguments.get("query", "")
                if not query:
                    return create_error_response(request_id, -32602, "Missing required parameter: query")
                return {
                    "jsonrpc": "2.0",
                    "id": request_id,
                    "result": table_rag_retrieve(query),
                }
            return create_error_response(request_id, -32601, f"Unknown tool: {tool_name}")
        return create_error_response(request_id, -32601, f"Unknown method: {method}")
    except Exception as e:
        return create_error_response(request.get("id"), -32603, f"Internal error: {str(e)}")
async def main():
    """Main entry point: serve MCP requests over stdio until EOF."""
    # handle_mcp_streaming reads JSON-RPC messages and routes each one
    # through handle_request (provided by mcp_common).
    await handle_mcp_streaming(handle_request)
if __name__ == "__main__":
    asyncio.run(main())

View File

@ -0,0 +1,35 @@
[
{
"name": "rag_retrieve",
"description": "Retrieve relevant documents from the knowledge base. Returns markdown results. Use this tool first only for clearly pure concept, definition, workflow, policy, or explanation questions without structured data needs. If the result is insufficient, try table_rag_retrieve before replying with no result.",
"inputSchema": {
"type": "object",
"properties": {
"query": {
"type": "string",
"description": "Retrieval query content. Rewrite the query when needed to improve recall."
},
"top_k": {
"type": "integer",
"description": "Number of top results to retrieve. Choose dynamically based on retrieval breadth and coverage needs.",
"default": 100
}
},
"required": ["query"]
}
},
{
"name": "table_rag_retrieve",
"description": "Retrieve relevant table data from Excel or spreadsheet files in the knowledge base. Returns markdown results. Use this tool first for structured data, lists, statistics, extraction, mixed questions, and unclear cases. If the result is insufficient, try rag_retrieve before replying with no result.",
"inputSchema": {
"type": "object",
"properties": {
"query": {
"type": "string",
"description": "Retrieval query content for table data. Rewrite the query when needed to improve recall."
}
},
"required": ["query"]
}
}
]

Some files were not shown because too many files have changed in this diff Show More