diff --git a/.github/workflows/auto-unit-test.yml b/.github/workflows/auto-unit-test.yml
index 1595fc769..dace8dab6 100644
--- a/.github/workflows/auto-unit-test.yml
+++ b/.github/workflows/auto-unit-test.yml
@@ -36,7 +36,7 @@ jobs:
       - name: Set up Python
         uses: actions/setup-python@v4
         with:
-          python-version: '3.10'
+          python-version: '3.11'
 
       - name: Install uv
         run: pip install --upgrade uv
diff --git a/.github/workflows/sdk_publish.yml b/.github/workflows/sdk_publish.yml
index 1e5759277..3cc413381 100644
--- a/.github/workflows/sdk_publish.yml
+++ b/.github/workflows/sdk_publish.yml
@@ -21,7 +21,7 @@ jobs:
       - name: Set up Python
         uses: actions/setup-python@v5
         with:
-          python-version: '3.10'
+          python-version: '3.11'
 
       - name: Install build dependencies
         run: |
diff --git a/.gitignore b/.gitignore
index ec5b3a3f9..e0bac2b47 100644
--- a/.gitignore
+++ b/.gitignore
@@ -61,4 +61,9 @@ data/
 sdk/benchmark/.env
 /docker/.env.bak
 
-.venv
\ No newline at end of file
+.venv
+
+.pytest-tmp
+doc/mermaid
+
+.claude/skills/python-import-triage
\ No newline at end of file
diff --git a/backend/adapters/__init__.py b/backend/adapters/__init__.py
new file mode 100644
index 000000000..ed46fc888
--- /dev/null
+++ b/backend/adapters/__init__.py
@@ -0,0 +1,13 @@
+from adapters.exception import JiuwenSDKError, JiuwenSDKUnavailableError, NexentCapabilityError
+
+try:
+    from adapters.jiuwen_sdk_adapter import JiuwenSDKAdapter
+except ModuleNotFoundError:
+    JiuwenSDKAdapter = None  # type: ignore[assignment, misc]
+
+__all__ = [
+    "JiuwenSDKError",
+    "JiuwenSDKUnavailableError",
+    "NexentCapabilityError",
+    "JiuwenSDKAdapter",
+]
diff --git a/backend/adapters/exception.py b/backend/adapters/exception.py
new file mode 100644
index 000000000..63812d3af
--- /dev/null
+++ b/backend/adapters/exception.py
@@ -0,0 +1,13 @@
+class JiuwenSDKError(Exception):
+    """Jiuwen SDK 调用失败的通用异常"""
+    pass
+
+
+class JiuwenSDKUnavailableError(JiuwenSDKError):
+    """Jiuwen SDK 不可用（依赖缺失或未启用）"""
+    pass
+
+
+class NexentCapabilityError(Exception):
+    """nexent 原生模式不支持该能力"""
+    pass
diff --git a/backend/adapters/jiuwen_sdk_adapter.py b/backend/adapters/jiuwen_sdk_adapter.py
new file mode 100644
index 000000000..f62ce9d06
--- /dev/null
+++ b/backend/adapters/jiuwen_sdk_adapter.py
@@ -0,0 +1,514 @@
+"""
+openjiuwen SDK adapter for Nexent.
+
+This module must be imported lazily (not at module load time) because
+openjiuwen 0.1.13 has circular import bugs in its __init__.py files that
+prevent the SDK from loading unless we bypass them.
+
+Import flow:
+  backend/adapters/__init__.py -> try/except -> JiuwenSDKAdapter = None
+  -> when needed: _install_jiuwen_bypasser() -> openjiuwen imports work
+"""
+import asyncio
+import importlib.abc
+import importlib.machinery
+import json
+import logging
+import os
+import sys
+import types
+from typing import Any, List, Literal, Optional
+
+logger = logging.getLogger("jiuwen_adapter")
+
+from adapters.exception import JiuwenSDKError
+
+
+# ----------------------------------------------------------------------
+# Circular import bypasser for openjiuwen 0.1.13
+#
+# openjiuwen has broken __init__.py files that create circular import chains:
+#   tune/__init__.py -> tune.optimizer -> core.operator -> agent_evolving -> ...
+# This bypasser prevents those __init__.py files from executing while still
+# allowing regular .py submodule files to load normally.
+# ----------------------------------------------------------------------
+_CIRCULAR_CHAIN = {
+    "openjiuwen.agent_evolving",
+    "openjiuwen.agent_evolving.trainer",
+    "openjiuwen.agent_evolving.trainer.trainer",
+    "openjiuwen.agent_evolving.trainer.progress",
+    "openjiuwen.core",
+    "openjiuwen.dev_tools",
+    "openjiuwen.dev_tools.tune",
+    "openjiuwen.dev_tools.tune.optimizer",
+    "openjiuwen.dev_tools.tune.optimizer.instruction_optimizer",
+    "openjiuwen.dev_tools.prompt_builder",
+    "openjiuwen.dev_tools.prompt_builder.builder",
+}
+
+
+class _JiuwenInitBypasser(importlib.abc.MetaPathFinder, importlib.abc.Loader):
+    """
+    Meta path finder that intercepts __init__.py loading within openjiuwen,
+    blocking only the packages in the circular import chain while letting
+    all other modules (including base.py files) load normally.
+    """
+
+    def find_spec(self, fullname: str, path: Any, target: Any = None) -> Any:
+        if not fullname.startswith("openjiuwen") or fullname == "openjiuwen":
+            return None
+
+        try:
+            import openjiuwen as _oj
+
+            pkg_root = _oj.__path__[0]
+        except ImportError:
+            return None
+
+        parts = fullname.split(".")[1:]
+        file_path = pkg_root
+        for p in parts:
+            file_path = os.path.join(file_path, p)
+
+        is_package = os.path.isdir(file_path)
+        if not is_package:
+            return None
+
+        init_path = os.path.join(file_path, "__init__.py")
+        if not os.path.exists(init_path):
+            return None
+
+        if fullname not in _CIRCULAR_CHAIN:
+            return None
+
+        spec = importlib.machinery.ModuleSpec(
+            fullname, self, is_package=True, origin="<init bypassed>"
+        )
+        spec.submodule_search_locations = [file_path]
+        return spec
+
+    def create_module(self, module: Any) -> None:
+        return None
+
+    def exec_module(self, module: Any) -> None:
+        import openjiuwen as _oj
+
+        pkg_root = _oj.__path__[0]
+        parts = module.__name__.split(".")[1:]
+        file_path = pkg_root
+        for p in parts:
+            file_path = os.path.join(file_path, p)
+        module.__path__ = [file_path]
+        module.__file__ = os.path.join(file_path, "__init__.py")
+
+    def __getattr__(self, name: str) -> Any:
+        """Handle special attributes like find_distributions to prevent recursion."""
+        import openjiuwen as _oj
+        import importlib
+
+        # Prevent recursion when Python scans sys.meta_path for find_distributions etc.
+        if name in (
+            "find_distributions",
+            "find_module",
+            "__path__",
+            "__name__",
+            "__file__",
+            "__loader__",
+            "__package__",
+            "__spec__",
+        ):
+            raise AttributeError(name)
+
+        pkg_root = _oj.__path__[0]
+        parts = self.__name__.split(".")[1:] + [name]
+        file_path = pkg_root
+        for p in parts:
+            file_path = os.path.join(file_path, p)
+
+        # If it's a package directory, import it as a submodule
+        if os.path.isdir(file_path) and os.path.exists(os.path.join(file_path, "__init__.py")):
+            return importlib.import_module(f"{self.__name__}.{name}")
+        # If it's a regular .py file
+        if os.path.exists(file_path + ".py"):
+            return importlib.import_module(f"{self.__name__}.{name}")
+        raise AttributeError(name)
+
+
+_bypasser_installed = False
+
+
+def _install_jiuwen_bypasser() -> bool:
+    """
+    Install the circular import bypasser for openjiuwen.
+    Returns True if installed, False if already installed or openjiuwen not available.
+    """
+    global _bypasser_installed
+    if _bypasser_installed:
+        return True
+
+    # Stub missing optional dependencies before openjiuwen import chain reaches them
+    _stubbed = [
+        ("pymilvus", {"is_successful": lambda *args, **kwargs: True}),
+        ("dashscope", {}),
+        ("pdfplumber", {}),
+    ]
+    for _name, _attrs in _stubbed:
+        if _name not in sys.modules:
+            _mod = types.ModuleType(_name)
+            for _k, _v in _attrs.items():
+                setattr(_mod, _k, _v)
+            sys.modules[_name] = _mod
+            _mod.__path__ = []
+
+    # Pre-create nested stub modules for pymilvus.client.utils chain
+    if "pymilvus.client" not in sys.modules:
+        _client_mod = types.ModuleType("pymilvus.client")
+        _client_mod.__path__ = []
+        sys.modules["pymilvus.client"] = _client_mod
+    if "pymilvus.client.utils" not in sys.modules:
+        _utils_mod = types.ModuleType("pymilvus.client.utils")
+        _utils_mod.is_successful = lambda *args, **kwargs: True
+        sys.modules["pymilvus.client.utils"] = _utils_mod
+
+    # Stub dashscope sub-modules that may be imported lazily
+    _dashscope_subs = [
+        ("dashscope.api_entities", {}),
+        ("dashscope.api_entities.data", {}),
+        ("dashscope.api_entities.dashscope_response", {"DashScopeAPIResponse": object}),
+        ("dashscope.common", {"REQUEST_TIMEOUT_KEYWORD": "timeout"}),
+        ("dashscope.common.constants", {"REQUEST_TIMEOUT_KEYWORD": "timeout"}),
+    ]
+    for _name, _attrs in _dashscope_subs:
+        if _name not in sys.modules:
+            _m = types.ModuleType(_name)
+            _m.__path__ = []
+            for _k, _v in _attrs.items():
+                setattr(_m, _k, _v)
+            sys.modules[_name] = _m
+
+    try:
+        import openjiuwen  # noqa: F401
+    except ImportError:
+        return False
+
+    for finder in sys.meta_path:
+        if isinstance(finder, _JiuwenInitBypasser):
+            _bypasser_installed = True
+            return True
+
+    sys.meta_path.insert(0, _JiuwenInitBypasser())
+    _bypasser_installed = True
+    return True
+
+
+# ----------------------------------------------------------------------
+# Language helpers
+# ----------------------------------------------------------------------
+LANGUAGE_MAP = {"zh": "zh-CN", "en": "en-US"}
+
+
+def normalize_language(language: str) -> str:
+    return LANGUAGE_MAP.get(language, "zh-CN")
+
+
+def run_async(coro):
+    """
+    Safely run async coroutine from sync context (FastAPI or Celery).
+    Handles existing event loops properly.
+    """
+    try:
+        loop = asyncio.get_running_loop()
+    except RuntimeError:
+        return asyncio.run(coro)
+
+    if loop.is_running():
+        try:
+            import nest_asyncio
+            nest_asyncio.apply()
+            return loop.run_until_complete(coro)
+        except ImportError:
+            import concurrent.futures
+
+            def run_in_thread():
+                new_loop = asyncio.new_event_loop()
+                asyncio.set_event_loop(new_loop)
+                try:
+                    return new_loop.run_until_complete(coro)
+                finally:
+                    new_loop.close()
+
+            with concurrent.futures.ThreadPoolExecutor(max_workers=1) as executor:
+                future = executor.submit(run_in_thread)
+                return future.result()
+
+    return loop.run_until_complete(coro)
+
+
+# ----------------------------------------------------------------------
+# Jiuwen SDK lazy import helpers
+# ----------------------------------------------------------------------
+def _lazy_import_jiuwen_config():
+    """Lazily import only lightweight Jiuwen config classes."""
+    _install_jiuwen_bypasser()
+
+    try:
+        import openjiuwen  # noqa: F401
+    except ImportError as e:
+        raise JiuwenSDKError(f"Jiuwen SDK 未安装: {e}") from e
+
+    from openjiuwen.core.foundation.llm.schema.config import (
+        ModelRequestConfig,
+        ModelClientConfig,
+        ProviderType,
+    )
+
+    return ModelRequestConfig, ModelClientConfig, ProviderType
+
+
+def build_jiuwen_model_configs(model_id: int, tenant_id: str):
+    """将 nexent 模型配置转换为 Jiuwen 配置对象"""
+    from database.model_management_db import get_model_by_model_id
+    from utils.config_utils import get_model_name_from_config
+
+    ModelRequestConfig, ModelClientConfig, ProviderType = _lazy_import_jiuwen_config()
+
+    model_config = get_model_by_model_id(model_id, tenant_id)
+    if not model_config:
+        raise JiuwenSDKError(f"model_id={model_id} not found")
+
+    api_base = (model_config.get("base_url", "") or "").strip()
+    if not api_base:
+        api_base = "https://api.openai.com/v1"
+
+    # Jiuwen ModelClientConfig defaults to timeout=60.0, max_retries=3.
+    # For prompt optimization calls, 60s can be too small. Reuse Nexent model config timeout_seconds.
+    timeout_seconds = model_config.get("timeout_seconds")
+    if timeout_seconds is None:
+        timeout_seconds = 120
+
+    ssl_cert = model_config.get("ssl_cert") or None
+    ssl_verify = model_config.get("ssl_verify", True)
+    if ssl_verify and not ssl_cert:
+        ssl_verify = False
+
+    client_config = ModelClientConfig(
+        client_provider=ProviderType.OpenAI,
+        api_key=model_config["api_key"],
+        api_base=api_base,
+        timeout=float(timeout_seconds),
+        verify_ssl=ssl_verify,
+        ssl_cert=ssl_cert,
+    )
+
+    request_config = ModelRequestConfig(
+        model_name=get_model_name_from_config(model_config),
+        temperature=0.3,
+    )
+    return request_config, client_config
+
+
+def _lazy_import_jiuwen_builders():
+    """Lazily import prompt builders only when optimization paths need them."""
+    _install_jiuwen_bypasser()
+
+    try:
+        import openjiuwen  # noqa: F401
+    except ImportError as e:
+        raise JiuwenSDKError(f"Jiuwen SDK 未安装: {e}") from e
+
+    from openjiuwen.dev_tools.prompt_builder.builder.feedback_prompt_builder import (
+        FeedbackPromptBuilder,
+    )
+    from openjiuwen.dev_tools.prompt_builder.builder.badcase_prompt_builder import (
+        BadCasePromptBuilder,
+    )
+
+    return FeedbackPromptBuilder, BadCasePromptBuilder
+
+
+def _unwrap_prompt_response(text: str) -> str:
+    """Strip JSON wrapper or markdown fence that Jiuwen LLM sometimes generates."""
+    _logger = logging.getLogger("jiuwen_adapter")
+    _logger.debug(f"[unwrap] raw ({len(text)} chars): {text[:200]}")
+
+    # Step 1: strip markdown code fences
+    text = text.strip()
+    if text.startswith("```"):
+        for lang in ("json", ""):
+            fence = f"```{lang}\n"
+            if text.startswith(fence):
+                text = text[len(fence):]
+                if text.endswith("\n```"):
+                    text = text[:-4]
+                elif text.endswith("```"):
+                    text = text[:-3]
+                break
+        text = text.strip()
+        _logger.debug(f"[unwrap] after fence strip ({len(text)} chars)")
+
+    # Step 2: try standard JSON parse (handles format 1 and 2)
+    if text.startswith("{"):
+        try:
+            parsed = json.loads(text)
+            if isinstance(parsed, dict) and "prompt" in parsed:
+                result = parsed["prompt"].strip()
+                _logger.debug(f"[unwrap] extracted prompt ({len(result)} chars)")
+                return result
+            if isinstance(parsed, dict) and "result" in parsed:
+                result = parsed["result"].strip()
+                _logger.debug(f"[unwrap] extracted result ({len(result)} chars)")
+                return result
+        except Exception:
+            pass
+
+    # Step 3: format 3 and 4 - raw text (possibly multi-line), return as-is
+    _logger.debug(f"[unwrap] no JSON wrapper, returning raw ({len(text)} chars)")
+    return text
+
+
+def _lazy_import_jiuwen_tune_types():
+    """Lazily import Jiuwen tune types only when badcase flow needs them."""
+    _install_jiuwen_bypasser()
+    from openjiuwen.dev_tools.tune.base import Case, EvaluatedCase
+    return Case, EvaluatedCase
+
+
+def to_jiuwen_evaluated_case(bad_case) -> Any:
+    """将 nexent BadCase 转换为 Jiuwen EvaluatedCase"""
+    Case, EvaluatedCase = _lazy_import_jiuwen_tune_types()
+
+    case = Case(
+        inputs={"question": bad_case.question},
+        label={"answer": bad_case.label or ""},
+    )
+    return EvaluatedCase(
+        case=case,
+        answer={"content": bad_case.answer},
+        score=0.0,
+        reason=bad_case.reason or "",
+    )
+
+
+# ----------------------------------------------------------------------
+# Main adapter class
+# ----------------------------------------------------------------------
+class JiuwenSDKAdapter:
+    """
+    Jiuwen SDK 调用适配器
+
+    封装 Jiuwen SDK 的所有调用，内部不处理降级，
+    失败时抛出 JiuwenSDKError，由上层 PromptOptimizationService 决定是否降级
+    """
+
+    def __init__(self, model_id: int, tenant_id: str):
+        self.model_id = model_id
+        self.tenant_id = tenant_id
+        self.logger = logging.getLogger("jiuwen_adapter")
+
+    def _ensure_available(self):
+        """确保 Jiuwen SDK 可用"""
+        if not _bypasser_installed:
+            _install_jiuwen_bypasser()
+
+        try:
+            import openjiuwen  # noqa: F401
+        except ImportError as e:
+            raise JiuwenSDKError(f"Jiuwen SDK 未安装: {e}") from e
+
+    def optimize(
+        self,
+        prompt: str,
+        feedback: str,
+        mode: Literal["general", "insert", "select"] = "general",
+        start_pos: Optional[int] = None,
+        end_pos: Optional[int] = None,
+        language: str = "zh",
+    ) -> str:
+        """
+        调用 Jiuwen FeedbackPromptBuilder
+
+        Raises:
+            JiuwenSDKError: SDK 调用失败
+        """
+        self._ensure_available()
+
+        logger.info(f"[jiuwen-adapter] mode={mode}, start_pos={start_pos}, end_pos={end_pos}")
+
+        request_config, client_config = build_jiuwen_model_configs(
+            self.model_id, self.tenant_id
+        )
+        logger.info(
+            f"[jiuwen-adapter] model_id={self.model_id}, tenant_id={self.tenant_id}, "
+            f"api_base={client_config.api_base}, model={request_config.model_name}, "
+            f"timeout={getattr(client_config, 'timeout', None)}, max_retries={getattr(client_config, 'max_retries', None)}"
+        )
+        FeedbackPromptBuilder, _ = _lazy_import_jiuwen_builders()
+
+        builder = FeedbackPromptBuilder(
+            model_config=request_config,
+            model_client_config=client_config,
+        )
+
+        try:
+            result = run_async(
+                builder.build(
+                    prompt=prompt,
+                    feedback=feedback,
+                    mode=mode,
+                    start_pos=start_pos,
+                    end_pos=end_pos,
+                    language=normalize_language(language),
+                )
+            )
+            if result is None:
+                raise JiuwenSDKError("Jiuwen FeedbackPromptBuilder 返回为空")
+            return _unwrap_prompt_response(str(result))
+        except Exception as e:
+            self.logger.error(f"Jiuwen FeedbackPromptBuilder 调用失败: {e}")
+            raise JiuwenSDKError(f"优化调用失败: {e}") from e
+
+    def optimize_badcase(
+        self,
+        prompt: str,
+        bad_cases: List,
+        language: str = "zh",
+    ) -> str:
+        """
+        调用 Jiuwen BadCasePromptBuilder
+
+        Raises:
+            JiuwenSDKError: SDK 调用失败
+        """
+        self._ensure_available()
+
+        _, BadCasePromptBuilder = _lazy_import_jiuwen_builders()
+
+        request_config, client_config = build_jiuwen_model_configs(
+            self.model_id, self.tenant_id
+        )
+        builder = BadCasePromptBuilder(
+            model_config=request_config,
+            model_client_config=client_config,
+        )
+
+        jiuwen_cases = [to_jiuwen_evaluated_case(bc) for bc in bad_cases]
+
+        try:
+            result = run_async(
+                builder.build(
+                    prompt=prompt,
+                    cases=jiuwen_cases,
+                    language=normalize_language(language),
+                )
+            )
+            if result is None:
+                raise JiuwenSDKError("Jiuwen BadCasePromptBuilder 返回为空")
+            return _unwrap_prompt_response(str(result))
+        except Exception as e:
+            self.logger.error(f"Jiuwen BadCasePromptBuilder 调用失败: {e}")
+            raise JiuwenSDKError(f"BadCasePromptBuilder 调用失败: {e}") from e
+
+    def generate(self, **kwargs) -> dict:
+        """调用 Jiuwen 提示词生成能力"""
+        self._ensure_available()
+        raise JiuwenSDKError("Jiuwen 提示词生成能力尚未实现")
diff --git a/backend/agents/create_agent_info.py b/backend/agents/create_agent_info.py
index 50df7eb99..7e3b42e28 100644
--- a/backend/agents/create_agent_info.py
+++ b/backend/agents/create_agent_info.py
@@ -1,12 +1,12 @@
-﻿import threading
+﻿import json
+import threading
 import logging
-from typing import List, Optional
+from typing import Any, Dict, List, Optional
 from urllib.parse import urljoin
-from datetime import datetime
 
 from jinja2 import Template, StrictUndefined
 from nexent.core.utils.observer import MessageObserver
-from nexent.core.agents.agent_model import AgentRunInfo, ModelConfig, AgentConfig, ToolConfig, ExternalA2AAgentConfig, AgentHistory
+from nexent.core.agents.agent_model import AgentRunInfo, ModelConfig, AgentConfig, ToolConfig, ExternalA2AAgentConfig, AgentHistory, AgentVerificationConfig
 from nexent.core.agents.agent_context import ContextManagerConfig
 from nexent.memory.memory_service import search_memory_in_levels
 
@@ -22,7 +22,11 @@
 from database.a2a_agent_db import PROTOCOL_JSONRPC
 from services.memory_config_service import build_memory_context
 from services.image_service import get_video_understanding_model, get_vlm_model
-from database.agent_db import search_agent_info_by_agent_id, query_sub_agents_id_list
+from database.agent_db import (
+    search_agent_info_by_agent_id,
+    query_sub_agent_relations,
+    resolve_sub_agent_version_no,
+)
 from database.agent_version_db import query_current_version_no
 from database.tool_db import search_tools_for_sub_agent
 from database.model_management_db import get_model_records, get_model_by_model_id
@@ -33,12 +37,71 @@
 from utils.config_utils import tenant_config_manager, get_model_name_from_config
 from utils.context_utils import build_context_components
 from consts.const import LOCAL_MCP_SERVER, MODEL_CONFIG_MAPPING, LANGUAGE, DATA_PROCESS_SERVICE, MINIO_DEFAULT_BUCKET
+from consts.model import AgentToolParamsRequest, ToolParamsRequest
 from consts.exceptions import ValidationError
 
 logger = logging.getLogger("create_agent_info")
 logger.setLevel(logging.DEBUG)
 
 
+def _normalize_tool_params_request(tool_params: Optional[ToolParamsRequest | Dict[str, Any]]) -> ToolParamsRequest:
+    """Normalize request-scoped tool parameter overrides into a ToolParamsRequest."""
+    if tool_params is None:
+        return ToolParamsRequest()
+    if isinstance(tool_params, ToolParamsRequest):
+        return tool_params
+    if not isinstance(tool_params, dict):
+        raise ValidationError("tool_params must be an object.")
+    try:
+        return ToolParamsRequest.model_validate(tool_params)
+    except Exception as exc:
+        raise ValidationError(f"Invalid tool_params payload: {exc}") from exc
+
+
+def _get_agent_tool_overrides(
+    tool_params: Optional[ToolParamsRequest],
+    agent_name: Optional[str],
+) -> Dict[str, Dict[str, Any]]:
+    """Resolve tool overrides for a specific agent by its name."""
+    if tool_params is None:
+        return {}
+    if not agent_name:
+        return {}
+    agent_override = tool_params.agents.get(agent_name)
+    if agent_override is None:
+        return {}
+    return dict(agent_override.tools)
+
+
+def _merge_tool_params(
+    tool_record: Dict[str, Any],
+    override_params: Optional[Dict[str, Any]],
+    extra_params: Optional[Dict[str, Any]] = None,
+) -> Dict[str, Any]:
+    """Merge request overrides on top of tool instance defaults from DB.
+
+    Args:
+        tool_record: Tool configuration from database
+        override_params: Request-scoped overrides from tool_params
+        extra_params: Additional internal params not in DB schema (e.g., document_paths)
+
+    Returns:
+        Merged params dict with DB defaults, overrides, and extra params
+    """
+    merged_params: Dict[str, Any] = {}
+    for param in tool_record.get("params", []):
+        merged_params[param["name"]] = param.get("default")
+
+    if override_params:
+        merged_params.update(override_params)
+
+    # Extra params (e.g., internal access control params) always take precedence
+    if extra_params:
+        merged_params.update(extra_params)
+
+    return merged_params
+
+
 def _build_internal_s3_url(file: dict) -> str:
     """Build a valid S3 URL for internal tools from uploaded file metadata."""
     if not isinstance(file, dict):
@@ -310,18 +373,23 @@ async def create_agent_config(
     allow_memory_search: bool = True,
     version_no: int = 0,
     override_model_id: int | None = None,
+    tool_params: Optional[ToolParamsRequest | Dict[str, Any]] = None,
 ):
+    normalized_tool_params = _normalize_tool_params_request(tool_params)
     agent_info = search_agent_info_by_agent_id(
         agent_id=agent_id, tenant_id=tenant_id, version_no=version_no)
 
     # create sub agent
-    sub_agent_id_list = query_sub_agents_id_list(
+    sub_agent_relations = query_sub_agent_relations(
         main_agent_id=agent_id, tenant_id=tenant_id, version_no=version_no)
     managed_agents = []
-    for sub_agent_id in sub_agent_id_list:
-        # Get the current published version for this sub-agent (from draft version 0)
-        sub_agent_version_no = query_current_version_no(
-            agent_id=sub_agent_id, tenant_id=tenant_id) or 0
+    for rel in sub_agent_relations:
+        sub_agent_id = rel['selected_agent_id']
+        sub_agent_version_no = resolve_sub_agent_version_no(
+            selected_agent_id=sub_agent_id,
+            selected_agent_version_no=rel.get('selected_agent_version_no'),
+            tenant_id=tenant_id,
+        )
         sub_agent_config = await create_agent_config(
             agent_id=sub_agent_id,
             tenant_id=tenant_id,
@@ -331,13 +399,20 @@ async def create_agent_config(
             allow_memory_search=allow_memory_search,
             version_no=sub_agent_version_no,
             override_model_id=None,
+            tool_params=normalized_tool_params,
         )
         managed_agents.append(sub_agent_config)
 
     # create external A2A agents (synchronous function, no await needed)
     external_a2a_agents = _get_external_a2a_agents(agent_id, tenant_id, version_no)
 
-    tool_list = await create_tool_config_list(agent_id, tenant_id, user_id, version_no=version_no)
+    tool_list = await create_tool_config_list(
+        agent_id,
+        tenant_id,
+        user_id,
+        version_no=version_no,
+        tool_params=normalized_tool_params,
+    )
 
     # Build system prompt: prioritize segmented fields, fallback to original prompt field if not available
     duty_prompt = agent_info.get("duty_prompt", "")
@@ -383,6 +458,77 @@ async def create_agent_config(
             # Bubble up to streaming layer so it can emit <MEM_FAILED> and fall back
             raise Exception(f"Failed to retrieve memory list: {e}")
 
+    # Append active memory tools if memory is enabled
+    if memory_context.user_config.memory_switch and memory_context.memory_config:
+        try:
+            memory_metadata = {
+                "memory_config": memory_context.memory_config,
+                "memory_user_config": memory_context.user_config,
+                "tenant_id": memory_context.tenant_id,
+                "user_id": memory_context.user_id,
+                "agent_id": memory_context.agent_id,
+            }
+
+            store_tool_config = ToolConfig(
+                class_name="StoreMemoryTool",
+                name="store_memory",
+                description=(
+                    "Save important information to long-term memory for future recall. "
+                    "Use this when the user shares personal preferences, facts about themselves, "
+                    "project context, or instructions that should persist across conversations. "
+                    "Do NOT store transient information like temporary calculations, information "
+                    "already in the knowledge base, or data the user explicitly says to forget."
+                ),
+                inputs=json.dumps({
+                    "content": {
+                        "type": "string",
+                        "description": "The information to remember",
+                        "description_zh": "需要记住的信息"
+                    }
+                }, ensure_ascii=False),
+                output_type="string",
+                params={},
+                source="local",
+                usage=None,
+                metadata=memory_metadata,
+            )
+            tool_list.append(store_tool_config)
+
+            search_tool_config = ToolConfig(
+                class_name="SearchMemoryTool",
+                name="search_memory",
+                description=(
+                    "Search long-term memory for relevant information from previous interactions. "
+                    "Use this when you need context about the user's preferences, past decisions, "
+                    "or previously discussed topics that aren't in the current conversation. "
+                    "The system already provides some memory context automatically -- use this tool "
+                    "when you need to search for specific information not already available."
+                ),
+                inputs=json.dumps({
+                    "query": {
+                        "type": "string",
+                        "description": "Natural language query describing what to search for",
+                        "description_zh": "描述要搜索内容的自然语言查询"
+                    },
+                    "top_k": {
+                        "type": "integer",
+                        "description": "Maximum number of results to return",
+                        "description_zh": "返回结果的最大数量",
+                        "default": 5,
+                        "nullable": True
+                    }
+                }, ensure_ascii=False),
+                output_type="string",
+                params={},
+                source="local",
+                usage=None,
+                metadata=memory_metadata,
+            )
+            tool_list.append(search_tool_config)
+            logger.debug("Active memory tools appended to agent tool list")
+        except Exception as e:
+            logger.warning(f"Failed to append active memory tools: {e}")
+
     # Build knowledge base summary
     knowledge_base_summary = ""
     try:
@@ -413,7 +559,6 @@ async def create_agent_config(
     # Get skills list for prompt template
     skills = _get_skills_for_template(agent_id, tenant_id, version_no)
 
-    time_str = datetime.now().strftime("%Y-%m-%d %H:%M:%S")
     is_manager = len(managed_agents) > 0 or len(external_a2a_agents) > 0
 
     render_kwargs = {
@@ -428,7 +573,6 @@ async def create_agent_config(
         "APP_DESCRIPTION": app_description,
         "memory_list": memory_list,
         "knowledge_base_summary": knowledge_base_summary,
-        "time": time_str,
         "user_id": user_id,
     }
     system_prompt = Template(prompt_template["system_prompt"], undefined=StrictUndefined).render(render_kwargs)
@@ -457,7 +601,6 @@ async def create_agent_config(
             few_shots=few_shots_prompt,
             app_name=app_name,
             app_description=app_description,
-            time_str=time_str,
             user_id=user_id,
             language=language,
             is_manager=is_manager,
@@ -490,21 +633,48 @@ async def create_agent_config(
         external_a2a_agents=external_a2a_agents,
         context_manager_config=cm_config,
         context_components=context_components,
+        verification_config=AgentVerificationConfig.model_validate(agent_info.get("verification_config") or {}),
     )
     return agent_config
 
 
-async def create_tool_config_list(agent_id, tenant_id, user_id, version_no: int = 0):
-    # create tool
+async def create_tool_config_list(
+    agent_id,
+    tenant_id,
+    user_id,
+    version_no: int = 0,
+    tool_params: Optional[ToolParamsRequest | Dict[str, Any]] = None,
+):
     tool_config_list = []
     langchain_tools = await discover_langchain_tools()
+    normalized_tool_params = _normalize_tool_params_request(tool_params)
 
     # now only admin can modify the agent, user_id is not used
     tools_list = search_tools_for_sub_agent(agent_id, tenant_id, version_no=version_no)
+
+    # Look up agent name for use in error messages.
+    # Agent name is optional for tool_params matching (matching uses tool identifiers only),
+    # but we include it in error messages so callers can identify which agent/tool caused a failure.
+    agent_info = search_agent_info_by_agent_id(agent_id=agent_id, tenant_id=tenant_id, version_no=version_no)
+    agent_name = agent_info.get("name") if agent_info else None
+    agent_tool_overrides = _get_agent_tool_overrides(normalized_tool_params, agent_name)
+
+    tool_keys_seen = set()
     for tool in tools_list:
-        param_dict = {}
-        for param in tool.get("params", []):
-            param_dict[param["name"]] = param.get("default")
+        tool_identifier = tool.get("name") or tool.get("class_name")
+        if tool_identifier in tool_keys_seen:
+            raise ValidationError(
+                f"Duplicate tool identifier '{tool_identifier}' found in agent '{agent_name or agent_id}'."
+            )
+        tool_keys_seen.add(tool_identifier)
+
+        override_params = None
+        if tool.get("name") in agent_tool_overrides:
+            override_params = agent_tool_overrides[tool.get("name")]
+        elif tool.get("class_name") in agent_tool_overrides:
+            override_params = agent_tool_overrides[tool.get("class_name")]
+
+        param_dict = _merge_tool_params(tool, override_params)
         tool_config = ToolConfig(
             class_name=tool.get("class_name"),
             name=tool.get("name"),
@@ -523,12 +693,21 @@ async def create_tool_config_list(agent_id, tenant_id, user_id, version_no: int
                     tool_config.metadata = langchain_tool
                     break
 
+        # Extract document_paths for KnowledgeBaseSearchTool (internal access control, not in DB schema)
+        document_paths = None
+        if override_params and "document_paths" in override_params:
+            document_paths = override_params.get("document_paths")
+        # Also check using the tool name as key
+        if not document_paths:
+            kb_overrides = agent_tool_overrides.get("knowledge_base_search")
+            if kb_overrides and "document_paths" in kb_overrides:
+                document_paths = kb_overrides.get("document_paths")
+
         # special logic for search tools that may use reranking models
         if tool_config.class_name == "KnowledgeBaseSearchTool":
-            rerank = param_dict.get("rerank", False)
-            rerank_model_name = param_dict.get("rerank_model_name", "")
+            rerank = tool_config.params.get("rerank", False)
+            rerank_model_name = tool_config.params.get("rerank_model_name", "")
             rerank_model = None
-            is_multimodal = bool(tool_config.params.pop("multimodal", False))
             if rerank and rerank_model_name:
                 rerank_model = get_rerank_model(
                     tenant_id=tenant_id, model_name=rerank_model_name
@@ -536,7 +715,7 @@ async def create_tool_config_list(agent_id, tenant_id, user_id, version_no: int
 
             # Build display_name to index_name mapping for LLM parameter conversion
             # Also build reverse mapping (index_name -> display_name) for knowledge_base_summary
-            index_names = param_dict.get("index_names", [])
+            index_names = tool_config.params.get("index_names", [])
             display_name_to_index_map = {}
             index_name_to_display_map = {}
             if index_names:
@@ -552,12 +731,14 @@ async def create_tool_config_list(agent_id, tenant_id, user_id, version_no: int
                 "rerank_model": rerank_model,
                 "display_name_to_index_map": display_name_to_index_map,
                 "index_name_to_display_map": index_name_to_display_map,
+                # Internal access control: restrict results to specific document paths (path_or_urls)
+                "document_paths": document_paths,
             }
 
-            # Must have embedding model for knowledge base search
             if not index_names:
                 raise ValidationError(
-                    "Embedding model is required for knowledge_base_search but index_names is empty")
+                    f"[{agent_name or agent_id}] knowledge_base_search tool requires index_names, "
+                    f"but it is not configured in the agent and not provided via tool_params.")
 
             embedding_model, _, _ = get_embedding_model_by_index_name(tenant_id, index_names[0])
             if not embedding_model:
@@ -566,8 +747,8 @@ async def create_tool_config_list(agent_id, tenant_id, user_id, version_no: int
                     f"Please configure an embedding model for this knowledge base.")
             tool_config.metadata["embedding_model"] = embedding_model
         elif tool_config.class_name in ["DifySearchTool", "DataMateSearchTool"]:
-            rerank = param_dict.get("rerank", False)
-            rerank_model_name = param_dict.get("rerank_model_name", "")
+            rerank = tool_config.params.get("rerank", False)
+            rerank_model_name = tool_config.params.get("rerank_model_name", "")
             rerank_model = None
             if rerank and rerank_model_name:
                 rerank_model = get_rerank_model(
@@ -861,6 +1042,7 @@ async def create_agent_run_info(
     is_debug: bool = False,
     override_version_no: int | None = None,
     override_model_id: int | None = None,
+    tool_params: Optional[ToolParamsRequest | Dict[str, Any]] = None,
 ):
     # Determine which version_no to use based on is_debug flag
     # If is_debug=false, use the current published version (current_version_no)
@@ -893,7 +1075,7 @@ async def create_agent_run_info(
     if override_model_id is not None:
         create_config_kwargs["override_model_id"] = override_model_id
 
-    agent_config = await create_agent_config(**create_config_kwargs)
+    agent_config = await create_agent_config(**create_config_kwargs, tool_params=tool_params)
 
     remote_mcp_list = await get_remote_mcp_server_list(tenant_id=tenant_id, is_need_auth=True)
     default_mcp_url = urljoin(LOCAL_MCP_SERVER, "sse")
diff --git a/backend/apps/agent_app.py b/backend/apps/agent_app.py
index e280ff422..87abbf9e8 100644
--- a/backend/apps/agent_app.py
+++ b/backend/apps/agent_app.py
@@ -195,8 +195,6 @@ async def export_agent_api(request: AgentIDRequest, authorization: Optional[str]
                     "Content-Disposition": f"attachment; filename=\"{result.get('filename', 'agent_export.zip')}\""
                 }
             )
-        if isinstance(result, str):
-            result = json.loads(result)
         return ConversationResponse(code=0, message="success", data=result)
     except Exception as e:
         logger.error(f"Agent export error: {str(e)}")
@@ -621,3 +619,5 @@ async def list_published_agents_api(
         raise HTTPException(
             status_code=HTTPStatus.INTERNAL_SERVER_ERROR, detail="Published agents list error."
         )
+
+
diff --git a/backend/apps/agent_repository_app.py b/backend/apps/agent_repository_app.py
new file mode 100644
index 000000000..e9da2fde0
--- /dev/null
+++ b/backend/apps/agent_repository_app.py
@@ -0,0 +1,134 @@
+import logging
+from http import HTTPStatus
+from typing import Optional
+
+from fastapi import APIRouter, Body, Header, HTTPException, Query
+from starlette.responses import JSONResponse
+
+from consts.exceptions import SkillDuplicateError, UnauthorizedError
+from services.agent_repository_service import (
+    create_agent_repository_listing_impl,
+    import_agent_from_repository_impl,
+    list_agent_repository_listings_impl,
+    update_agent_repository_status_impl,
+)
+from utils.auth_utils import get_current_user_id
+
+agent_repository_router = APIRouter(prefix="/repository/agent")
+logger = logging.getLogger("agent_repository_app")
+
+
+@agent_repository_router.get("")
+async def list_agent_repository_listings_api(
+    status: Optional[str] = Query(None, description="Filter by listing status"),
+    authorization: str = Header(None),
+):
+    """List all marketplace repository listings with optional status filter."""
+    try:
+        get_current_user_id(authorization)
+        result = list_agent_repository_listings_impl(status=status)
+        return JSONResponse(status_code=HTTPStatus.OK, content=result)
+    except UnauthorizedError as e:
+        raise HTTPException(status_code=HTTPStatus.UNAUTHORIZED, detail=str(e))
+    except ValueError as e:
+        raise HTTPException(status_code=HTTPStatus.BAD_REQUEST, detail=str(e))
+    except Exception as e:
+        logger.error(f"List agent repository listings error: {str(e)}")
+        raise HTTPException(
+            status_code=HTTPStatus.INTERNAL_SERVER_ERROR,
+            detail="List agent repository listings error.",
+        )
+
+
+@agent_repository_router.patch("/{agent_repository_id}/status")
+async def update_agent_repository_status_api(
+    agent_repository_id: int,
+    status: str = Body(
+        ...,
+        embed=True,
+        description=(
+            "New status: NOT_SHARED (未共享) / PENDING_REVIEW (待审核) / "
+            "REJECTED (审核驳回) / SHARED (已共享)"
+        ),
+    ),
+    authorization: str = Header(None),
+):
+    """Update marketplace repository listing status (share, unshare, approve, reject)."""
+    try:
+        user_id, _ = get_current_user_id(authorization)
+        result = update_agent_repository_status_impl(
+            agent_repository_id=agent_repository_id,
+            status=status,
+            user_id=user_id,
+        )
+        return JSONResponse(status_code=HTTPStatus.OK, content=result)
+    except UnauthorizedError as e:
+        raise HTTPException(status_code=HTTPStatus.UNAUTHORIZED, detail=str(e))
+    except ValueError as e:
+        raise HTTPException(status_code=HTTPStatus.BAD_REQUEST, detail=str(e))
+    except Exception as e:
+        logger.error(f"Update agent repository status error: {str(e)}")
+        raise HTTPException(
+            status_code=HTTPStatus.INTERNAL_SERVER_ERROR,
+            detail="Update agent repository status error.",
+        )
+
+
+@agent_repository_router.post("/{agent_id}/versions/{version_no}")
+async def create_agent_repository_listing_api(
+    agent_id: int,
+    version_no: int,
+    authorization: str = Header(None),
+):
+    """Create or update a marketplace repository listing from an agent version snapshot."""
+    try:
+        user_id, tenant_id = get_current_user_id(authorization)
+        result = await create_agent_repository_listing_impl(
+            agent_id=agent_id,
+            tenant_id=tenant_id,
+            user_id=user_id,
+            version_no=version_no,
+        )
+        return JSONResponse(status_code=HTTPStatus.OK, content=result)
+    except UnauthorizedError as e:
+        raise HTTPException(status_code=HTTPStatus.UNAUTHORIZED, detail=str(e))
+    except ValueError as e:
+        raise HTTPException(status_code=HTTPStatus.BAD_REQUEST, detail=str(e))
+    except Exception as e:
+        logger.error(f"Create agent repository listing error: {str(e)}")
+        raise HTTPException(
+            status_code=HTTPStatus.INTERNAL_SERVER_ERROR,
+            detail="Create agent repository listing error.",
+        )
+
+
+@agent_repository_router.post("/{agent_repository_id}/import")
+async def import_agent_from_repository_api(
+    agent_repository_id: int,
+    authorization: Optional[str] = Header(None),
+):
+    """Import an agent tree from a marketplace repository listing into the current tenant."""
+    try:
+        await import_agent_from_repository_impl(
+            agent_repository_id=agent_repository_id,
+            authorization=authorization,
+        )
+        return JSONResponse(status_code=HTTPStatus.OK, content={})
+    except UnauthorizedError as e:
+        raise HTTPException(status_code=HTTPStatus.UNAUTHORIZED, detail=str(e))
+    except SkillDuplicateError as exc:
+        raise HTTPException(
+            status_code=HTTPStatus.CONFLICT,
+            detail={
+                "type": "skill_duplicate",
+                "duplicate_skills": exc.duplicate_names,
+            },
+        )
+    except ValueError as e:
+        raise HTTPException(status_code=HTTPStatus.NOT_FOUND, detail=str(e))
+    except Exception as e:
+        logger.error(f"Import agent from repository error: {str(e)}")
+        raise HTTPException(
+            status_code=HTTPStatus.INTERNAL_SERVER_ERROR,
+            detail="Import agent from repository error.",
+        )
diff --git a/backend/apps/app_factory.py b/backend/apps/app_factory.py
index 219da5b82..02816cec1 100644
--- a/backend/apps/app_factory.py
+++ b/backend/apps/app_factory.py
@@ -101,6 +101,16 @@ async def generic_exception_handler(request, exc):
         if isinstance(exc, AppException):
             return await app_exception_handler(request, exc)
 
+        # Handle NexentCapabilityError with a friendly message
+        from adapters.exception import NexentCapabilityError as _NCE
+
+        if isinstance(exc, _NCE):
+            logger.warning(f"NexentCapabilityError: {exc}")
+            return JSONResponse(
+                status_code=400,
+                content={"message": str(exc)},
+            )
+
         logger.error(f"Generic Exception: {exc}")
         return JSONResponse(
             status_code=500,
diff --git a/backend/apps/cas_app.py b/backend/apps/cas_app.py
new file mode 100644
index 000000000..dbf4815f8
--- /dev/null
+++ b/backend/apps/cas_app.py
@@ -0,0 +1,156 @@
+import html
+import logging
+from http import HTTPStatus
+from typing import Optional
+from urllib.parse import parse_qs, urlsplit
+
+from fastapi import APIRouter, HTTPException, Query, Request
+from fastapi.responses import HTMLResponse, JSONResponse, RedirectResponse
+
+from services.cas_service import (
+    CAS_SERVER_URL,
+    CasAuthenticationError,
+    build_login_url,
+    build_renew_url,
+    get_cas_config,
+    login_with_ticket,
+    renew_with_ticket,
+    revoke_from_logout_request,
+)
+
+logger = logging.getLogger(__name__)
+router = APIRouter(prefix="/user/cas", tags=["cas"])
+
+
+@router.get("/config")
+async def config():
+    return JSONResponse(
+        status_code=HTTPStatus.OK,
+        content={"message": "success", "data": get_cas_config()},
+    )
+
+
+@router.get("/login")
+async def login(redirect: str = Query("/", description="URL to return to after login")):
+    try:
+        login_url = _require_cas_server_redirect(build_login_url(redirect))
+        return RedirectResponse(url=login_url, status_code=HTTPStatus.FOUND)
+    except CasAuthenticationError as exc:
+        logger.warning("CAS login rejected: %s", exc)
+        raise HTTPException(status_code=HTTPStatus.BAD_REQUEST, detail="CAS login is not available")
+
+
+@router.get("/callback")
+async def callback(ticket: str = "", redirect: str = "/"):
+    try:
+        result = await login_with_ticket(ticket, redirect)
+        return JSONResponse(
+            status_code=HTTPStatus.OK,
+            content={"message": "CAS login successful", "data": result},
+        )
+    except CasAuthenticationError as exc:
+        logger.warning("CAS callback rejected: %s", exc)
+        raise HTTPException(status_code=HTTPStatus.UNAUTHORIZED, detail="CAS authentication failed")
+    except Exception as exc:
+        logger.error(f"CAS callback failed: {exc}")
+        raise HTTPException(status_code=HTTPStatus.INTERNAL_SERVER_ERROR, detail="CAS login failed")
+
+
+@router.post("/callback")
+async def callback_logout(request: Request, logout_request: Optional[str] = None):
+    return await _handle_logout_request(request, logout_request, endpoint="callback")
+
+
+@router.get("/renew")
+async def renew():
+    try:
+        return RedirectResponse(url=build_renew_url(), status_code=HTTPStatus.FOUND)
+    except CasAuthenticationError as exc:
+        logger.warning("CAS renew rejected: %s", exc)
+        return _renew_html(False, "CAS renew failed")
+
+
+@router.get("/renew_callback")
+async def renew_callback(ticket: str = ""):
+    if not ticket:
+        return _renew_html(False, "CAS session is not active")
+    try:
+        result = await renew_with_ticket(ticket)
+        return JSONResponse(
+            status_code=HTTPStatus.OK,
+            content={"message": "CAS renew successful", "data": result},
+        )
+    except Exception as exc:
+        logger.warning(f"CAS renew failed: {exc}")
+        return _renew_html(False, "CAS renew failed")
+
+
+@router.post("/logout_callback")
+async def logout_callback(
+    request: Request,
+    logout_request: Optional[str] = None,
+):
+    return await _handle_logout_request(request, logout_request, endpoint="logout_callback")
+
+
+async def _handle_logout_request(
+    request: Request,
+    logout_request: Optional[str] = None,
+    endpoint: str = "unknown",
+):
+    logout_request = await _extract_logout_request(request, logout_request)
+    logger.info(
+        "CAS SLO %s received logoutRequest: present=%s length=%s",
+        endpoint,
+        bool(logout_request),
+        len(logout_request or ""),
+    )
+    result = revoke_from_logout_request(logout_request)
+    logger.info("CAS SLO %s revoke result: %s", endpoint, result)
+    return JSONResponse(
+        status_code=HTTPStatus.OK,
+        content={"message": "success", "data": result},
+    )
+
+
+async def _extract_logout_request(request: Request, logout_request: Optional[str] = None) -> str:
+    if logout_request:
+        return logout_request
+
+    query_logout_request = request.query_params.get("logoutRequest") or request.query_params.get("logout_request")
+    if query_logout_request:
+        return query_logout_request
+
+    body = await request.body()
+    raw_body = body.decode("utf-8") if body else ""
+    if not raw_body:
+        return ""
+
+    parsed = parse_qs(raw_body)
+    return (parsed.get("logoutRequest") or parsed.get("logout_request") or [raw_body])[0]
+
+
+def _renew_html(success: bool, reason: str = "") -> HTMLResponse:
+    status = "success" if success else "failed"
+    safe_reason = html.escape(reason)
+    return HTMLResponse(
+        status_code=HTTPStatus.OK,
+        content=f"""<!doctype html>
+<html><body><script>
+window.parent && window.parent.postMessage({{ type: "cas-renew-{status}", reason: "{safe_reason}" }}, window.location.origin);
+</script></body></html>""",
+    )
+
+
+def _require_cas_server_redirect(url: str) -> str:
+    parsed_url = urlsplit(url)
+    parsed_cas = urlsplit(CAS_SERVER_URL)
+    if (
+        parsed_url.scheme not in {"http", "https"}
+        or not parsed_url.netloc
+        or parsed_url.scheme != parsed_cas.scheme
+        or parsed_url.netloc != parsed_cas.netloc
+    ):
+        logger.warning("Blocked CAS redirect outside configured server: %s", url)
+        raise CasAuthenticationError("Invalid CAS redirect URL")
+    return url
diff --git a/backend/apps/config_app.py b/backend/apps/config_app.py
index 8cb383df7..a818ec7cb 100644
--- a/backend/apps/config_app.py
+++ b/backend/apps/config_app.py
@@ -2,6 +2,7 @@
 
 from apps.app_factory import create_app
 from apps.agent_app import agent_config_router as agent_router
+from apps.agent_repository_app import agent_repository_router
 from apps.config_sync_app import router as config_sync_router
 from apps.datamate_app import router as datamate_router
 from apps.vectordatabase_app import router as vectordatabase_router
@@ -32,6 +33,7 @@
 from apps.monitoring_app import router as monitoring_router
 from apps.a2a_server_app import router as a2a_server_router
 from apps.haotian_app import router as haotian_router
+from apps.cas_app import router as cas_router
 from consts.const import IS_SPEED_MODE
 from services.prompt_template_service import sync_system_default_prompt_template
 
@@ -54,6 +56,7 @@ async def sync_default_prompt_template_on_startup():
 app.include_router(model_manager_router)
 app.include_router(config_sync_router)
 app.include_router(agent_router)
+app.include_router(agent_repository_router)
 app.include_router(vectordatabase_router)
 app.include_router(datamate_router)
 app.include_router(voice_router)
@@ -73,6 +76,7 @@ async def sync_default_prompt_template_on_startup():
     app.include_router(user_management_router)
 
 app.include_router(oauth_router)
+app.include_router(cas_router)
 
 app.include_router(summary_router)
 app.include_router(prompt_router)
diff --git a/backend/apps/northbound_app.py b/backend/apps/northbound_app.py
index e6aff8e06..9f3b7e323 100644
--- a/backend/apps/northbound_app.py
+++ b/backend/apps/northbound_app.py
@@ -1,14 +1,16 @@
 import logging
 from http import HTTPStatus
 from typing import Optional, Dict, Any
-from urllib.parse import urlparse
+from urllib.parse import urlparse, unquote
+import re
 import uuid
 
 import httpx
-from fastapi import APIRouter, Body, Header, Request, HTTPException, Query
+from fastapi import APIRouter, Body, File, Header, HTTPException, Query, Request, UploadFile
 from fastapi.responses import JSONResponse, StreamingResponse
 
-from consts.exceptions import LimitExceededError, UnauthorizedError
+from consts.exceptions import LimitExceededError, UnauthorizedError, ConversationNotFoundError
+from consts.model import ToolParamsRequest
 from services.northbound_service import (
     NorthboundContext,
     get_conversation_history,
@@ -17,16 +19,35 @@
     stop_chat,
     get_agent_info_list,
     update_conversation_title,
+    upload_files_for_northbound,
 )
 
 from utils.auth_utils import validate_bearer_token, get_user_and_tenant_by_access_key
 
+from .file_management_app import build_content_disposition_header
+
 
 router = APIRouter(prefix="/nb/v1", tags=["northbound"])
 
 __all__ = ["router", "_get_northbound_context"]
 
 
+def _resolve_proxy_download_filename(presigned_url: str, content_disposition: str) -> str:
+    """Resolve a stable download filename for the northbound file proxy."""
+    if content_disposition:
+        filename_star_match = re.search(r"filename\*=UTF-8''([^;]+)", content_disposition)
+        if filename_star_match:
+            return unquote(filename_star_match.group(1)) or "download"
+
+        filename_match = re.search(r'filename="?([^";]+)"?', content_disposition)
+        if filename_match:
+            return filename_match.group(1) or "download"
+
+    path = unquote(urlparse(presigned_url).path)
+    filename = path.split("/")[-1].strip()
+    return filename or "download"
+
+
 async def _get_northbound_context(request: Request) -> NorthboundContext:
     """
     Build northbound context from request.
@@ -109,13 +130,119 @@ async def health_check():
     return {"status": "healthy", "service": "northbound-api"}
 
 
-@router.post("/chat/run")
+@router.post(
+    "/chat/attachments/upload",
+    summary="Upload chat attachments for northbound runs",
+    description=(
+        "Upload one or more files for later use in `/nb/v1/chat/run`. "
+        "Successful uploads return reusable `s3_url` references."
+    ),
+)
+async def upload_chat_attachments(
+    request: Request,
+    files: list[UploadFile] = File(
+        ...,
+        description="List of files to upload",
+        examples=["report.pdf", "diagram.png"],
+    ),
+):
+    try:
+        ctx: NorthboundContext = await _get_northbound_context(request)
+        return JSONResponse(
+            status_code=HTTPStatus.OK,
+            content=await upload_files_for_northbound(ctx=ctx, files=files),
+        )
+    except LimitExceededError as e:
+        logging.error(f"Too Many Requests: rate limit exceeded: {str(e)}", exc_info=e)
+        raise HTTPException(status_code=HTTPStatus.TOO_MANY_REQUESTS,
+                            detail="Too Many Requests: rate limit exceeded")
+    except ValueError as e:
+        logging.error(f"Invalid northbound upload request: {str(e)}", exc_info=e)
+        raise HTTPException(status_code=HTTPStatus.BAD_REQUEST, detail=str(e))
+    except PermissionError as e:
+        logging.error(f"Permission denied while uploading northbound files: {str(e)}", exc_info=e)
+        raise HTTPException(status_code=HTTPStatus.FORBIDDEN, detail=str(e))
+    except HTTPException as e:
+        raise e
+    except Exception as e:
+        logging.error(f"Failed to upload northbound files: {str(e)}", exc_info=e)
+        raise HTTPException(
+            status_code=HTTPStatus.INTERNAL_SERVER_ERROR, detail="Internal Server Error")
+
+
+@router.post(
+    "/chat/run",
+    summary="Start a northbound chat run with optional attachments",
+    description=(
+        "Run a northbound chat request. Upload attachments first through "
+        "`/nb/v1/chat/attachments/upload`, then pass the returned `s3_url` values "
+        "through the `attachments` field."
+    ),
+)
 async def run_chat(
     request: Request,
-    conversation_id: Optional[int] = Body(None, embed=True),
-    agent_name: str = Body(..., embed=True),
-    query: str = Body(..., embed=True),
-    meta_data: Optional[Dict[str, Any]] = Body(None, embed=True),
+    conversation_id: Optional[int] = Body(
+        None,
+        embed=True,
+        description="Existing conversation ID. Omit to create a new conversation.",
+        examples=[123],
+    ),
+    agent_name: str = Body(
+        ...,
+        embed=True,
+        description="Target agent name.",
+        examples=["general-assistant"],
+    ),
+    query: str = Body(
+        ...,
+        embed=True,
+        description="User input to send to the agent.",
+        examples=["Summarize the uploaded report and list the key risks."],
+    ),
+    attachments: Optional[list] = Body(
+        None,
+        embed=True,
+        description="Attachments for the chat. Can be either a list of S3 URL strings"
+                    "or a list of attachment objects with full metadata.",
+        examples=[["s3://nexent/attachments/user123/20260609_report.pdf"]],
+    ),
+    meta_data: Optional[Dict[str, Any]] = Body(
+        None,
+        embed=True,
+        description="Optional metadata passed through for audit and usage logging.",
+        examples=[{"source": "crm", "ticket_id": "INC-1001"}],
+    ),
+    tool_params: Optional[ToolParamsRequest] = Body(
+        None,
+        embed=True,
+        description="Optional request-scoped overrides for tool initialization parameters. "
+            "Overrides DB-persisted params (ag_tool_instance_t.params) on a per-run basis. "
+            "Conflict resolution: request value wins over DB value. "
+            "Structure: agents -> {agent_name} -> tools -> {tool_name} -> {param_name: param_value}. "
+            "tool_name matching: first by tool.name, then by tool.class_name. "
+            "Unknown param names cause a ValidationError (400). "
+            "Metadata-derived fields (e.g., vdb_core, embedding_model) are recalculated "
+            "from merged params for tools like KnowledgeBaseSearchTool, DifySearchTool, DataMateSearchTool.",
+        examples=[{
+            "agents": {
+                "common_sense_qa_assistant": {
+                    "tools": {
+                        "analyze_text_file": {
+                            "chunk_size": 4000,
+                            "summary_only": True,
+                            "prompt": "Please provide a concise summary of this document focusing on key facts."
+                        },
+                        "knowledge_base_search": {
+                            "top_k": 10,
+                            "rerank": True,
+                            "rerank_model_name": "gte-rerank-v2",
+                            "index_names": ["nexent-docs", "faq-index"]
+                        }
+                    }
+                }
+            }
+        }],
+    ),
     idempotency_key: Optional[str] = Header(None, alias="Idempotency-Key"),
 ):
     try:
@@ -125,13 +252,21 @@ async def run_chat(
             conversation_id=conversation_id,
             agent_name=agent_name,
             query=query,
+            attachments=attachments,
             meta_data=meta_data,
+            tool_params=tool_params,
             idempotency_key=idempotency_key,
         )
     except LimitExceededError as e:
         logging.error(f"Too Many Requests: rate limit exceeded: {str(e)}", exc_info=e)
         raise HTTPException(status_code=HTTPStatus.TOO_MANY_REQUESTS,
                             detail="Too Many Requests: rate limit exceeded")
+    except ValueError as e:
+        logging.error(f"Invalid northbound chat request: {str(e)}", exc_info=e)
+        raise HTTPException(status_code=HTTPStatus.BAD_REQUEST, detail=str(e))
+    except PermissionError as e:
+        logging.error(f"Permission denied while running northbound chat: {str(e)}", exc_info=e)
+        raise HTTPException(status_code=HTTPStatus.FORBIDDEN, detail=str(e))
     except HTTPException as e:
         raise e
     except Exception as e:
@@ -254,6 +389,9 @@ async def update_convs_title(
         logging.error(f"Too Many Requests: rate limit exceeded: {str(e)}", exc_info=e)
         raise HTTPException(status_code=HTTPStatus.TOO_MANY_REQUESTS,
                             detail="Too Many Requests: rate limit exceeded")
+    except ConversationNotFoundError as e:
+        logging.error(f"Conversation not found while updating title: {str(e)}", exc_info=e)
+        raise HTTPException(status_code=HTTPStatus.NOT_FOUND, detail=str(e))
     except HTTPException as e:
         raise e
     except Exception as e:
@@ -312,12 +450,12 @@ async def fetch_file_from_presigned_url(
 
         content_type = response.headers.get("Content-Type", "application/octet-stream")
         content_disposition = response.headers.get("Content-Disposition", "")
+        download_filename = _resolve_proxy_download_filename(presigned_url, content_disposition)
 
         headers = {
             "Content-Type": content_type,
+            "Content-Disposition": build_content_disposition_header(download_filename),
         }
-        if content_disposition:
-            headers["Content-Disposition"] = content_disposition
 
         return StreamingResponse(
             content=response.aiter_bytes(),
diff --git a/backend/apps/northbound_knowledge_app.py b/backend/apps/northbound_knowledge_app.py
index 775d6c567..02739d138 100644
--- a/backend/apps/northbound_knowledge_app.py
+++ b/backend/apps/northbound_knowledge_app.py
@@ -51,7 +51,8 @@ async def _require_asset_owner_context(request: Request) -> NorthboundContext:
 @router.get("/indices")
 async def get_list_indices(
     request: Request,
-    pattern: Annotated[str, Query(description="Pattern to match index names")] = "*",
+    pattern: Annotated[str, Query(
+        description="Pattern to match index names")] = "*",
 ):
     """List knowledge bases visible to the asset-owner tenant.
 
@@ -92,7 +93,7 @@ async def create_new_index(
         Optional[Dict[str, Any]],
         Body(
             description=(
-                "Request body with optional fields (ingroup_permission, group_ids, embedding_model_name)"
+                "Request body with optional fields (ingroup_permission, group_ids, embedding_model_name, preserve_source_file)"
             ),
         ),
     ] = None,
@@ -110,10 +111,12 @@ async def create_new_index(
         ingroup_permission = None
         group_ids = None
         embedding_model_name = None
+        preserve_source_file = None
         if body:
             ingroup_permission = body.get("ingroup_permission")
             group_ids = body.get("group_ids")
             embedding_model_name = body.get("embedding_model_name")
+            preserve_source_file = body.get("preserve_source_file")
 
         return ElasticSearchService.create_knowledge_base(
             knowledge_name=index_name,
@@ -124,6 +127,7 @@ async def create_new_index(
             ingroup_permission=ingroup_permission,
             group_ids=group_ids,
             embedding_model_name=embedding_model_name,
+            preserve_source_file=preserve_source_file,
         )
     except LimitExceededError as e:
         logger.exception("Rate limit exceeded while creating index")
@@ -222,52 +226,65 @@ async def delete_documents(
     request: Request,
     index_name: Annotated[str, Path(..., description="Name of the index")],
     path_or_url: Annotated[str, Query(..., description="Path or URL of documents to delete")],
+    scope: Annotated[
+        str,
+        Query(
+            description=(
+                "source_only: delete MinIO source only; "
+                "full: delete ES, MinIO, and Redis records"
+            ),
+        ),
+    ] = "full",
 ):
-    """Delete documents by path or URL and clean up related Redis records.
-
-    Restricted to asset administrators (same auth as get_list_indices).
-    """
+    """Delete a document by scope. Restricted to asset administrators."""
     try:
-        ctx = await _require_asset_owner_context(request)
+        await _require_asset_owner_context(request)
         vdb_core = get_vector_db_core(db_type=VectorDatabaseType.ELASTICSEARCH)
-        logger.debug("Deleting documents for index %s", index_name)
-        result = ElasticSearchService.delete_documents(
-            index_name, path_or_url, vdb_core)
-
-        try:
-            redis_service = get_redis_service()
-            redis_cleanup_result = redis_service.delete_document_records(
-                index_name, path_or_url)
-
-            result["redis_cleanup"] = redis_cleanup_result
-
-            original_message = result.get(
-                "message", "Documents deleted successfully")
-            result["message"] = (
-                f"{original_message}. "
-                f"Cleaned up {redis_cleanup_result['total_deleted']} Redis records "
-                f"({redis_cleanup_result['celery_tasks_deleted']} tasks, "
-                f"{redis_cleanup_result['cache_keys_deleted']} cache keys)."
-            )
-
-            if redis_cleanup_result.get("errors"):
-                result["redis_warnings"] = redis_cleanup_result["errors"]
+        logger.debug(
+            "Deleting documents for index %s scope=%s", index_name, scope
+        )
+        result = await ElasticSearchService.delete_document_by_scope(
+            index_name, path_or_url, scope, vdb_core
+        )
 
-        except Exception as redis_error:
-            logger.warning(
-                "Redis cleanup failed for index %s: %s",
-                index_name,
-                redis_error,
-            )
-            result["redis_cleanup_error"] = str(redis_error)
-            original_message = result.get(
-                "message", "Documents deleted successfully")
-            result["message"] = (
-                f"{original_message}, but Redis cleanup encountered an error: "
-                f"{str(redis_error)}"
-            )
+        if scope == "full":
+            try:
+                redis_service = get_redis_service()
+                redis_cleanup_result = redis_service.delete_document_records(
+                    index_name, path_or_url
+                )
+                result["redis_cleanup"] = redis_cleanup_result
+                original_message = result.get(
+                    "message", "Documents deleted successfully"
+                )
+                result["message"] = (
+                    f"{original_message}. "
+                    f"Cleaned up {redis_cleanup_result['total_deleted']} Redis records "
+                    f"({redis_cleanup_result['celery_tasks_deleted']} tasks, "
+                    f"{redis_cleanup_result['cache_keys_deleted']} cache keys)."
+                )
+                if redis_cleanup_result.get("errors"):
+                    result["redis_warnings"] = redis_cleanup_result["errors"]
+            except Exception as redis_error:
+                logger.warning(
+                    "Redis cleanup failed for index %s: %s",
+                    index_name,
+                    redis_error,
+                )
+                result["redis_cleanup_error"] = str(redis_error)
+                original_message = result.get(
+                    "message", "Documents deleted successfully"
+                )
+                result["message"] = (
+                    f"{original_message}, but Redis cleanup encountered an error: "
+                    f"{str(redis_error)}"
+                )
 
         return result
+    except ValueError as exc:
+        raise HTTPException(
+            status_code=HTTPStatus.BAD_REQUEST, detail=str(exc)
+        )
     except LimitExceededError as e:
         logger.exception("Rate limit exceeded while deleting documents")
         raise HTTPException(
diff --git a/backend/apps/prompt_app.py b/backend/apps/prompt_app.py
index 987729e69..6b82a5c82 100644
--- a/backend/apps/prompt_app.py
+++ b/backend/apps/prompt_app.py
@@ -4,11 +4,19 @@
 from fastapi import APIRouter, Header, Request
 from fastapi.responses import JSONResponse, StreamingResponse
 
-from consts.model import GeneratePromptRequest, OptimizePromptSectionRequest
+from consts.model import (
+    GeneratePromptRequest,
+    OptimizePromptSectionRequest,
+    OptimizePromptBadCaseRequest,
+    OptimizePromptFromDebugRequest,
+)
 from services.prompt_service import (
     gen_system_prompt_streamable,
-    optimize_prompt_section_impl,
+    OptimizeRequest,
+    OptimizeResult,
+    PromptOptimizationService,
 )
+from adapters.exception import NexentCapabilityError
 from utils.auth_utils import get_current_user_info
 
 router = APIRouter(prefix="/prompt")
@@ -48,30 +56,140 @@ async def optimize_prompt_section_api(
         http_request: Request,
         authorization: Optional[str] = Header(None)
 ):
+    _, tenant_id, language = get_current_user_info(
+        authorization, http_request)
+
+    service = PromptOptimizationService(
+        model_id=optimize_request.model_id,
+        tenant_id=tenant_id,
+        language=language,
+    )
+
     try:
-        _, tenant_id, language = get_current_user_info(
-            authorization, http_request)
-        optimized_section = optimize_prompt_section_impl(
+        result = service.optimize(
+            OptimizeRequest(
+                agent_id=optimize_request.agent_id,
+                model_id=optimize_request.model_id,
+                task_description=optimize_request.task_description,
+                section_type=optimize_request.section_type,
+                section_title=optimize_request.section_title,
+                current_content=optimize_request.current_content,
+                feedback=optimize_request.feedback,
+                mode=optimize_request.mode,
+                start_pos=optimize_request.start_pos,
+                end_pos=optimize_request.end_pos,
+                tool_ids=optimize_request.tool_ids,
+                sub_agent_ids=optimize_request.sub_agent_ids,
+                knowledge_base_display_names=optimize_request.knowledge_base_display_names,
+            )
+        )
+        return JSONResponse(
+            status_code=HTTPStatus.OK,
+            content={
+                "message": "Success",
+                "data": {
+                    "optimized_content": result.optimized_content,
+                    "section_type": result.section_type,
+                    "section_title": result.section_title,
+                    "original_content": result.original_content,
+                }
+            },
+            headers={"X-Prompt-Source": result.source},
+        )
+    except NexentCapabilityError as e:
+        return JSONResponse(
+            status_code=HTTPStatus.BAD_REQUEST,
+            content={"message": str(e)},
+        )
+    except Exception as exc:
+        logger.exception(f"Error occurred while optimizing prompt section: {exc}")
+        raise
+
+
+@router.post("/optimize/badcase")
+async def optimize_prompt_badcase_api(
+        badcase_request: OptimizePromptBadCaseRequest,
+        http_request: Request,
+        authorization: Optional[str] = Header(None)
+):
+    _, tenant_id, language = get_current_user_info(
+        authorization, http_request)
+
+    service = PromptOptimizationService(
+        model_id=badcase_request.model_id,
+        tenant_id=tenant_id,
+        language=language,
+    )
+
+    try:
+        result = service.optimize_badcase(
+            current_content=badcase_request.current_content,
+            bad_cases=badcase_request.bad_cases,
+            agent_id=badcase_request.agent_id,
+            section_type=badcase_request.section_type,
+            section_title=badcase_request.section_title,
+            tool_ids=badcase_request.tool_ids,
+            sub_agent_ids=badcase_request.sub_agent_ids,
+            knowledge_base_display_names=badcase_request.knowledge_base_display_names,
+        )
+        return JSONResponse(
+            status_code=HTTPStatus.OK,
+            content={
+                "message": "Success",
+                "data": {
+                    "optimized_content": result.optimized_content,
+                    "section_type": result.section_type,
+                    "section_title": result.section_title,
+                    "original_content": result.original_content,
+                }
+            },
+            headers={"X-Prompt-Source": result.source},
+        )
+    except NexentCapabilityError as e:
+        return JSONResponse(
+            status_code=HTTPStatus.BAD_REQUEST,
+            content={"message": str(e)},
+        )
+
+
+@router.post("/optimize/from_debug")
+async def optimize_prompt_from_debug_api(
+        optimize_request: OptimizePromptFromDebugRequest,
+        http_request: Request,
+        authorization: Optional[str] = Header(None)
+):
+    _, tenant_id, language = get_current_user_info(
+        authorization, http_request)
+
+    service = PromptOptimizationService(
+        model_id=optimize_request.model_id,
+        tenant_id=tenant_id,
+        language=language,
+    )
+
+    try:
+        result = service.optimize_from_debug(
             agent_id=optimize_request.agent_id,
-            model_id=optimize_request.model_id,
-            task_description=optimize_request.task_description,
-            tenant_id=tenant_id,
-            language=language,
-            section_type=optimize_request.section_type,
-            section_title=optimize_request.section_title,
-            current_content=optimize_request.current_content,
             feedback=optimize_request.feedback,
-            tool_ids=optimize_request.tool_ids,
-            sub_agent_ids=optimize_request.sub_agent_ids,
-            knowledge_base_display_names=optimize_request.knowledge_base_display_names,
+            selected=optimize_request.selected,
+            history=optimize_request.history,
         )
         return JSONResponse(
             status_code=HTTPStatus.OK,
             content={
-                "message": "Prompt section optimized successfully",
-                "data": optimized_section,
-            }
+                "message": "Success",
+                "data": {
+                    "original_full_prompt": result.original_content,
+                    "optimized_full_prompt": result.optimized_content,
+                }
+            },
+            headers={"X-Prompt-Source": result.source},
+        )
+    except NexentCapabilityError as e:
+        return JSONResponse(
+            status_code=HTTPStatus.BAD_REQUEST,
+            content={"message": str(e)},
         )
     except Exception as exc:
-        logger.exception(f"Error occurred while optimizing prompt section: {exc}")
+        logger.exception(f"Error occurred while optimizing prompt from debug: {exc}")
         raise
diff --git a/backend/apps/tool_config_app.py b/backend/apps/tool_config_app.py
index f0b7f9304..bfc8d5ca0 100644
--- a/backend/apps/tool_config_app.py
+++ b/backend/apps/tool_config_app.py
@@ -160,12 +160,14 @@ async def import_openapi_service_api(
         server_url: Base URL of the REST API server
         openapi_json: Complete OpenAPI JSON specification
         service_description: Optional service description
+        headers_template: Optional default headers template
         force_update: If True, replace all existing tools for this service
     """
     service_name = openapi_service_request.get("service_name")
     server_url = openapi_service_request.get("server_url")
     openapi_json = openapi_service_request.get("openapi_json")
     service_description = openapi_service_request.get("service_description")
+    headers_template = openapi_service_request.get("headers_template")
     force_update = openapi_service_request.get("force_update", False)
 
     if not service_name:
@@ -192,6 +194,7 @@ async def import_openapi_service_api(
             tenant_id=tenant_id,
             user_id=user_id,
             service_description=service_description,
+            headers_template=headers_template,
             force_update=force_update
         )
 
diff --git a/backend/apps/user_management_app.py b/backend/apps/user_management_app.py
index edbcdf27d..e79fde887 100644
--- a/backend/apps/user_management_app.py
+++ b/backend/apps/user_management_app.py
@@ -19,12 +19,13 @@
     ValidationError,
 )
 from consts.error_code import ErrorCode
+from services.cas_service import build_logout_url, CasAuthenticationError
 from services.user_management_service import get_authorized_client, validate_token, \
     check_auth_service_health, signup_user_with_invitation, signin_user, refresh_user_token, \
     get_session_by_authorization, get_user_info, create_token, list_tokens_by_user, delete_token, \
     update_password
 from services.user_service import delete_user_and_cleanup
-from utils.auth_utils import get_current_user_id
+from utils.auth_utils import get_current_user_id, extract_session_id_from_authorization
 
 
 load_dotenv()
@@ -150,7 +151,18 @@ async def logout(request: Request):
     authorization = request.headers.get("Authorization")
     try:
         # Make logout idempotent: if no token or token expired, still return success
+        session_id = None
+        cas_logout_url = ""
         if authorization:
+            session_id = extract_session_id_from_authorization(authorization)
+            if session_id:
+                from database.cas_session_db import revoke_cas_session_by_session_id
+
+                revoke_cas_session_by_session_id(session_id, actor="user")
+                try:
+                    cas_logout_url = build_logout_url()
+                except CasAuthenticationError as cas_err:
+                    logging.warning(f"CAS logout URL is unavailable: {str(cas_err)}")
             client = get_authorized_client(authorization)
             try:
                 client.auth.sign_out()
@@ -159,7 +171,12 @@ async def logout(request: Request):
                 logging.warning(
                     f"Sign out encountered an error but will be ignored: {str(signout_err)}")
         return JSONResponse(status_code=HTTPStatus.OK,
-                            content={"message": "Logout successful"})
+                            content={
+                                "message": "Logout successful",
+                                "data": {
+                                    "cas_logout_url": cas_logout_url
+                                }
+                            })
 
     except Exception as e:
         logging.error(f"User logout failed: {str(e)}")
@@ -214,6 +231,10 @@ async def get_user_information(request: Request):
         if not user_info:
             raise UnauthorizedError("User information not found")
 
+        user_info["user"]["auth_provider"] = (
+            "cas" if extract_session_id_from_authorization(authorization) else "local"
+        )
+
         return JSONResponse(status_code=HTTPStatus.OK,
                             content={"message": "Success",
                                      "data": user_info})
diff --git a/backend/apps/vectordatabase_app.py b/backend/apps/vectordatabase_app.py
index 118537766..505c39559 100644
--- a/backend/apps/vectordatabase_app.py
+++ b/backend/apps/vectordatabase_app.py
@@ -76,7 +76,7 @@ def create_new_index(
         embedding_dim: Optional[int] = Query(
             None, description="Dimension of the embedding vectors"),
         request: Dict[str, Any] = Body(
-            None, description="Request body with optional fields (ingroup_permission, group_ids, embedding_model_name)"),
+            None, description="Request body with optional fields (ingroup_permission, group_ids, embedding_model_name, preserve_source_file)"),
         vdb_core: VectorDatabaseCore = Depends(get_vector_db_core),
         authorization: Optional[str] = Header(None)
 ):
@@ -89,11 +89,13 @@ def create_new_index(
         group_ids = None
         embedding_model_name: Optional[str] = None
         is_multimodal: Optional[bool] = None
+        preserve_source_file: Optional[bool] = None
         if request:
             ingroup_permission = request.get("ingroup_permission")
             group_ids = request.get("group_ids")
             embedding_model_name = request.get("embeddingModel")
             is_multimodal = request.get("is_multimodal")
+            preserve_source_file = request.get("preserve_source_file")
 
         # Treat path parameter as user-facing knowledge base name for new creations
         return ElasticSearchService.create_knowledge_base(
@@ -106,6 +108,7 @@ def create_new_index(
             group_ids=group_ids,
             embedding_model_name=embedding_model_name,
             is_multimodal=is_multimodal,
+            preserve_source_file=preserve_source_file,
         )
     except Exception as e:
         raise HTTPException(
@@ -505,54 +508,70 @@ async def get_index_files(
 
 
 @router.delete("/{index_name}/documents")
-def delete_documents(
+async def delete_documents(
         index_name: str = Path(..., description="Name of the index"),
         path_or_url: str = Query(...,
                                  description="Path or URL of documents to delete"),
+        scope: str = Query(
+            "full",
+            description=(
+                "source_only: delete MinIO source only, keep ES chunks/vectors; "
+                "full: delete ES documents, MinIO source, and Redis task records"
+            ),
+        ),
         vdb_core: VectorDatabaseCore = Depends(get_vector_db_core)
 ):
-    """Delete documents by path or URL and clean up related Redis records"""
+    """Delete a document by scope: source file only or full removal from the index."""
     try:
-        # First delete the documents using existing service
-        result = ElasticSearchService.delete_documents(
-            index_name, path_or_url, vdb_core)
-
-        # Then clean up Redis records related to this specific document
-        try:
-            redis_service = get_redis_service()
-            redis_cleanup_result = redis_service.delete_document_records(
-                index_name, path_or_url)
-
-            # Add Redis cleanup info to the result
-            result["redis_cleanup"] = redis_cleanup_result
-
-            # Update the message to include Redis cleanup info
-            original_message = result.get(
-                "message", "Documents deleted successfully")
-            result["message"] = (
-                f"{original_message}. "
-                f"Cleaned up {redis_cleanup_result['total_deleted']} Redis records "
-                f"({redis_cleanup_result['celery_tasks_deleted']} tasks, "
-                f"{redis_cleanup_result['cache_keys_deleted']} cache keys)."
-            )
-
-            if redis_cleanup_result.get("errors"):
-                result["redis_warnings"] = redis_cleanup_result["errors"]
+        result = await ElasticSearchService.delete_document_by_scope(
+            index_name, path_or_url, scope, vdb_core
+        )
 
-        except Exception as redis_error:
-            logger.warning(
-                f"Redis cleanup failed for document {path_or_url} in index {index_name}: {str(redis_error)}")
-            result["redis_cleanup_error"] = str(redis_error)
-            original_message = result.get(
-                "message", "Documents deleted successfully")
-            result[
-                "message"] = f"{original_message}, but Redis cleanup encountered an error: {str(redis_error)}"
+        if scope == "full":
+            try:
+                redis_service = get_redis_service()
+                redis_cleanup_result = redis_service.delete_document_records(
+                    index_name, path_or_url
+                )
+                result["redis_cleanup"] = redis_cleanup_result
+                original_message = result.get(
+                    "message", "Documents deleted successfully"
+                )
+                result["message"] = (
+                    f"{original_message}. "
+                    f"Cleaned up {redis_cleanup_result['total_deleted']} Redis records "
+                    f"({redis_cleanup_result['celery_tasks_deleted']} tasks, "
+                    f"{redis_cleanup_result['cache_keys_deleted']} cache keys)."
+                )
+                if redis_cleanup_result.get("errors"):
+                    result["redis_warnings"] = redis_cleanup_result["errors"]
+            except Exception as redis_error:
+                logger.warning(
+                    "Redis cleanup failed for document %s in index %s: %s",
+                    path_or_url,
+                    index_name,
+                    redis_error,
+                )
+                result["redis_cleanup_error"] = str(redis_error)
+                original_message = result.get(
+                    "message", "Documents deleted successfully"
+                )
+                result["message"] = (
+                    f"{original_message}, but Redis cleanup encountered an error: "
+                    f"{str(redis_error)}"
+                )
 
         return result
 
+    except ValueError as exc:
+        raise HTTPException(
+            status_code=HTTPStatus.BAD_REQUEST, detail=str(exc)
+        )
     except Exception as e:
         raise HTTPException(
-            status_code=HTTPStatus.INTERNAL_SERVER_ERROR, detail=f"Error delete indexing documents: {e}")
+            status_code=HTTPStatus.INTERNAL_SERVER_ERROR,
+            detail=f"Error delete indexing documents: {e}",
+        )
 
 
 @router.get("/{index_name}/documents/{path_or_url:path}/error-info")
diff --git a/backend/consts/const.py b/backend/consts/const.py
index ac2196c2a..574d550c0 100644
--- a/backend/consts/const.py
+++ b/backend/consts/const.py
@@ -90,6 +90,31 @@ class VectorDatabaseType(str, Enum):
 OAUTH_CA_BUNDLE = os.getenv("OAUTH_CA_BUNDLE", "")
 
 
+# CAS SSO Configuration
+CAS_ENABLED = os.getenv("CAS_ENABLED", "false").lower() in ("true", "1", "yes", "on")
+CAS_SERVER_URL = os.getenv("CAS_SERVER_URL", "").rstrip("/")
+CAS_VALIDATE_PATH = os.getenv("CAS_VALIDATE_PATH", "/p3/serviceValidate")
+CAS_CALLBACK_BASE_URL = os.getenv("CAS_CALLBACK_BASE_URL", OAUTH_CALLBACK_BASE_URL).rstrip("/")
+# CAS login mode:
+# - disabled: disable CAS login entry and automatic CAS redirects.
+# - button: show CAS as an optional login entry.
+# - force: automatically redirect unauthenticated users to CAS login.
+CAS_LOGIN_MODE = os.getenv("CAS_LOGIN_MODE", "disabled").lower()
+CAS_USER_ATTRIBUTE = os.getenv("CAS_USER_ATTRIBUTE", "")
+CAS_EMAIL_ATTRIBUTE = os.getenv("CAS_EMAIL_ATTRIBUTE", "email")
+CAS_ROLE_ATTRIBUTE = os.getenv("CAS_ROLE_ATTRIBUTE", "role")
+CAS_TENANT_ATTRIBUTE = os.getenv("CAS_TENANT_ATTRIBUTE", "tenant_id")
+CAS_ROLE_MAP_JSON = os.getenv("CAS_ROLE_MAP_JSON", "")
+CAS_SESSION_MAX_AGE_SECONDS = int(os.getenv("CAS_SESSION_MAX_AGE_SECONDS", "3600") or 3600)
+LOCAL_SESSION_MAX_AGE_SECONDS = int(os.getenv("LOCAL_SESSION_MAX_AGE_SECONDS", "3600") or 3600)
+CAS_RENEW_BEFORE_SECONDS = int(os.getenv("CAS_RENEW_BEFORE_SECONDS", "300") or 300)
+CAS_RENEW_TIMEOUT_SECONDS = int(os.getenv("CAS_RENEW_TIMEOUT_SECONDS", "10") or 10)
+CAS_SYNTHETIC_EMAIL_DOMAIN = os.getenv("CAS_SYNTHETIC_EMAIL_DOMAIN", "cas.local")
+CAS_LOGOUT_URL = os.getenv("CAS_LOGOUT_URL", "")
+CAS_SSL_VERIFY = os.getenv("CAS_SSL_VERIFY", "true").lower() == "true"
+CAS_CA_BUNDLE = os.getenv("CAS_CA_BUNDLE", "")
+
+
 # ===== To be migrated to frontend configuration =====
 # Email Configuration
 IMAP_SERVER = os.getenv('IMAP_SERVER')
@@ -208,6 +233,7 @@ class VectorDatabaseType(str, Enum):
     "NEXENT_MCP_DOCKER_IMAGE", "nexent/nexent-mcp:latest")
 ENABLE_UPLOAD_IMAGE = os.getenv(
     "ENABLE_UPLOAD_IMAGE", "false").lower() == "true"
+ENABLE_JIUWEN_SDK = os.getenv("NEXENT_ENABLE_JIUWEN_SDK", "true").lower() == "true"
 
 
 # Celery Configuration
@@ -375,36 +401,47 @@ class VectorDatabaseType(str, Enum):
 OTEL_SERVICE_NAME = OTEL_SERVICE_NAME_RAW or "nexent-backend"
 OTEL_EXPORTER_OTLP_ENDPOINT_RAW = os.getenv("OTEL_EXPORTER_OTLP_ENDPOINT")
 OTEL_EXPORTER_OTLP_ENDPOINT = OTEL_EXPORTER_OTLP_ENDPOINT_RAW or "http://localhost:4318"
-OTEL_EXPORTER_OTLP_TRACES_ENDPOINT = os.getenv("OTEL_EXPORTER_OTLP_TRACES_ENDPOINT", "")
-OTEL_EXPORTER_OTLP_METRICS_ENDPOINT = os.getenv("OTEL_EXPORTER_OTLP_METRICS_ENDPOINT", "")
+OTEL_EXPORTER_OTLP_TRACES_ENDPOINT = os.getenv(
+    "OTEL_EXPORTER_OTLP_TRACES_ENDPOINT", "")
+OTEL_EXPORTER_OTLP_METRICS_ENDPOINT = os.getenv(
+    "OTEL_EXPORTER_OTLP_METRICS_ENDPOINT", "")
 OTEL_EXPORTER_OTLP_PROTOCOL_RAW = os.getenv("OTEL_EXPORTER_OTLP_PROTOCOL")
 OTEL_EXPORTER_OTLP_PROTOCOL = OTEL_EXPORTER_OTLP_PROTOCOL_RAW or "http"
 OTEL_EXPORTER_OTLP_HEADERS_RAW = os.getenv("OTEL_EXPORTER_OTLP_HEADERS")
 OTEL_EXPORTER_OTLP_HEADERS = OTEL_EXPORTER_OTLP_HEADERS_RAW or ""
-OTEL_EXPORTER_OTLP_AUTHORIZATION = os.getenv("OTEL_EXPORTER_OTLP_AUTHORIZATION", "")
+OTEL_EXPORTER_OTLP_AUTHORIZATION = os.getenv(
+    "OTEL_EXPORTER_OTLP_AUTHORIZATION", "")
 OTEL_EXPORTER_OTLP_X_API_KEY = os.getenv("OTEL_EXPORTER_OTLP_X_API_KEY", "")
 OTEL_EXPORTER_OTLP_LANGFUSE_INGESTION_VERSION = os.getenv(
     "OTEL_EXPORTER_OTLP_LANGFUSE_INGESTION_VERSION", "")
 LANGSMITH_API_KEY = os.getenv("LANGSMITH_API_KEY", "")
 LANGSMITH_PROJECT = os.getenv("LANGSMITH_PROJECT", "")
-OTEL_EXPORTER_OTLP_METRICS_ENABLED_RAW = os.getenv("OTEL_EXPORTER_OTLP_METRICS_ENABLED")
+OTEL_EXPORTER_OTLP_METRICS_ENABLED_RAW = os.getenv(
+    "OTEL_EXPORTER_OTLP_METRICS_ENABLED")
 OTEL_EXPORTER_OTLP_METRICS_ENABLED = (
     OTEL_EXPORTER_OTLP_METRICS_ENABLED_RAW or "true").lower() == "true"
-MONITORING_INSTRUMENT_REQUESTS_RAW = os.getenv("MONITORING_INSTRUMENT_REQUESTS")
+MONITORING_INSTRUMENT_REQUESTS_RAW = os.getenv(
+    "MONITORING_INSTRUMENT_REQUESTS")
 MONITORING_INSTRUMENT_REQUESTS = (
     MONITORING_INSTRUMENT_REQUESTS_RAW or "false").lower() == "true"
-MONITORING_FASTAPI_INCLUDED_URLS = os.getenv("MONITORING_FASTAPI_INCLUDED_URLS", "")
-MONITORING_FASTAPI_EXCLUDED_URLS = os.getenv("MONITORING_FASTAPI_EXCLUDED_URLS", "")
-MONITORING_FASTAPI_EXCLUDE_SPANS = os.getenv("MONITORING_FASTAPI_EXCLUDE_SPANS", "receive,send")
+MONITORING_FASTAPI_INCLUDED_URLS = os.getenv(
+    "MONITORING_FASTAPI_INCLUDED_URLS", "")
+MONITORING_FASTAPI_EXCLUDED_URLS = os.getenv(
+    "MONITORING_FASTAPI_EXCLUDED_URLS", "")
+MONITORING_FASTAPI_EXCLUDE_SPANS = os.getenv(
+    "MONITORING_FASTAPI_EXCLUDE_SPANS", "receive,send")
 MONITORING_PROJECT_NAME = os.getenv("MONITORING_PROJECT_NAME", "")
 MONITORING_DASHBOARD_URL = os.getenv("MONITORING_DASHBOARD_URL", "")
-MONITORING_TRACE_CONTENT_MODE = os.getenv("MONITORING_TRACE_CONTENT_MODE", "summary")
+MONITORING_TRACE_CONTENT_MODE = os.getenv(
+    "MONITORING_TRACE_CONTENT_MODE", "summary")
 MONITORING_TRACE_MAX_CHARS = os.getenv("MONITORING_TRACE_MAX_CHARS", "4000")
 MONITORING_TRACE_MAX_ITEMS = os.getenv("MONITORING_TRACE_MAX_ITEMS", "20")
 TELEMETRY_SAMPLE_RATE_RAW = os.getenv("TELEMETRY_SAMPLE_RATE")
 TELEMETRY_SAMPLE_RATE = float(TELEMETRY_SAMPLE_RATE_RAW or "1.0")
 
 # Parse OTLP headers into dict format
+
+
 def _parse_otlp_headers(headers_str: str) -> dict:
     """Parse OTLP headers string into dict. Format: 'key1=value1,key2=value2'"""
     if not headers_str:
@@ -416,6 +453,7 @@ def _parse_otlp_headers(headers_str: str) -> dict:
             headers[key.strip()] = value.strip()
     return headers
 
+
 OTLP_HEADERS = _parse_otlp_headers(OTEL_EXPORTER_OTLP_HEADERS)
 if OTEL_EXPORTER_OTLP_AUTHORIZATION:
     OTLP_HEADERS["Authorization"] = OTEL_EXPORTER_OTLP_AUTHORIZATION
@@ -448,7 +486,7 @@ def _parse_otlp_headers(headers_str: str) -> dict:
 
 
 # APP Version
-APP_VERSION = "v2.2.0"
+APP_VERSION = "v2.2.1"
 
 
 # Skill Creation Streaming Configuration
diff --git a/backend/consts/model.py b/backend/consts/model.py
index 6969999fe..00e5b8a0a 100644
--- a/backend/consts/model.py
+++ b/backend/consts/model.py
@@ -1,8 +1,8 @@
 from enum import Enum
-from typing import Optional, Any, List, Dict
+from typing import Optional, Any, List, Dict, Literal
 
 from pydantic import BaseModel, Field, EmailStr, ConfigDict, field_validator
-from nexent.core.agents.agent_model import ToolConfig
+from nexent.core.agents.agent_model import AgentVerificationConfig, ToolConfig
 
 from consts.prompt_template import PROMPT_GENERATE_TEMPLATE_FIELD_ALIAS_MAP
 
@@ -230,6 +230,24 @@ class HistoryItem(BaseModel):
     minio_files: Optional[List[Dict[str, Any]]] = None
 
 
+class AgentToolParamsRequest(BaseModel):
+    """Request-scoped tool parameter overrides for a single agent."""
+
+    tools: Dict[str, Dict[str, Any]] = Field(
+        default_factory=dict,
+        description="Mapping from tool identifier to request-scoped override params",
+    )
+
+
+class ToolParamsRequest(BaseModel):
+    """Request-scoped tool parameter overrides for main and managed agents."""
+
+    agents: Dict[str, AgentToolParamsRequest] = Field(
+        default_factory=dict,
+        description="Mapping from agent identifier to tool parameter overrides",
+    )
+
+
 class AgentRequest(BaseModel):
     query: str
     conversation_id: Optional[int] = None
@@ -240,6 +258,7 @@ class AgentRequest(BaseModel):
     model_id: Optional[int] = None
     version_no: Optional[int] = None
     is_debug: Optional[bool] = False
+    tool_params: Optional[ToolParamsRequest] = None
 
 
 class MessageUnit(BaseModel):
@@ -414,6 +433,9 @@ class OptimizePromptSectionRequest(BaseModel):
     section_title: str
     current_content: str
     feedback: str
+    mode: Literal["general", "insert", "select"] = "general"
+    start_pos: Optional[int] = Field(None, description="Start position for insert/select mode")
+    end_pos: Optional[int] = Field(None, description="End position for insert/select mode")
     tool_ids: Optional[List[int]] = Field(
         None, description="Optional: tool IDs from frontend (takes precedence over database query)")
     sub_agent_ids: Optional[List[int]] = Field(
@@ -422,6 +444,38 @@ class OptimizePromptSectionRequest(BaseModel):
         None, description="Optional: knowledge base display names from frontend (takes precedence over database query)")
 
 
+class BadCaseItem(BaseModel):
+    question: str
+    answer: str
+    label: Optional[str] = None
+    reason: Optional[str] = None
+
+
+class OptimizePromptBadCaseRequest(BaseModel):
+    agent_id: int
+    model_id: int
+    current_content: str
+    bad_cases: List[BadCaseItem]
+    section_type: str
+    section_title: str
+    tool_ids: Optional[List[int]] = Field(None)
+    sub_agent_ids: Optional[List[int]] = Field(None)
+    knowledge_base_display_names: Optional[List[str]] = Field(None)
+
+
+class OptimizeFromDebugSelected(BaseModel):
+    user_question: str
+    assistant_answer: str
+
+
+class OptimizePromptFromDebugRequest(BaseModel):
+    agent_id: int
+    model_id: int
+    feedback: str
+    selected: OptimizeFromDebugSelected
+    history: Optional[List[HistoryItem]] = None
+
+
 class GenerateTitleRequest(BaseModel):
     conversation_id: int
     question: str
@@ -454,8 +508,18 @@ class AgentInfoRequest(BaseModel):
     group_ids: Optional[List[int]] = None
     ingroup_permission: Optional[str] = None
     enable_context_manager: Optional[bool] = None
+    verification_config: Optional[Dict[str, Any]] = None
+    greeting_message: Optional[str] = None
+    example_questions: Optional[List[str]] = None
     version_no: int = 0
 
+    @field_validator("verification_config", mode="before")
+    @classmethod
+    def normalize_verification_config(cls, value):
+        if value is None:
+            return None
+        return AgentVerificationConfig.model_validate(value).model_dump()
+
 
 class AgentIDRequest(BaseModel):
     agent_id: int
@@ -520,6 +584,7 @@ class MessageIdRequest(BaseModel):
 
 class ExportAndImportAgentInfo(BaseModel):
     agent_id: int
+    tenant_id: Optional[str] = None
     name: str
     display_name: Optional[str] = None
     description: str
@@ -527,6 +592,7 @@ class ExportAndImportAgentInfo(BaseModel):
     author: Optional[str] = None
     max_steps: int
     provide_run_summary: bool
+    verification_config: Optional[Dict[str, Any]] = None
     duty_prompt: Optional[str] = None
     constraint_prompt: Optional[str] = None
     few_shots_prompt: Optional[str] = None
@@ -556,6 +622,11 @@ class ExportAndImportDataFormat(BaseModel):
     mcp_info: List[MCPInfo]
 
 
+class AgentRepositorySnapshot(ExportAndImportDataFormat):
+    """Frozen marketplace snapshot: export format plus optional skill ZIP payloads."""
+    skills: Optional[List["SkillZipEntry"]] = None
+
+
 class SkillZipEntry(BaseModel):
     """A skill bundled inside an agent export ZIP."""
     skill_name: str
diff --git a/backend/data_process/tasks.py b/backend/data_process/tasks.py
index f2a30f9b7..4dd6edd69 100644
--- a/backend/data_process/tasks.py
+++ b/backend/data_process/tasks.py
@@ -8,9 +8,11 @@
 import os
 import threading
 import time
+from dataclasses import dataclass
 from typing import Any, Dict, Optional, List, Tuple
 
 import aiohttp
+import requests
 import re
 import ray
 from celery import Task, chain, states, group, chord
@@ -19,6 +21,7 @@
 
 from utils.file_management_utils import get_file_size
 from database.attachment_db import get_file_stream
+from database.knowledge_db import get_knowledge_record
 from services.redis_service import get_redis_service
 from .app import app
 from .ray_actors import DataProcessorRayActor
@@ -43,10 +46,12 @@
 
 
 logger = logging.getLogger("data_process.tasks")
-ASYNC_SPLIT_RETRY_MAX = max(FORWARD_REDIS_RETRY_MAX * 5, FORWARD_REDIS_RETRY_MAX)
+ASYNC_SPLIT_RETRY_MAX = max(
+    FORWARD_REDIS_RETRY_MAX * 5, FORWARD_REDIS_RETRY_MAX)
 FORWARD_ES_CHUNK_BATCH_SIZE = 64
 IMAGE_METADATA_PROCESS_SOURCE = "UniversalImageExtractor"
 
+
 def _wait_for_split_ready(redis_key: str, timeout_s: int, poll_interval_ms: int) -> int:
     """
     Wait until async split aggregation is marked ready in Redis.
@@ -91,7 +96,8 @@ def _estimate_parallel_parts() -> int:
 def _compute_split_wait_timeout(parts_count: int) -> int:
     base_timeout = DP_REDIS_CHUNKS_WAIT_TIMEOUT_S
     waves = math.ceil(max(1, parts_count) / _estimate_parallel_parts())
-    dynamic_timeout = base_timeout + max(0, waves - 1) * max(1, PER_WAVE_TIMEOUT)
+    dynamic_timeout = base_timeout + \
+        max(0, waves - 1) * max(1, PER_WAVE_TIMEOUT)
     return min(MAX_TIMEOUT, max(base_timeout, dynamic_timeout))
 
 
@@ -178,7 +184,6 @@ def _build_balanced_batches(
     return batches
 
 
-
 # Thread lock for initializing Ray to prevent race conditions
 ray_init_lock = threading.Lock()
 
@@ -327,6 +332,35 @@ def run_in_thread():
         raise
 
 
+def _delete_source_file_via_http_sync(
+    *,
+    base_url: str,
+    index_name: str,
+    path_or_url: str,
+    scope: str,
+    timeout_s: float = 30.0,
+) -> Dict[str, Any]:
+    base = (base_url or "").rstrip("/")
+    if not base:
+        raise RuntimeError("ELASTICSEARCH_SERVICE is not configured")
+    url = f"{base}/indices/{index_name}/documents"
+    params = {"path_or_url": path_or_url, "scope": scope}
+
+    resp = requests.delete(url, params=params, timeout=timeout_s)
+    body_text = getattr(resp, "text", "")
+    parsed = None
+    try:
+        parsed = resp.json()
+    except Exception:
+        parsed = _parse_json_or_none(body_text) if body_text else None
+
+    return {
+        "http_status": getattr(resp, "status_code", None),
+        "response_json": parsed if isinstance(parsed, dict) else None,
+        "response_text": body_text if not isinstance(parsed, dict) else None,
+    }
+
+
 def _build_forward_error(
     message: str,
     index_name: str,
@@ -350,6 +384,206 @@ def _parse_json_or_none(text: str) -> Optional[Dict[str, Any]]:
         return None
 
 
+@dataclass(frozen=True)
+class _ForwardContext:
+    task_id: str
+    request_id: str
+    start_time: float
+    source: str
+    index_name: str
+    source_type: str
+    original_filename: Optional[str]
+
+
+def _init_forward_context(
+    *,
+    task_id: str,
+    request_id: str,
+    start_time: float,
+    source: str,
+    index_name: str,
+    source_type: str,
+    original_filename: Optional[str],
+) -> _ForwardContext:
+    return _ForwardContext(
+        task_id=task_id,
+        request_id=request_id,
+        start_time=start_time,
+        source=source,
+        index_name=index_name,
+        source_type=source_type,
+        original_filename=original_filename,
+    )
+
+
+def _is_forward_task_cancelled(ctx: _ForwardContext) -> bool:
+    try:
+        redis_service = get_redis_service()
+        return bool(redis_service.is_task_cancelled(ctx.task_id))
+    except Exception as exc:
+        logger.warning(
+            f"[{ctx.request_id}] FORWARD TASK: Failed to check cancellation flag for task {ctx.task_id}: "
+            f"{exc}"
+        )
+        return False
+
+
+def _build_forward_cancelled_result(ctx: _ForwardContext) -> Dict[str, Any]:
+    return {
+        'task_id': ctx.task_id,
+        'source': ctx.source,
+        'index_name': ctx.index_name,
+        'original_filename': ctx.original_filename,
+        'chunks_stored': 0,
+        'storage_time': 0,
+        'es_result': {
+            "success": False,
+            "message": "Indexing cancelled because document was deleted.",
+            "total_indexed": 0,
+            "total_submitted": 0,
+        },
+    }
+
+
+def _load_forward_chunks(
+    self: Task,
+    *,
+    processed_data: Dict[str, Any],
+    original_source: str,
+    original_index_name: str,
+    filename: Optional[str],
+) -> Tuple[Optional[List[Dict[str, Any]]], bool, str, str, Optional[str]]:
+    chunks = processed_data.get('chunks')
+    split_async = bool(processed_data.get('split_async'))
+
+    # If chunks are not in payload, try loading from Redis via the redis_key
+    if (not chunks) and processed_data.get('redis_key'):
+        redis_key = processed_data.get('redis_key')
+        if not REDIS_BACKEND_URL:
+            raise Exception(json.dumps({
+                "message": "REDIS_BACKEND_URL not configured to retrieve chunks",
+                "index_name": original_index_name,
+                "task_name": "forward",
+                "source": original_source,
+                "original_filename": filename
+            }, ensure_ascii=False))
+        try:
+            import redis
+            client = redis.Redis.from_url(
+                REDIS_BACKEND_URL, decode_responses=True)
+            ready_key = f"{redis_key}:ready"
+            if split_async:
+                ready_flag = client.get(ready_key)
+                if not ready_flag:
+                    retry_num = getattr(self.request, 'retries', 0)
+                    logger.info(
+                        f"[{self.request.id}] FORWARD TASK: Async split not ready for key {redis_key}. Retry {retry_num + 1}/{ASYNC_SPLIT_RETRY_MAX} in {FORWARD_REDIS_RETRY_DELAY_S}s")
+                    raise self.retry(
+                        countdown=FORWARD_REDIS_RETRY_DELAY_S,
+                        max_retries=ASYNC_SPLIT_RETRY_MAX,
+                        exc=Exception(json.dumps({
+                            "message": "Async split not ready; will retry",
+                            "index_name": original_index_name,
+                            "task_name": "forward",
+                            "source": original_source,
+                            "original_filename": filename
+                        }, ensure_ascii=False))
+                    )
+            cached = client.get(redis_key)
+            if cached:
+                try:
+                    logger.debug(
+                        f"[{self.request.id}] FORWARD TASK: Retrieved Redis key '{redis_key}', payload_length={len(cached)}")
+                    chunks = json.loads(cached)
+                except json.JSONDecodeError as jde:
+                    # Log raw prefix to help diagnose incorrect writes
+                    raw_preview = cached[:120] if isinstance(
+                        cached, str) else str(type(cached))
+                    logger.error(
+                        f"[{self.request.id}] FORWARD TASK: JSON decode error for key '{redis_key}': {str(jde)}; raw_prefix={raw_preview!r}")
+                    raise
+            else:
+                if split_async:
+                    retry_num = getattr(self.request, 'retries', 0)
+                    logger.info(
+                        f"[{self.request.id}] FORWARD TASK: Async split ready but chunks missing for key {redis_key}. Retry {retry_num + 1}/{ASYNC_SPLIT_RETRY_MAX} in {FORWARD_REDIS_RETRY_DELAY_S}s")
+                    raise self.retry(
+                        countdown=FORWARD_REDIS_RETRY_DELAY_S,
+                        max_retries=ASYNC_SPLIT_RETRY_MAX,
+                        exc=Exception(json.dumps({
+                            "message": "Async split ready but chunks missing; will retry",
+                            "index_name": original_index_name,
+                            "task_name": "forward",
+                            "source": original_source,
+                            "original_filename": filename
+                        }, ensure_ascii=False))
+                    )
+                # No busy-wait: release the worker slot and retry later
+                retry_num = getattr(self.request, 'retries', 0)
+                logger.info(
+                    f"[{self.request.id}] FORWARD TASK: Chunks not yet available for key {redis_key}. Retry {retry_num + 1}/{FORWARD_REDIS_RETRY_MAX} in {FORWARD_REDIS_RETRY_DELAY_S}s")
+                raise self.retry(
+                    countdown=FORWARD_REDIS_RETRY_DELAY_S,
+                    max_retries=FORWARD_REDIS_RETRY_MAX,
+                    exc=Exception(json.dumps({
+                        "message": "Chunks not ready in Redis; will retry",
+                        "index_name": original_index_name,
+                        "task_name": "forward",
+                        "source": original_source,
+                        "original_filename": filename
+                    }, ensure_ascii=False))
+                )
+        except Retry:
+            raise
+        except Exception as exc:
+            raise Exception(json.dumps({
+                "message": f"Failed to retrieve chunks from Redis: {str(exc)}",
+                "index_name": original_index_name,
+                "task_name": "forward",
+                "source": original_source,
+                "original_filename": filename
+            }, ensure_ascii=False))
+
+    if processed_data.get('source'):
+        original_source = processed_data.get('source')
+    if processed_data.get('index_name'):
+        original_index_name = processed_data.get('index_name')
+    if processed_data.get('original_filename'):
+        filename = processed_data.get('original_filename')
+
+    logger.info(
+        f"[{self.request.id}] FORWARD TASK: Received data for source '{original_source}' with {len(chunks) if chunks else 'None'} chunks")
+
+    if chunks is None:
+        raise Exception(json.dumps({
+            "message": "No chunks received for forwarding",
+            "index_name": original_index_name,
+            "task_name": "forward",
+            "source": original_source,
+            "original_filename": filename
+        }, ensure_ascii=False))
+    if len(chunks) == 0:
+        if split_async and processed_data.get('redis_key'):
+            retry_num = getattr(self.request, 'retries', 0)
+            logger.info(
+                f"[{self.request.id}] FORWARD TASK: Empty chunks while waiting for async split. Retry {retry_num + 1}/{ASYNC_SPLIT_RETRY_MAX} in {FORWARD_REDIS_RETRY_DELAY_S}s")
+            raise self.retry(
+                countdown=FORWARD_REDIS_RETRY_DELAY_S,
+                max_retries=ASYNC_SPLIT_RETRY_MAX,
+                exc=Exception(json.dumps({
+                    "message": "Chunks not ready in Redis (empty); will retry",
+                    "index_name": original_index_name,
+                    "task_name": "forward",
+                    "source": original_source,
+                    "original_filename": filename
+                }, ensure_ascii=False))
+            )
+        logger.warning(
+            f"[{self.request.id}] FORWARD TASK: Empty chunks list received for source {original_source}")
+
+    return chunks, split_async, original_source, original_index_name, filename
+
+
 def _extract_error_code_from_es_response(
     parsed_body: Optional[Dict[str, Any]],
     text: str,
@@ -404,7 +638,7 @@ async def _post():
         try:
             connector = aiohttp.TCPConnector(verify_ssl=False)
             timeout = aiohttp.ClientTimeout(total=600)
-            
+
             request_params: Dict[str, str] = {}
 
             if large_mode:
@@ -423,7 +657,8 @@ async def _post():
                     parsed_body = _parse_json_or_none(text)
 
                     if status >= 400:
-                        error_code = _extract_error_code_from_es_response(parsed_body, text)
+                        error_code = _extract_error_code_from_es_response(
+                            parsed_body, text)
                         if error_code:
                             raise Exception(json.dumps({
                                 "error_code": error_code
@@ -508,7 +743,8 @@ def get_actor(self) -> Any:
         if not self.actors:
             actor = self._create_and_warm_actor()
             if actor is None:
-                raise RuntimeError("Global actor pool is empty and actor warm-up failed")
+                raise RuntimeError(
+                    "Global actor pool is empty and actor warm-up failed")
             self.actors.append(actor)
         idx = self.rr_index % len(self.actors)
         self.rr_index += 1
@@ -552,10 +788,12 @@ def prewarm_ray_actors(target_size: Optional[int] = None) -> int:
     """
     Ensure a global shared pool of warm Ray actors exists for low-latency task execution.
     """
-    desired = RAY_GLOBAL_ACTOR_POOL_SIZE if target_size is None else max(0, int(target_size))
+    desired = RAY_GLOBAL_ACTOR_POOL_SIZE if target_size is None else max(
+        0, int(target_size))
     manager = _get_or_create_global_pool_manager()
     current_after = ray.get(
-        manager.ensure_pool.remote(desired=desired, max_allowed=_estimate_parallel_parts())
+        manager.ensure_pool.remote(
+            desired=desired, max_allowed=_estimate_parallel_parts())
     )
     logger.info(
         f"Global Ray actor pool ready: current={current_after}, desired={desired}"
@@ -578,6 +816,7 @@ def _get_split_actor() -> Any:
     """
     return get_ray_actor()
 
+
 class LoggingTask(Task):
     """Base task class with enhanced logging"""
 
@@ -645,7 +884,8 @@ def process_part(
             "chunks_count": len(chunks),
         }
     except Exception as e:
-        logger.error(f"[process_part] Failed to process part for '{filename}': {str(e)}")
+        logger.error(
+            f"[process_part] Failed to process part for '{filename}': {str(e)}")
         return {
             "part_redis_key": part_redis_key,
             "chunks_count": 0,
@@ -1159,7 +1399,8 @@ def process(
             fetch_start = time.perf_counter()
             file_stream = get_file_stream(source)
             if file_stream is None:
-                raise FileNotFoundError(f"Unable to fetch file from URL: {source}")
+                raise FileNotFoundError(
+                    f"Unable to fetch file from URL: {source}")
             file_data = file_stream.read()
             fetch_elapsed = time.perf_counter() - fetch_start
             logger.info(
@@ -1208,7 +1449,8 @@ def process(
                     if cached:
                         cached_chunks = json.loads(cached)
                         if isinstance(cached_chunks, list):
-                            image_metadata_chunk_count = _count_image_metadata_chunks(cached_chunks)
+                            image_metadata_chunk_count = _count_image_metadata_chunks(
+                                cached_chunks)
             except Exception as image_count_exc:
                 logger.warning(
                     f"[{self.request.id}] PROCESS TASK: Failed counting image metadata chunks for async split: {image_count_exc}")
@@ -1232,17 +1474,17 @@ def process(
         self.update_state(
             state=states.SUCCESS,
             meta={
-            'chunks_count': chunk_count,
-            'processing_time': elapsed_time,
-            'source': source,
-            'index_name': index_name,
-            'original_filename': original_filename,
-            'task_name': 'process',
-            'stage': 'text_extracted',
-            'file_size_mb': file_size_mb,
-            'processing_speed_mb_s': file_size_mb / elapsed_time if file_size_mb > 0 and elapsed_time > 0 else 0
-        }
-    )
+                'chunks_count': chunk_count,
+                'processing_time': elapsed_time,
+                'source': source,
+                'index_name': index_name,
+                'original_filename': original_filename,
+                'task_name': 'process',
+                'stage': 'text_extracted',
+                'file_size_mb': file_size_mb,
+                'processing_speed_mb_s': file_size_mb / elapsed_time if file_size_mb > 0 and elapsed_time > 0 else 0
+            }
+        )
 
         logger.info(
             f"[{self.request.id}] PROCESS TASK: Processing complete, waiting for forward task")
@@ -1408,165 +1650,34 @@ def forward(
     filename = original_filename
 
     try:
-        # Before doing any heavy work, check whether this task has been
-        # explicitly cancelled (for example, because the user deleted the
-        # document from the knowledge base configuration page).
-        try:
-            redis_service = get_redis_service()
-            if redis_service.is_task_cancelled(task_id):
-                logger.info(
-                    f"[{self.request.id}] FORWARD TASK: Detected cancellation flag for task {task_id}; "
-                    f"skipping chunk forwarding for source '{source}' in index '{index_name}'."
-                )
-                # Treat this as a graceful early exit. We still return a
-                # structured payload so callers can consider the task done.
-                return {
-                    'task_id': task_id,
-                    'source': source,
-                    'index_name': index_name,
-                    'original_filename': original_filename,
-                    'chunks_stored': 0,
-                    'storage_time': 0,
-                    'es_result': {
-                        "success": False,
-                        "message": "Indexing cancelled because document was deleted.",
-                        "total_indexed": 0,
-                        "total_submitted": 0,
-                    },
-                }
-        except Exception as cancel_check_exc:
-            logger.warning(
-                f"[{self.request.id}] FORWARD TASK: Failed to check cancellation flag for task {task_id}: "
-                f"{cancel_check_exc}"
-            )
+        ctx = _init_forward_context(
+            task_id=task_id,
+            request_id=str(self.request.id),
+            start_time=start_time,
+            source=source,
+            index_name=index_name,
+            source_type=source_type,
+            original_filename=original_filename,
+        )
 
-        chunks = processed_data.get('chunks')
-        split_async = bool(processed_data.get('split_async'))
-        # If chunks are not in payload, try loading from Redis via the redis_key
-        if (not chunks) and processed_data.get('redis_key'):
-            redis_key = processed_data.get('redis_key')
-            if not REDIS_BACKEND_URL:
-                raise Exception(json.dumps({
-                    "message": "REDIS_BACKEND_URL not configured to retrieve chunks",
-                    "index_name": original_index_name,
-                    "task_name": "forward",
-                    "source": original_source,
-                    "original_filename": filename
-                }, ensure_ascii=False))
-            try:
-                import redis
-                client = redis.Redis.from_url(
-                    REDIS_BACKEND_URL, decode_responses=True)
-                ready_key = f"{redis_key}:ready"
-                if split_async:
-                    ready_flag = client.get(ready_key)
-                    if not ready_flag:
-                        retry_num = getattr(self.request, 'retries', 0)
-                        logger.info(
-                            f"[{self.request.id}] FORWARD TASK: Async split not ready for key {redis_key}. Retry {retry_num + 1}/{ASYNC_SPLIT_RETRY_MAX} in {FORWARD_REDIS_RETRY_DELAY_S}s")
-                        raise self.retry(
-                            countdown=FORWARD_REDIS_RETRY_DELAY_S,
-                            max_retries=ASYNC_SPLIT_RETRY_MAX,
-                            exc=Exception(json.dumps({
-                                "message": "Async split not ready; will retry",
-                                "index_name": original_index_name,
-                                "task_name": "forward",
-                                "source": original_source,
-                                "original_filename": filename
-                            }, ensure_ascii=False))
-                        )
-                cached = client.get(redis_key)
-                if cached:
-                    try:
-                        logger.debug(
-                            f"[{self.request.id}] FORWARD TASK: Retrieved Redis key '{redis_key}', payload_length={len(cached)}")
-                        chunks = json.loads(cached)
-                    except json.JSONDecodeError as jde:
-                        # Log raw prefix to help diagnose incorrect writes
-                        raw_preview = cached[:120] if isinstance(
-                            cached, str) else str(type(cached))
-                        logger.error(
-                            f"[{self.request.id}] FORWARD TASK: JSON decode error for key '{redis_key}': {str(jde)}; raw_prefix={raw_preview!r}")
-                        raise
-                else:
-                    if split_async:
-                        retry_num = getattr(self.request, 'retries', 0)
-                        logger.info(
-                            f"[{self.request.id}] FORWARD TASK: Async split ready but chunks missing for key {redis_key}. Retry {retry_num + 1}/{ASYNC_SPLIT_RETRY_MAX} in {FORWARD_REDIS_RETRY_DELAY_S}s")
-                        raise self.retry(
-                            countdown=FORWARD_REDIS_RETRY_DELAY_S,
-                            max_retries=ASYNC_SPLIT_RETRY_MAX,
-                            exc=Exception(json.dumps({
-                                "message": "Async split ready but chunks missing; will retry",
-                                "index_name": original_index_name,
-                                "task_name": "forward",
-                                "source": original_source,
-                                "original_filename": filename
-                            }, ensure_ascii=False))
-                        )
-                    # No busy-wait: release the worker slot and retry later
-                    retry_num = getattr(self.request, 'retries', 0)
-                    logger.info(
-                        f"[{self.request.id}] FORWARD TASK: Chunks not yet available for key {redis_key}. Retry {retry_num + 1}/{FORWARD_REDIS_RETRY_MAX} in {FORWARD_REDIS_RETRY_DELAY_S}s")
-                    raise self.retry(
-                        countdown=FORWARD_REDIS_RETRY_DELAY_S,
-                        max_retries=FORWARD_REDIS_RETRY_MAX,
-                        exc=Exception(json.dumps({
-                            "message": "Chunks not ready in Redis; will retry",
-                            "index_name": original_index_name,
-                            "task_name": "forward",
-                            "source": original_source,
-                            "original_filename": filename
-                        }, ensure_ascii=False))
-                    )
-            except Retry:
-                raise
-            except Exception as exc:
-                raise Exception(json.dumps({
-                    "message": f"Failed to retrieve chunks from Redis: {str(exc)}",
-                    "index_name": original_index_name,
-                    "task_name": "forward",
-                    "source": original_source,
-                    "original_filename": filename
-                }, ensure_ascii=False))
-        if processed_data.get('source'):
-            original_source = processed_data.get('source')
-        if processed_data.get('index_name'):
-            original_index_name = processed_data.get('index_name')
-        if processed_data.get('original_filename'):
-            filename = processed_data.get('original_filename')
-        logger.info(
-            f"[{self.request.id}] FORWARD TASK: Received data for source '{original_source}' with {len(chunks) if chunks else 'None'} chunks")
+        # Before doing any heavy work, check whether this task has been explicitly cancelled.
+        if _is_forward_task_cancelled(ctx):
+            logger.info(
+                f"[{self.request.id}] FORWARD TASK: Detected cancellation flag for task {task_id}; "
+                f"skipping chunk forwarding for source '{source}' in index '{index_name}'."
+            )
+            return _build_forward_cancelled_result(ctx)
+
+        chunks, split_async, original_source, original_index_name, filename = _load_forward_chunks(
+            self,
+            processed_data=processed_data,
+            original_source=original_source,
+            original_index_name=original_index_name,
+            filename=filename,
+        )
 
         # Calculate total chunks for progress tracking
         total_chunks = len(chunks) if chunks else 0
-
-        if chunks is None:
-            raise Exception(json.dumps({
-                "message": "No chunks received for forwarding",
-                "index_name": original_index_name,
-                "task_name": "forward",
-                "source": original_source,
-                "original_filename": original_filename
-            }, ensure_ascii=False))
-        if len(chunks) == 0:
-            if split_async and processed_data.get('redis_key'):
-                retry_num = getattr(self.request, 'retries', 0)
-                logger.info(
-                    f"[{self.request.id}] FORWARD TASK: Empty chunks while waiting for async split. Retry {retry_num + 1}/{ASYNC_SPLIT_RETRY_MAX} in {FORWARD_REDIS_RETRY_DELAY_S}s")
-                raise self.retry(
-                    countdown=FORWARD_REDIS_RETRY_DELAY_S,
-                    max_retries=ASYNC_SPLIT_RETRY_MAX,
-                    exc=Exception(json.dumps({
-                        "message": "Chunks not ready in Redis (empty); will retry",
-                        "index_name": original_index_name,
-                        "task_name": "forward",
-                        "source": original_source,
-                        "original_filename": filename
-                    }, ensure_ascii=False))
-                )
-            logger.warning(
-                f"[{self.request.id}] FORWARD TASK: Empty chunks list received for source {original_source}")
         formatted_chunks = []
         # Compute once per file to avoid repeated IO/MinIO calls inside loop
         file_size = get_file_size(source_type, original_source) if isinstance(
@@ -1757,6 +1868,7 @@ def forward(
 
         logger.info(
             f"[{self.request.id}] FORWARD TASK: Successfully stored {len(chunks)} chunks to index {original_index_name} in {end_time - start_time:.2f}s")
+
         return {
             'task_id': task_id,
             'source': original_source,
@@ -1839,9 +1951,106 @@ def forward(
         raise
 
 
-@app.task(bind=True, base=LoggingTask, name='data_process.tasks.process_and_forward')
-def process_and_forward(
-        self,
+@app.task(
+    bind=True,
+    base=LoggingTask,
+    name="data_process.tasks.cleanup_source",
+    queue="forward_q",
+)
+def cleanup_source(self, forward_result: Dict[str, Any]) -> Dict[str, Any]:
+    """
+    Conditionally delete the MinIO source file after successful indexing.
+
+    If the knowledge base is configured with preserve_source_file=false, call:
+    DELETE /indices/{index_name}/documents?path_or_url=...&scope=source_only
+    """
+    index_name = (forward_result or {}).get("index_name")
+    source = (forward_result or {}).get("source")
+
+    cleanup_info: Dict[str, Any] = {
+        "attempted": False,
+        "skipped_reason": None,
+        "success": None,
+        "http_status": None,
+        "response": None,
+        "error": None,
+    }
+
+    if not index_name or not source:
+        cleanup_info["skipped_reason"] = "missing_index_name_or_source"
+        forward_result = dict(forward_result or {})
+        forward_result["source_cleanup"] = cleanup_info
+        return forward_result
+
+    try:
+        record = get_knowledge_record({"index_name": index_name}) or {}
+        preserve_source_file = record.get("preserve_source_file", True)
+    except Exception as exc:
+        logger.warning(
+            "[%s] CLEANUP TASK: Failed to load knowledge config for index '%s': %s",
+            getattr(self.request, "id", "unknown"),
+            index_name,
+            exc,
+        )
+        cleanup_info["skipped_reason"] = "knowledge_record_lookup_failed"
+        forward_result = dict(forward_result or {})
+        forward_result["source_cleanup"] = cleanup_info
+        return forward_result
+
+    if preserve_source_file:
+        cleanup_info["skipped_reason"] = "preserve_source_file_true"
+        forward_result = dict(forward_result or {})
+        forward_result["source_cleanup"] = cleanup_info
+        return forward_result
+
+    cleanup_info["attempted"] = True
+    try:
+        resp = _delete_source_file_via_http_sync(
+            base_url=ELASTICSEARCH_SERVICE,
+            index_name=index_name,
+            path_or_url=source,
+            scope="source_only",
+        )
+        cleanup_info["http_status"] = resp.get("http_status")
+        cleanup_info["response"] = (
+            resp.get("response_json")
+            if resp.get("response_json") is not None
+            else resp.get("response_text")
+        )
+
+        ok = False
+        if isinstance(resp.get("response_json"), dict):
+            ok = bool(resp["response_json"].get("status") == "success")
+        elif resp.get("http_status") and 200 <= int(resp["http_status"]) < 300:
+            ok = True
+
+        cleanup_info["success"] = ok
+        if not ok:
+            logger.warning(
+                "[%s] CLEANUP TASK: Source-only delete did not succeed. index='%s' source='%s' http_status=%s",
+                getattr(self.request, "id", "unknown"),
+                index_name,
+                source,
+                cleanup_info["http_status"],
+            )
+    except Exception as exc:
+        cleanup_info["success"] = False
+        cleanup_info["error"] = str(exc)
+        logger.warning(
+            "[%s] CLEANUP TASK: Source-only delete failed. index='%s' source='%s' error=%s",
+            getattr(self.request, "id", "unknown"),
+            index_name,
+            source,
+            exc,
+        )
+
+    forward_result = dict(forward_result or {})
+    forward_result["source_cleanup"] = cleanup_info
+    return forward_result
+
+
+def submit_process_forward_chain(
+        *,
         source: str,
         source_type: str,
         chunking_strategy: str,
@@ -1849,30 +2058,14 @@ def process_and_forward(
         original_filename: Optional[str] = None,
         authorization: Optional[str] = None,
         embedding_model_id: Optional[int] = None,
-        tenant_id: Optional[str] = None
+        tenant_id: Optional[str] = None,
 ) -> str:
     """
-    Combined task that chains processing and forwarding
-
-    This task delegates to a chain of process -> forward
-
-    Args:
-        source: Source file path, URL, or text content
-        source_type: source of the file("local", "minio")
-        chunking_strategy: Strategy for chunking the document
-        index_name: Name of the index to store documents
-        original_filename: The original name of the file
-        authorization: Authorization header for API calls
-        embedding_model_id: Embedding model ID for chunk size configuration
-        tenant_id: Tenant ID for retrieving model configuration
+    Build and enqueue a Celery chain: process -> forward.
 
     Returns:
-        Task ID of the chain
+        Celery chain task ID, or empty string if enqueue failed.
     """
-    logger.info(
-        f"Starting processing chain for {source}, original_filename={original_filename}, strategy={chunking_strategy}, index={index_name}, model_id={embedding_model_id}")
-
-    # Create a task chain
     task_chain = chain(
         process.s(
             source=source,
@@ -1889,20 +2082,66 @@ def process_and_forward(
             source_type=source_type,
             original_filename=original_filename,
             authorization=authorization
-        ).set(queue='forward_q')
+        ).set(queue='forward_q'),
+        cleanup_source.s().set(queue='forward_q'),
     )
 
-    # Execute the chain
     result = task_chain.apply_async()
     if result is None or not hasattr(result, 'id') or result.id is None:
         logger.error(
             "Celery chain apply_async() did not return a valid result or result.id")
         return ""
-    logger.info(f"Created task chain ID: {result.id}")
-
     return result.id
 
 
+@app.task(bind=True, base=LoggingTask, name='data_process.tasks.process_and_forward')
+def process_and_forward(
+        self,
+        source: str,
+        source_type: str,
+        chunking_strategy: str,
+        index_name: Optional[str] = None,
+        original_filename: Optional[str] = None,
+        authorization: Optional[str] = None,
+        embedding_model_id: Optional[int] = None,
+        tenant_id: Optional[str] = None
+) -> str:
+    """
+    Combined task that chains processing and forwarding
+
+    This task delegates to a chain of process -> forward
+
+    Args:
+        source: Source file path, URL, or text content
+        source_type: source of the file("local", "minio")
+        chunking_strategy: Strategy for chunking the document
+        index_name: Name of the index to store documents
+        original_filename: The original name of the file
+        authorization: Authorization header for API calls
+        embedding_model_id: Embedding model ID for chunk size configuration
+        tenant_id: Tenant ID for retrieving model configuration
+
+    Returns:
+        Task ID of the chain
+    """
+    logger.info(
+        f"Starting processing chain for {source}, original_filename={original_filename}, strategy={chunking_strategy}, index={index_name}, model_id={embedding_model_id}")
+
+    chain_id = submit_process_forward_chain(
+        source=source,
+        source_type=source_type,
+        chunking_strategy=chunking_strategy,
+        index_name=index_name,
+        original_filename=original_filename,
+        authorization=authorization,
+        embedding_model_id=embedding_model_id,
+        tenant_id=tenant_id,
+    )
+    if chain_id:
+        logger.info(f"Created task chain ID: {chain_id}")
+    return chain_id
+
+
 @app.task(bind=True, base=LoggingTask, name='data_process.tasks.process_sync')
 def process_sync(
         self,
diff --git a/backend/database/agent_db.py b/backend/database/agent_db.py
index 82696ffab..533659b0f 100644
--- a/backend/database/agent_db.py
+++ b/backend/database/agent_db.py
@@ -1,9 +1,10 @@
 import logging
-from typing import List
+from typing import List, Optional
 from sqlalchemy import or_, update
 
 from database.client import get_db_session, as_dict, filter_property
 from database.db_models import AgentInfo, ToolInstance, AgentRelation
+from database.agent_version_db import query_current_version_no
 from consts.const import ASSET_OWNER_TENANT_ID
 from utils.str_utils import convert_list_to_string
 
@@ -102,6 +103,40 @@ def query_sub_agents_id_list(main_agent_id: int, tenant_id: str, version_no: int
         return [relation.selected_agent_id for relation in relations]
 
 
+def query_sub_agent_relations(main_agent_id: int, tenant_id: str, version_no: int = 0) -> List[dict]:
+    """
+    Query sub-agent relations by main agent id, including pinned version info.
+    Default version_no=0 queries the draft version.
+
+    Args:
+        main_agent_id: Parent agent ID
+        tenant_id: Tenant ID
+        version_no: Version number to filter. Default 0 = draft/editing state
+    """
+    with get_db_session() as session:
+        query = session.query(AgentRelation).filter(
+            AgentRelation.parent_agent_id == main_agent_id,
+            AgentRelation.tenant_id == tenant_id,
+            AgentRelation.version_no == version_no,
+            AgentRelation.delete_flag != 'Y')
+        relations = query.all()
+        return [as_dict(relation) for relation in relations]
+
+
+def resolve_sub_agent_version_no(
+    selected_agent_id: int,
+    selected_agent_version_no: Optional[int],
+    tenant_id: str,
+) -> int:
+    """
+    Resolve the effective version number for a sub-agent relation.
+    Uses pinned version when set; otherwise falls back to child's current published version.
+    """
+    if selected_agent_version_no is not None:
+        return selected_agent_version_no
+    return query_current_version_no(agent_id=selected_agent_id, tenant_id=tenant_id) or 0
+
+
 def clear_agent_new_mark(agent_id: int, tenant_id: str, user_id: str, version_no: int = 0):
     """
     Clear the NEW mark for an agent.
@@ -163,6 +198,7 @@ def create_agent(agent_info, tenant_id: str, user_id: str):
     """
     info_with_metadata = dict(agent_info)
     info_with_metadata.setdefault("max_steps", 15)
+    info_with_metadata.setdefault("verification_config", None)
     info_with_metadata.update({
         "tenant_id": tenant_id,
         "version_no": 0,  # Default to draft version
@@ -201,6 +237,9 @@ def create_agent(agent_info, tenant_id: str, user_id: str):
             "group_ids": new_agent.group_ids,
             "is_new": new_agent.is_new,
             "enable_context_manager": new_agent.enable_context_manager,
+            "verification_config": new_agent.verification_config,
+            "greeting_message": new_agent.greeting_message,
+            "example_questions": new_agent.example_questions,
             "current_version_no": new_agent.current_version_no,
             "version_no": new_agent.version_no,
             "created_by": new_agent.created_by,
diff --git a/backend/database/agent_repository_db.py b/backend/database/agent_repository_db.py
new file mode 100644
index 000000000..a6bb4f48b
--- /dev/null
+++ b/backend/database/agent_repository_db.py
@@ -0,0 +1,358 @@
+import logging
+import math
+from typing import Any, Dict, List, Optional
+
+from sqlalchemy import func, or_, update
+
+from database.client import as_dict, filter_property, get_db_session
+from database.db_models import AgentRepository
+
+logger = logging.getLogger("agent_repository_db")
+
+# Listing status: NOT_SHARED (未共享), PENDING_REVIEW (待审核),
+# REJECTED (审核驳回), SHARED (已共享)
+STATUS_NOT_SHARED = "NOT_SHARED"
+STATUS_PENDING_REVIEW = "PENDING_REVIEW"
+STATUS_REJECTED = "REJECTED"
+STATUS_SHARED = "SHARED"
+
+VALID_REPOSITORY_STATUSES = frozenset({
+    STATUS_NOT_SHARED,
+    STATUS_PENDING_REVIEW,
+    STATUS_REJECTED,
+    STATUS_SHARED,
+})
+
+_UPSERT_IMMUTABLE_FIELDS = frozenset({
+    "agent_id",
+    "agent_repository_id",
+    "publisher_tenant_id",
+})
+
+_UPSERT_SNAPSHOT_FIELDS = frozenset({
+    "source_version_no",
+    "name",
+    "display_name",
+    "description",
+    "author",
+    "category_id",
+    "tags",
+    "tool_count",
+    "version_label",
+    "agent_info_json",
+})
+
+
+def insert_agent_repository_record(
+    repository_data: Dict[str, Any],
+    publisher_tenant_id: str,
+    publisher_user_id: str,
+) -> int:
+    """Insert a new agent repository listing record."""
+    with get_db_session() as session:
+        payload = {
+            **repository_data,
+            "publisher_tenant_id": publisher_tenant_id,
+            "publisher_user_id": publisher_user_id,
+            "created_by": publisher_user_id,
+            "updated_by": publisher_user_id,
+            "delete_flag": "N",
+        }
+        if payload.get("status") is None:
+            payload["status"] = STATUS_NOT_SHARED
+
+        new_record = AgentRepository(
+            **filter_property(payload, AgentRepository)
+        )
+        session.add(new_record)
+        session.flush()
+        return int(new_record.agent_repository_id)
+
+
+def get_agent_repository_by_id(repository_id: int) -> Optional[dict]:
+    """Fetch a repository listing by primary key."""
+    with get_db_session() as session:
+        record = session.query(AgentRepository).filter(
+            AgentRepository.agent_repository_id == repository_id,
+            AgentRepository.delete_flag != "Y",
+        ).first()
+        return as_dict(record) if record else None
+
+
+def get_agent_repository_by_id_and_publisher(
+    repository_id: int,
+    publisher_tenant_id: str,
+) -> Optional[dict]:
+    """Fetch a repository listing scoped to the publisher tenant."""
+    with get_db_session() as session:
+        record = session.query(AgentRepository).filter(
+            AgentRepository.agent_repository_id == repository_id,
+            AgentRepository.publisher_tenant_id == publisher_tenant_id,
+            AgentRepository.delete_flag != "Y",
+        ).first()
+        return as_dict(record) if record else None
+
+
+def get_agent_repository_by_agent_id(agent_id: int) -> Optional[dict]:
+    """Fetch an active repository listing by root agent_id."""
+    with get_db_session() as session:
+        record = session.query(AgentRepository).filter(
+            AgentRepository.agent_id == agent_id,
+            AgentRepository.delete_flag != "Y",
+        ).first()
+        return as_dict(record) if record else None
+
+
+def upsert_agent_repository_record(
+    repository_data: Dict[str, Any],
+    publisher_tenant_id: str,
+    publisher_user_id: str,
+) -> tuple[int, bool]:
+    """Insert or update a repository listing keyed by agent_id.
+
+    When no record exists, inserts a new listing. When a record exists:
+    - Same source_version_no: updates status (and updated_by) only.
+    - Different source_version_no: updates all snapshot fields, preserving
+      agent_id, agent_repository_id, and publisher_tenant_id.
+
+    Returns:
+        Tuple of (agent_repository_id, is_updated). is_updated is False on insert.
+    """
+    agent_id = repository_data.get("agent_id")
+    if agent_id is None:
+        raise ValueError("agent_id is required for repository upsert")
+
+    existing = get_agent_repository_by_agent_id(int(agent_id))
+    if not existing:
+        repository_id = insert_agent_repository_record(
+            repository_data=repository_data,
+            publisher_tenant_id=publisher_tenant_id,
+            publisher_user_id=publisher_user_id,
+        )
+        return repository_id, False
+
+    existing_version = existing.get("source_version_no")
+    incoming_version = repository_data.get("source_version_no")
+    repository_id = int(existing["agent_repository_id"])
+
+    if existing_version == incoming_version:
+        update_fields: Dict[str, Any] = {
+            "status": repository_data.get("status", STATUS_NOT_SHARED),
+            "updated_by": publisher_user_id,
+        }
+    else:
+        update_fields = {
+            key: repository_data[key]
+            for key in _UPSERT_SNAPSHOT_FIELDS
+            if key in repository_data
+        }
+        update_fields["publisher_user_id"] = publisher_user_id
+        update_fields["updated_by"] = publisher_user_id
+        update_fields["status"] = repository_data.get("status", STATUS_NOT_SHARED)
+
+    with get_db_session() as session:
+        session.execute(
+            update(AgentRepository)
+            .where(
+                AgentRepository.agent_repository_id == repository_id,
+                AgentRepository.publisher_tenant_id == publisher_tenant_id,
+                AgentRepository.delete_flag != "Y",
+            )
+            .values(**update_fields)
+        )
+    return repository_id, True
+
+
+def list_agent_repository_summaries(
+    *,
+    status: Optional[str] = None,
+) -> List[dict]:
+    """List all active repository summaries without heavy JSON blobs."""
+    with get_db_session() as session:
+        query = session.query(
+            AgentRepository.agent_repository_id,
+            AgentRepository.author,
+            AgentRepository.name,
+            AgentRepository.display_name,
+            AgentRepository.description,
+            AgentRepository.status,
+        ).filter(
+            AgentRepository.delete_flag != "Y",
+        )
+        if status:
+            query = query.filter(AgentRepository.status == status)
+        rows = query.order_by(AgentRepository.agent_repository_id.desc()).all()
+        return [
+            {
+                "agent_repository_id": row.agent_repository_id,
+                "author": row.author,
+                "name": row.name,
+                "display_name": row.display_name,
+                "description": row.description,
+                "status": row.status,
+            }
+            for row in rows
+        ]
+
+
+def query_agent_repository_list(
+    *,
+    page: int = 1,
+    page_size: int = 20,
+    search: Optional[str] = None,
+    tag: Optional[str] = None,
+    category_id: Optional[int] = None,
+    status: Optional[str] = STATUS_SHARED,
+    publisher_tenant_id: Optional[str] = None,
+) -> Dict[str, Any]:
+    """Query repository listings with offset pagination."""
+    page = max(page, 1)
+    page_size = max(min(page_size, 100), 1)
+    offset = (page - 1) * page_size
+
+    with get_db_session() as session:
+        query = session.query(AgentRepository).filter(
+            AgentRepository.delete_flag != "Y",
+        )
+
+        if status:
+            query = query.filter(AgentRepository.status == status)
+        if publisher_tenant_id:
+            query = query.filter(
+                AgentRepository.publisher_tenant_id == publisher_tenant_id
+            )
+        if category_id is not None:
+            query = query.filter(AgentRepository.category_id == category_id)
+        if tag:
+            query = query.filter(AgentRepository.tags.any(tag))
+        if search:
+            keyword = f"%{search}%"
+            query = query.filter(
+                or_(
+                    AgentRepository.name.ilike(keyword),
+                    AgentRepository.display_name.ilike(keyword),
+                    AgentRepository.description.ilike(keyword),
+                    AgentRepository.author.ilike(keyword),
+                    func.array_to_string(AgentRepository.tags, ",").ilike(keyword),
+                )
+            )
+
+        total = query.count()
+        rows = (
+            query.order_by(AgentRepository.agent_repository_id.desc())
+            .offset(offset)
+            .limit(page_size)
+            .all()
+        )
+
+        total_pages = math.ceil(total / page_size) if total else 0
+        return {
+            "items": [as_dict(row) for row in rows],
+            "pagination": {
+                "page": page,
+                "page_size": page_size,
+                "total": total,
+                "total_pages": total_pages,
+            },
+        }
+
+
+def update_agent_repository_by_id(
+    *,
+    repository_id: int,
+    publisher_tenant_id: str,
+    user_id: str,
+    updates: Dict[str, Any],
+) -> int:
+    """Update a repository listing owned by the publisher tenant. Returns affected row count."""
+    allowed_fields = {
+        "display_name",
+        "description",
+        "author",
+        "category_id",
+        "tags",
+        "tool_count",
+        "version_label",
+        "source_version_no",
+        "agent_info_json",
+        "status",
+    }
+    update_fields = {
+        key: value
+        for key, value in updates.items()
+        if key in allowed_fields
+    }
+    if not update_fields:
+        return 0
+
+    update_fields["updated_by"] = user_id
+
+    with get_db_session() as session:
+        result = session.execute(
+            update(AgentRepository)
+            .where(
+                AgentRepository.agent_repository_id == repository_id,
+                AgentRepository.publisher_tenant_id == publisher_tenant_id,
+                AgentRepository.delete_flag != "Y",
+            )
+            .values(**update_fields)
+        )
+        return int(result.rowcount or 0)
+
+
+def update_agent_repository_status_by_id(
+    *,
+    repository_id: int,
+    status: str,
+    user_id: str,
+) -> int:
+    """Update repository listing status by primary key. Returns affected row count."""
+    with get_db_session() as session:
+        result = session.execute(
+            update(AgentRepository)
+            .where(
+                AgentRepository.agent_repository_id == repository_id,
+                AgentRepository.delete_flag != "Y",
+            )
+            .values(status=status, updated_by=user_id)
+        )
+        return int(result.rowcount or 0)
+
+
+def soft_delete_agent_repository_by_id(
+    *,
+    repository_id: int,
+    publisher_tenant_id: str,
+    user_id: str,
+) -> int:
+    """Soft-delete a repository listing owned by the publisher tenant."""
+    with get_db_session() as session:
+        result = session.execute(
+            update(AgentRepository)
+            .where(
+                AgentRepository.agent_repository_id == repository_id,
+                AgentRepository.publisher_tenant_id == publisher_tenant_id,
+                AgentRepository.delete_flag != "Y",
+            )
+            .values(delete_flag="Y", updated_by=user_id)
+        )
+        return int(result.rowcount or 0)
+
+
+def list_agent_repository_by_publisher(
+    publisher_tenant_id: str,
+    *,
+    publisher_user_id: Optional[str] = None,
+) -> List[dict]:
+    """List all repository listings published by a tenant."""
+    with get_db_session() as session:
+        query = session.query(AgentRepository).filter(
+            AgentRepository.publisher_tenant_id == publisher_tenant_id,
+            AgentRepository.delete_flag != "Y",
+        )
+        if publisher_user_id:
+            query = query.filter(
+                AgentRepository.publisher_user_id == publisher_user_id
+            )
+        rows = query.order_by(AgentRepository.agent_repository_id.desc()).all()
+        return [as_dict(row) for row in rows]
diff --git a/backend/database/cas_session_db.py b/backend/database/cas_session_db.py
new file mode 100644
index 000000000..57d1aa8ea
--- /dev/null
+++ b/backend/database/cas_session_db.py
@@ -0,0 +1,134 @@
+"""
+Database operations for CAS-backed web sessions.
+"""
+
+from datetime import datetime
+from typing import Any, Dict, Optional
+
+from database.client import as_dict, get_db_session
+from database.db_models import UserCasSession
+
+CAS_SESSION_ACTIVE = "active"
+CAS_SESSION_REVOKED = "revoked"
+
+
+def create_cas_session(
+    *,
+    session_id: str,
+    user_id: str,
+    cas_user_id: str,
+    expires_at: datetime,
+    cas_session_index: Optional[str] = None,
+) -> Dict[str, Any]:
+    with get_db_session() as session:
+        record = UserCasSession(
+            session_id=session_id,
+            user_id=user_id,
+            cas_user_id=cas_user_id,
+            cas_session_index=cas_session_index,
+            status=CAS_SESSION_ACTIVE,
+            expires_at=expires_at,
+            created_by=user_id,
+            updated_by=user_id,
+        )
+        session.add(record)
+        session.flush()
+        return as_dict(record)
+
+
+def get_cas_session_by_session_id(session_id: str) -> Optional[Dict[str, Any]]:
+    if not session_id:
+        return None
+    with get_db_session() as session:
+        result = (
+            session.query(UserCasSession)
+            .filter(
+                UserCasSession.session_id == session_id,
+                UserCasSession.delete_flag == "N",
+            )
+            .first()
+        )
+        return as_dict(result) if result else None
+
+
+def is_cas_session_active(session_id: str) -> bool:
+    if not session_id:
+        return False
+    with get_db_session() as session:
+        result = (
+            session.query(UserCasSession)
+            .filter(
+                UserCasSession.session_id == session_id,
+                UserCasSession.status == CAS_SESSION_ACTIVE,
+                UserCasSession.expires_at > datetime.now(),
+                UserCasSession.delete_flag == "N",
+            )
+            .first()
+        )
+        return result is not None
+
+
+def revoke_cas_session_by_session_id(session_id: str, actor: str = "cas") -> int:
+    if not session_id:
+        return 0
+    with get_db_session() as session:
+        result = (
+            session.query(UserCasSession)
+            .filter(
+                UserCasSession.session_id == session_id,
+                UserCasSession.status == CAS_SESSION_ACTIVE,
+                UserCasSession.delete_flag == "N",
+            )
+            .update(
+                {
+                    "status": CAS_SESSION_REVOKED,
+                    "revoked_at": datetime.now(),
+                    "updated_by": actor,
+                }
+            )
+        )
+        return result
+
+
+def revoke_cas_sessions_by_user_id(cas_user_id: str, actor: str = "cas") -> int:
+    if not cas_user_id:
+        return 0
+    with get_db_session() as session:
+        result = (
+            session.query(UserCasSession)
+            .filter(
+                UserCasSession.cas_user_id == cas_user_id,
+                UserCasSession.status == CAS_SESSION_ACTIVE,
+                UserCasSession.delete_flag == "N",
+            )
+            .update(
+                {
+                    "status": CAS_SESSION_REVOKED,
+                    "revoked_at": datetime.now(),
+                    "updated_by": actor,
+                }
+            )
+        )
+        return result
+
+
+def revoke_cas_session_by_index(cas_session_index: str, actor: str = "cas") -> int:
+    if not cas_session_index:
+        return 0
+    with get_db_session() as session:
+        result = (
+            session.query(UserCasSession)
+            .filter(
+                UserCasSession.cas_session_index == cas_session_index,
+                UserCasSession.status == CAS_SESSION_ACTIVE,
+                UserCasSession.delete_flag == "N",
+            )
+            .update(
+                {
+                    "status": CAS_SESSION_REVOKED,
+                    "revoked_at": datetime.now(),
+                    "updated_by": actor,
+                }
+            )
+        )
+        return result
diff --git a/backend/database/conversation_db.py b/backend/database/conversation_db.py
index 18c0ee9fc..2d06bb9be 100644
--- a/backend/database/conversation_db.py
+++ b/backend/database/conversation_db.py
@@ -1016,3 +1016,71 @@ def get_message_id_by_index(conversation_id: int, message_index: int) -> Optiona
         result = session.execute(stmt).scalar()
 
         return result
+
+
+def get_latest_assistant_message_id(conversation_id: int, user_id: Optional[str] = None) -> Optional[int]:
+    """
+    Get the most recent assistant message ID for a conversation.
+
+    Args:
+        conversation_id: Conversation ID (integer)
+        user_id: Optional user ID for ownership check
+
+    Returns:
+        Optional[int]: The latest assistant message ID, or None if not found
+    """
+    with get_db_session() as session:
+        conversation_id = int(conversation_id)
+
+        stmt = select(ConversationMessage.message_id).where(
+            ConversationMessage.conversation_id == conversation_id,
+            ConversationMessage.delete_flag == 'N',
+            ConversationMessage.message_role == 'assistant'
+        ).order_by(desc(ConversationMessage.message_index)).limit(1)
+
+        if user_id:
+            stmt = stmt.join(
+                ConversationRecord,
+                ConversationMessage.conversation_id == ConversationRecord.conversation_id
+            ).where(ConversationRecord.created_by == user_id)
+
+        result = session.execute(stmt).scalar()
+        return result
+
+
+def update_message_minio_files(message_id: int, skill_file_uploads: List[Dict[str, Any]]) -> bool:
+    """
+    Merge skill file uploads into an existing message's minio_files field.
+
+    Args:
+        message_id: Message ID to update
+        skill_file_uploads: List of skill file upload metadata dicts to append
+
+    Returns:
+        bool: True if the message was updated, False if the message was not found
+    """
+    with get_db_session() as session:
+        message_id = int(message_id)
+
+        stmt = select(ConversationMessage).where(
+            ConversationMessage.message_id == message_id,
+            ConversationMessage.delete_flag == 'N'
+        )
+        record = session.scalars(stmt).first()
+        if not record:
+            return False
+
+        existing = record.minio_files
+        if existing:
+            try:
+                if isinstance(existing, str):
+                    existing = json.loads(existing)
+            except (json.JSONDecodeError, TypeError):
+                existing = []
+        else:
+            existing = []
+
+        existing.extend(skill_file_uploads)
+        record.minio_files = json.dumps(existing, ensure_ascii=False)
+
+        return True
diff --git a/backend/database/db_models.py b/backend/database/db_models.py
index b779266c9..5450b5f74 100644
--- a/backend/database/db_models.py
+++ b/backend/database/db_models.py
@@ -15,6 +15,8 @@
 _TENANT_ID_DOC = "Tenant ID for multi-tenancy isolation"
 
 # Base class for tables without audit fields
+
+
 class SimpleTableBase(DeclarativeBase):
     pass
 
@@ -297,13 +299,16 @@ class AgentInfo(TableBase):
 
     agent_id = Column(Integer, Sequence(
         "ag_tenant_agent_t_agent_id_seq", schema=SCHEMA), nullable=False, primary_key=True, autoincrement=True, doc="ID")
-    version_no = Column(Integer, default=0, nullable=False, primary_key=True, doc="Version number. 0 = draft/editing state, >=1 = published snapshot")
+    version_no = Column(Integer, default=0, nullable=False, primary_key=True,
+                        doc="Version number. 0 = draft/editing state, >=1 = published snapshot")
     name = Column(String(100), doc="Agent name")
     display_name = Column(String(100), doc="Agent display name")
     description = Column(Text, doc="Description")
     author = Column(String(100), doc="Agent author")
-    model_name = Column(String(100), doc="[DEPRECATED] Name of the model used, use model_id instead")
-    model_id = Column(Integer, doc="Model ID, foreign key reference to model_record_t.model_id")
+    model_name = Column(
+        String(100), doc="[DEPRECATED] Name of the model used, use model_id instead")
+    model_id = Column(
+        Integer, doc="Model ID, foreign key reference to model_record_t.model_id")
     max_steps = Column(Integer, doc="Maximum number of steps")
     duty_prompt = Column(Text, doc="Duty prompt content")
     constraint_prompt = Column(Text, doc="Constraint prompt content")
@@ -315,15 +320,22 @@ class AgentInfo(TableBase):
         Boolean, doc="Whether to provide the running summary to the manager agent")
     business_description = Column(
         Text, doc="Manually entered by the user to describe the entire business process")
-    business_logic_model_name = Column(String(100), doc="Model name used for business logic prompt generation")
-    business_logic_model_id = Column(Integer, doc="Model ID used for business logic prompt generation, foreign key reference to model_record_t.model_id")
-    prompt_template_id = Column(Integer, doc="Prompt template ID used for business logic prompt generation")
-    prompt_template_name = Column(String(100), doc="Prompt template name used for business logic prompt generation")
+    business_logic_model_name = Column(
+        String(100), doc="Model name used for business logic prompt generation")
+    business_logic_model_id = Column(
+        Integer, doc="Model ID used for business logic prompt generation, foreign key reference to model_record_t.model_id")
+    prompt_template_id = Column(
+        Integer, doc="Prompt template ID used for business logic prompt generation")
+    prompt_template_name = Column(String(
+        100), doc="Prompt template name used for business logic prompt generation")
     group_ids = Column(String, doc="Agent group IDs list")
     is_new = Column(Boolean, default=False, doc="Whether this agent is marked as new for the user")
     current_version_no = Column(Integer, nullable=True, doc="Current published version number. NULL means no version published yet")
     ingroup_permission = Column(String(30), doc="In-group permission: EDIT, READ_ONLY, PRIVATE")
     enable_context_manager = Column(Boolean, default=False, doc="Whether to enable context management (compression) for this agent")
+    verification_config = Column(JSONB, doc="Layered ReAct self-verification configuration")
+    greeting_message = Column(Text, doc="Agent greeting message displayed on chat initial screen")
+    example_questions = Column(JSONB, doc="List of example questions for starting a conversation with this agent")
 
 
 class PromptTemplate(TableBase):
@@ -352,12 +364,15 @@ class PromptTemplate(TableBase):
 
     template_id = Column(Integer, Sequence(
         "ag_prompt_template_t_template_id_seq", schema=SCHEMA), primary_key=True, nullable=False, autoincrement=True, doc="Prompt template ID")
-    template_name = Column(String(100), nullable=False, doc="Prompt template name")
+    template_name = Column(String(100), nullable=False,
+                           doc="Prompt template name")
     description = Column(String(500), doc="Prompt template description")
-    template_type = Column(String(50), nullable=False, default="agent_generate", doc="Prompt template type")
+    template_type = Column(String(50), nullable=False,
+                           default="agent_generate", doc="Prompt template type")
     tenant_id = Column(String(100), nullable=False, doc="Tenant ID")
     user_id = Column(String(100), nullable=False, doc="User ID")
-    template_content_zh = Column(JSONB, nullable=False, doc="Chinese prompt template content")
+    template_content_zh = Column(
+        JSONB, nullable=False, doc="Chinese prompt template content")
     template_content_en = Column(JSONB, doc="English prompt template content")
 
 
@@ -381,7 +396,8 @@ class ToolInstance(TableBase):
     user_id = Column(String(100), doc="User ID")
     tenant_id = Column(String(100), doc="Tenant ID")
     enabled = Column(Boolean, doc="Enabled")
-    version_no = Column(Integer, default=0, primary_key=True, nullable=False, doc="Version number. 0 = draft/editing state, >=1 = published snapshot")
+    version_no = Column(Integer, default=0, primary_key=True, nullable=False,
+                        doc="Version number. 0 = draft/editing state, >=1 = published snapshot")
 
 
 class KnowledgeRecord(TableBase):
@@ -397,18 +413,25 @@ class KnowledgeRecord(TableBase):
     knowledge_name = Column(String(100), doc="User-facing knowledge base name")
     knowledge_describe = Column(String(3000), doc="Knowledge base description")
     knowledge_sources = Column(String(300), doc="Knowledge base sources")
-    embedding_model_name = Column(String(200), doc="Embedding model name, used to record the embedding model used by the knowledge base")
-    embedding_model_id = Column(Integer, doc="Embedding model ID, foreign key reference to model_record_t.model_id")
+    embedding_model_name = Column(String(
+        200), doc="Embedding model name, used to record the embedding model used by the knowledge base")
+    embedding_model_id = Column(
+        Integer, doc="Embedding model ID, foreign key reference to model_record_t.model_id")
     tenant_id = Column(String(100), doc="Tenant ID")
     group_ids = Column(String, doc="Knowledge base group IDs list")
     ingroup_permission = Column(
         String(30), doc="In-group permission: EDIT, READ_ONLY, PRIVATE")
     summary_frequency = Column(String(10), nullable=True,
-        doc="Auto-summary frequency: '3h', '5h', '1d', '1w', or NULL (disabled)")
+                               doc="Auto-summary frequency: '3h', '5h', '1d', '1w', or NULL (disabled)")
     last_summary_time = Column(TIMESTAMP(timezone=False), nullable=True,
-        doc="Timestamp of last summary generation")
+                               doc="Timestamp of last summary generation")
     last_doc_update_time = Column(TIMESTAMP(timezone=False), nullable=True,
-        doc="Timestamp of last document add/delete operation")
+                                  doc="Timestamp of last document add/delete operation")
+    preserve_source_file = Column(
+        Boolean,
+        default=True,
+        doc="Whether to preserve uploaded source documents after vectorization",
+    )
 
 
 class TenantConfig(TableBase):
@@ -481,7 +504,8 @@ class McpRecord(TableBase):
         doc="Custom HTTP headers as JSON object for MCP server requests",
         default=None,
     )
-    source = Column(String(30), doc="Source type: local/mcp_registry/community")
+    source = Column(
+        String(30), doc="Source type: local/mcp_registry/community")
     registry_json = Column(JSONB, doc="Full MCP registry server.json snapshot")
     config_json = Column(JSON, doc="MCP config data")
     enabled = Column(Boolean, default=True, doc="Enabled")
@@ -509,11 +533,13 @@ class McpCommunityRecord(TableBase):
     source = Column(String(30), doc="Source type, fixed to community")
     version = Column(String(50), doc="MCP version")
     registry_json = Column(JSONB, doc="Full MCP metadata JSON")
-    transport_type = Column(String(30), doc="Transport type: http/sse/container")
+    transport_type = Column(
+        String(30), doc="Transport type: http/sse/container")
     config_json = Column(JSON, doc="Public-shareable MCP configuration JSON")
     tags = Column(ARRAY(Text), doc="Tags")
     description = Column(Text, doc="Description")
 
+
 class UserTenant(TableBase):
     """
     User and tenant relationship table
@@ -525,7 +551,8 @@ class UserTenant(TableBase):
                             primary_key=True, nullable=False, doc="User tenant relationship ID, unique primary key")
     user_id = Column(String(100), nullable=False, doc="User ID")
     tenant_id = Column(String(100), nullable=False, doc="Tenant ID")
-    user_role = Column(String(30), doc="User role: SUPER_ADMIN, ADMIN, DEV, USER")
+    user_role = Column(
+        String(30), doc="User role: SUPER_ADMIN, ADMIN, DEV, USER")
     user_email = Column(String(255), doc="User email address")
 
 
@@ -536,11 +563,18 @@ class AgentRelation(TableBase):
     __tablename__ = "ag_agent_relation_t"
     __table_args__ = {"schema": SCHEMA}
 
-    relation_id = Column(Integer, Sequence("ag_agent_relation_t_relation_id_seq", schema=SCHEMA), primary_key=True, nullable=False, doc="Relationship ID, primary key")
-    selected_agent_id = Column(Integer, primary_key=True, doc="Selected agent ID")
+    relation_id = Column(Integer, Sequence("ag_agent_relation_t_relation_id_seq", schema=SCHEMA),
+                         primary_key=True, nullable=False, doc="Relationship ID, primary key")
+    selected_agent_id = Column(
+        Integer, primary_key=True, doc="Selected agent ID")
     parent_agent_id = Column(Integer, doc="Parent agent ID")
     tenant_id = Column(String(100), doc="Tenant ID")
-    version_no = Column(Integer, default=0, nullable=False, doc="Version number. 0 = draft/editing state, >=1 = published snapshot")
+    version_no = Column(Integer, default=0, nullable=False,
+                        doc="Version number. 0 = draft/editing state, >=1 = published snapshot")
+    selected_agent_version_no = Column(
+        Integer, nullable=True,
+        doc="Pinned version of selected_agent_id. NULL = runtime fallback to child current_version_no",
+    )
 
 
 class PartnerMappingId(TableBase):
@@ -656,13 +690,51 @@ class AgentVersion(TableBase):
                 primary_key=True, nullable=False, doc=_PRIMARY_KEY_DOC)
     tenant_id = Column(String(100), nullable=False, doc="Tenant ID")
     agent_id = Column(Integer, nullable=False, doc="Agent ID")
-    version_no = Column(Integer, nullable=False, doc="Version number, starts from 1. Does not include 0 (draft)")
-    version_name = Column(String(100), doc="User-defined version name for display")
+    version_no = Column(Integer, nullable=False,
+                        doc="Version number, starts from 1. Does not include 0 (draft)")
+    version_name = Column(
+        String(100), doc="User-defined version name for display")
     release_note = Column(Text, doc="Release notes / publish remarks")
-    source_version_no = Column(Integer, doc="Source version number. If this version is a rollback, record the source version")
-    source_type = Column(String(30), doc="Source type: NORMAL (normal publish) / ROLLBACK (rollback and republish)")
-    status = Column(String(30), default="RELEASED", doc="Version status: RELEASED / DISABLED / ARCHIVED")
-    is_a2a = Column(Boolean, default=False, doc="Whether this version is published as an A2A Server agent")
+    source_version_no = Column(
+        Integer, doc="Source version number. If this version is a rollback, record the source version")
+    source_type = Column(String(
+        30), doc="Source type: NORMAL (normal publish) / ROLLBACK (rollback and republish)")
+    status = Column(String(30), default="RELEASED",
+                    doc="Version status: RELEASED / DISABLED / ARCHIVED")
+    is_a2a = Column(Boolean, default=False,
+                    doc="Whether this version is published as an A2A Server agent")
+
+
+class AgentRepository(TableBase):
+    """
+    Agent repository (marketplace) table. Frozen snapshot of a published agent tree for sharing.
+    """
+    __tablename__ = "ag_agent_repository_t"
+    __table_args__ = {"schema": SCHEMA}
+
+    agent_repository_id = Column(BigInteger, Sequence("ag_agent_repository_t_agent_repository_id_seq", schema=SCHEMA),
+                                 primary_key=True, nullable=False, doc="Agent repository listing ID, unique primary key")
+    publisher_tenant_id = Column(String(100), nullable=False, doc="Publisher tenant ID")
+    publisher_user_id = Column(String(100), nullable=False, doc="Publisher user ID")
+    agent_id = Column(Integer, nullable=False,
+                      doc="Root agent ID from ag_tenant_agent_t; upsert key")
+    source_version_no = Column(Integer, nullable=False,
+                               doc="Published version number frozen at share time")
+    name = Column(String(100), nullable=False,
+                  doc="Root agent programmatic name for display and search")
+    display_name = Column(String(100), doc="Root agent display name")
+    description = Column(Text, doc="Root agent description")
+    author = Column(String(100), doc="Agent author")
+    category_id = Column(Integer, doc="Optional marketplace category ID")
+    tags = Column(ARRAY(Text), doc="Marketplace tags")
+    tool_count = Column(Integer,
+                        doc="Total tool count across all agents in the bundle (display only)")
+    version_label = Column(String(100),
+                           doc="Repository entry version label for display (e.g. v1.0)")
+    agent_info_json = Column(JSONB, nullable=False,
+                             doc="Frozen ExportAndImportDataFormat snapshot with optional skills")
+    status = Column(String(30), default="NOT_SHARED",
+                    doc="Listing status: NOT_SHARED (未共享) / PENDING_REVIEW (待审核) / REJECTED (审核驳回) / SHARED (已共享)")
 
 
 class UserTokenInfo(TableBase):
@@ -675,7 +747,8 @@ class UserTokenInfo(TableBase):
     token_id = Column(Integer, Sequence("user_token_info_t_token_id_seq", schema=SCHEMA),
                       primary_key=True, nullable=False, doc="Token ID, unique primary key")
     access_key = Column(String(100), nullable=False, doc="Access Key (AK)")
-    user_id = Column(String(100), nullable=False, doc="User ID who owns this token")
+    user_id = Column(String(100), nullable=False,
+                     doc="User ID who owns this token")
 
 
 class UserTokenUsageLog(TableBase):
@@ -687,16 +760,21 @@ class UserTokenUsageLog(TableBase):
 
     token_usage_id = Column(Integer, Sequence("user_token_usage_log_t_token_usage_id_seq", schema=SCHEMA),
                             primary_key=True, nullable=False, doc="Token usage log ID, unique primary key")
-    token_id = Column(Integer, nullable=False, doc="Foreign key to user_token_info_t.token_id")
-    call_function_name = Column(String(100), doc="API function name being called")
-    related_id = Column(Integer, doc="Related resource ID (e.g., conversation_id)")
-    meta_data = Column(JSONB, doc="Additional metadata for this usage log entry, stored as JSON")
+    token_id = Column(Integer, nullable=False,
+                      doc="Foreign key to user_token_info_t.token_id")
+    call_function_name = Column(
+        String(100), doc="API function name being called")
+    related_id = Column(
+        Integer, doc="Related resource ID (e.g., conversation_id)")
+    meta_data = Column(
+        JSONB, doc="Additional metadata for this usage log entry, stored as JSON")
 
 
 class UserOAuthAccount(TableBase):
     __tablename__ = "user_oauth_account_t"
     __table_args__ = (
-        UniqueConstraint("provider", "provider_user_id", name="uq_oauth_provider_user"),
+        UniqueConstraint("provider", "provider_user_id",
+                         name="uq_oauth_provider_user"),
         {"schema": SCHEMA},
     )
 
@@ -714,11 +792,38 @@ class UserOAuthAccount(TableBase):
     provider_user_id = Column(
         String(200), nullable=False, doc="User ID from the OAuth provider"
     )
-    provider_email = Column(String(255), doc="Email address from the OAuth provider")
-    provider_username = Column(String(200), doc="Display name from the OAuth provider")
+    provider_email = Column(
+        String(255), doc="Email address from the OAuth provider")
+    provider_username = Column(
+        String(200), doc="Display name from the OAuth provider")
     tenant_id = Column(String(100), doc="Tenant ID at time of linking")
 
 
+class UserCasSession(TableBase):
+    __tablename__ = "user_cas_session_t"
+    __table_args__ = (
+        Index("ix_user_cas_session_session_id", "session_id"),
+        Index("ix_user_cas_session_user_id", "user_id"),
+        Index("ix_user_cas_session_cas_user_id", "cas_user_id"),
+        {"schema": SCHEMA},
+    )
+
+    cas_session_id = Column(
+        Integer,
+        Sequence("user_cas_session_t_cas_session_id_seq", schema=SCHEMA),
+        primary_key=True,
+        nullable=False,
+        doc="CAS session record ID",
+    )
+    session_id = Column(String(100), nullable=False, unique=True, doc="JWT session ID")
+    user_id = Column(String(100), nullable=False, doc="Supabase user UUID")
+    cas_user_id = Column(String(200), nullable=False, doc="User ID from CAS")
+    cas_session_index = Column(String(500), doc="CAS SessionIndex or service ticket")
+    status = Column(String(30), nullable=False, default="active", doc="active/revoked")
+    expires_at = Column(TIMESTAMP(timezone=False), nullable=False, doc="Session expiration time")
+    revoked_at = Column(TIMESTAMP(timezone=False), doc="Revocation time")
+
+
 class SkillInfo(TableBase):
     """
     Skill information table - stores skill metadata and content.
@@ -728,13 +833,17 @@ class SkillInfo(TableBase):
 
     skill_id = Column(Integer, Sequence("ag_skill_info_t_skill_id_seq", schema=SCHEMA),
                       primary_key=True, nullable=False, autoincrement=True, doc="Skill ID")
-    skill_name = Column(String(100), nullable=False, unique=True, doc="Unique skill name")
-    tenant_id = Column(String(100), nullable=True, doc="Tenant ID for multi-tenancy. NULL for pre-existing skills.")
+    skill_name = Column(String(100), nullable=False,
+                        unique=True, doc="Unique skill name")
+    tenant_id = Column(String(100), nullable=True,
+                       doc="Tenant ID for multi-tenancy. NULL for pre-existing skills.")
     skill_description = Column(String(1000), doc="Skill description")
     skill_tags = Column(JSON, doc="Skill tags as JSON array")
     skill_content = Column(Text, doc="Skill content in markdown format")
-    config_schemas = Column(JSON, doc="Parameter metadata from config/schema.yaml")
-    config_values = Column(JSON, doc="Runtime parameter values from config/config.yaml")
+    config_schemas = Column(
+        JSON, doc="Parameter metadata from config/schema.yaml")
+    config_values = Column(
+        JSON, doc="Runtime parameter values from config/config.yaml")
     source = Column(String(30), nullable=False, default="official",
                     doc="Skill source: official, custom, etc.")
 
@@ -748,8 +857,10 @@ class SkillToolRelation(TableBase):
 
     rel_id = Column(Integer, Sequence("ag_skill_tools_rel_t_rel_id_seq", schema=SCHEMA),
                     primary_key=True, nullable=False, autoincrement=True, doc="Relation ID")
-    skill_id = Column(Integer, nullable=False, doc="Foreign key to ag_skill_info_t.skill_id")
-    tool_id = Column(Integer, nullable=False, doc="Foreign key to ag_tool_info_t.tool_id")
+    skill_id = Column(Integer, nullable=False,
+                      doc="Foreign key to ag_skill_info_t.skill_id")
+    tool_id = Column(Integer, nullable=False,
+                     doc="Foreign key to ag_tool_info_t.tool_id")
 
 
 class SkillInstance(TableBase):
@@ -768,14 +879,19 @@ class SkillInstance(TableBase):
         nullable=False,
         doc="Skill instance ID"
     )
-    skill_id = Column(Integer, nullable=False, doc="Foreign key to ag_skill_info_t.skill_id")
+    skill_id = Column(Integer, nullable=False,
+                      doc="Foreign key to ag_skill_info_t.skill_id")
     agent_id = Column(Integer, nullable=False, doc="Agent ID")
     user_id = Column(String(100), doc="User ID")
     tenant_id = Column(String(100), doc="Tenant ID")
-    enabled = Column(Boolean, default=True, doc="Whether this skill is enabled for the agent")
-    version_no = Column(Integer, default=0, primary_key=True, nullable=False, doc="Version number. 0 = draft/editing state, >=1 = published snapshot")
-    config_values = Column(JSON, doc="Per-agent runtime parameter values (mirrors ag_tool_instance_t.params)")
-    config_schemas = Column(JSON, doc="Per-agent parameter schema overrides from config/schema.yaml")
+    enabled = Column(Boolean, default=True,
+                     doc="Whether this skill is enabled for the agent")
+    version_no = Column(Integer, default=0, primary_key=True, nullable=False,
+                        doc="Version number. 0 = draft/editing state, >=1 = published snapshot")
+    config_values = Column(
+        JSON, doc="Per-agent runtime parameter values (mirrors ag_tool_instance_t.params)")
+    config_schemas = Column(
+        JSON, doc="Per-agent parameter schema overrides from config/schema.yaml")
 
 
 class OuterApiService(TableBase):
@@ -788,13 +904,16 @@ class OuterApiService(TableBase):
 
     id = Column(BigInteger, Sequence("ag_outer_api_services_id_seq", schema=SCHEMA),
                 primary_key=True, nullable=False, doc="Service ID, unique primary key")
-    mcp_service_name = Column(String(100), nullable=False, doc="MCP service name (unique identifier per tenant)")
+    mcp_service_name = Column(String(100), nullable=False,
+                              doc="MCP service name (unique identifier per tenant)")
     description = Column(Text, doc="Service description from OpenAPI info")
     openapi_json = Column(JSONB, doc="Complete OpenAPI JSON specification")
     server_url = Column(String(500), doc="Base URL of the REST API server")
     headers_template = Column(JSONB, doc="Default headers template as JSON")
-    tenant_id = Column(String(100), nullable=False, doc="Tenant ID for multi-tenancy")
-    is_available = Column(Boolean, default=True, doc="Whether the service is available")
+    tenant_id = Column(String(100), nullable=False,
+                       doc="Tenant ID for multi-tenancy")
+    is_available = Column(Boolean, default=True,
+                          doc="Whether the service is available")
 
 
 # Alias for backward compatibility
@@ -809,27 +928,37 @@ class A2ANacosConfig(TableBase):
     __tablename__ = "ag_a2a_nacos_config_t"
     __table_args__ = {"schema": SCHEMA}
 
-    id = Column(BigInteger, primary_key=True, autoincrement=True, doc=_PRIMARY_KEY_DOC)
-    config_id = Column(String(64), unique=True, nullable=False, doc="Unique config identifier for API reference")
+    id = Column(BigInteger, primary_key=True,
+                autoincrement=True, doc=_PRIMARY_KEY_DOC)
+    config_id = Column(String(64), unique=True, nullable=False,
+                       doc="Unique config identifier for API reference")
 
     # Nacos connection
-    nacos_addr = Column(String(512), nullable=False, doc="Nacos server address, e.g., http://nacos-server:8848")
-    nacos_username = Column(String(100), doc="Nacos username for authentication")
-    nacos_password = Column(String(256), doc="Nacos password, encrypted at rest")
+    nacos_addr = Column(String(512), nullable=False,
+                        doc="Nacos server address, e.g., http://nacos-server:8848")
+    nacos_username = Column(
+        String(100), doc="Nacos username for authentication")
+    nacos_password = Column(
+        String(256), doc="Nacos password, encrypted at rest")
 
     # Discovery scope
-    namespace_id = Column(String(100), default="public", doc="Nacos namespace for service discovery")
+    namespace_id = Column(String(100), default="public",
+                          doc="Nacos namespace for service discovery")
 
     # Metadata
-    name = Column(String(100), nullable=False, doc="Display name for this Nacos config")
+    name = Column(String(100), nullable=False,
+                  doc="Display name for this Nacos config")
     description = Column(Text, doc="Description of this Nacos configuration")
 
     # Tenant isolation
-    tenant_id = Column(String(100), nullable=False, doc="Tenant ID for multi-tenancy")
+    tenant_id = Column(String(100), nullable=False,
+                       doc="Tenant ID for multi-tenancy")
 
     # Status
-    is_active = Column(Boolean, default=True, doc="Whether this Nacos config is active")
-    last_scan_at = Column(TIMESTAMP(timezone=False), doc="Last time a scan was performed using this config")
+    is_active = Column(Boolean, default=True,
+                       doc="Whether this Nacos config is active")
+    last_scan_at = Column(TIMESTAMP(timezone=False),
+                          doc="Last time a scan was performed using this config")
 
 
 class A2AExternalAgent(TableBase):
@@ -840,39 +969,49 @@ class A2AExternalAgent(TableBase):
     __tablename__ = "ag_a2a_external_agent_t"
     __table_args__ = {"schema": SCHEMA}
 
-    id = Column(BigInteger, primary_key=True, autoincrement=True, doc=_PRIMARY_KEY_DOC)
+    id = Column(BigInteger, primary_key=True,
+                autoincrement=True, doc=_PRIMARY_KEY_DOC)
 
     # Agent metadata (cached from Agent Card)
-    name = Column(String(255), nullable=False, doc="Agent name from Agent Card")
+    name = Column(String(255), nullable=False,
+                  doc="Agent name from Agent Card")
     description = Column(Text, doc="Agent description from Agent Card")
-    version = Column(String(50), doc="Agent version from Agent Card, e.g., 1.2.0")
+    version = Column(
+        String(50), doc="Agent version from Agent Card, e.g., 1.2.0")
 
     # Primary interface (extracted from supportedInterfaces for quick access)
     # In A2A 1.0, this should store the http-json-rpc URL
-    agent_url = Column(String(512), nullable=False, doc="Primary A2A endpoint URL (http-json-rpc by default)")
+    agent_url = Column(String(512), nullable=False,
+                       doc="Primary A2A endpoint URL (http-json-rpc by default)")
 
     # Protocol type for calling this agent: JSONRPC, HTTP+JSON, GRPC
-    protocol_type = Column(String(20), default=PROTOCOL_JSONRPC, doc="Protocol type for calling this agent")
+    protocol_type = Column(String(20), default=PROTOCOL_JSONRPC,
+                           doc="Protocol type for calling this agent")
 
     # Capabilities
-    streaming = Column(Boolean, default=False, doc="Whether this agent supports SSE streaming")
+    streaming = Column(Boolean, default=False,
+                       doc="Whether this agent supports SSE streaming")
 
     # All supported interfaces (full JSON array from Agent Card)
     # Format: [{protocolBinding, url, protocolVersion}, ...]
     supported_interfaces = Column(JSON, doc="All supported interfaces array")
 
     # Source information
-    source_type = Column(String(20), nullable=False, doc="Discovery source: url or nacos")
+    source_type = Column(String(20), nullable=False,
+                         doc="Discovery source: url or nacos")
 
     # For URL mode
     source_url = Column(String(512), doc="Direct URL to agent card")
 
     # For Nacos mode
-    nacos_config_id = Column(String(64), doc="Reference to Nacos config used for discovery")
-    nacos_agent_name = Column(String(255), doc="Original name used for Nacos query")
+    nacos_config_id = Column(
+        String(64), doc="Reference to Nacos config used for discovery")
+    nacos_agent_name = Column(
+        String(255), doc="Original name used for Nacos query")
 
     # Base URL for infrastructure health checks
-    base_url = Column(String(512), doc="Base URL for health checks (service root address), e.g., http://agent:8080")
+    base_url = Column(String(
+        512), doc="Base URL for health checks (service root address), e.g., http://agent:8080")
 
     # Tenant isolation
     tenant_id = Column(String(100), nullable=False, doc=_TENANT_ID_DOC)
@@ -881,13 +1020,18 @@ class A2AExternalAgent(TableBase):
     raw_card = Column(JSON, doc="Full original Agent Card JSON from discovery")
 
     # Cache management
-    cached_at = Column(TIMESTAMP(timezone=False), doc="Timestamp when Agent Card was cached")
-    cache_expires_at = Column(TIMESTAMP(timezone=False), doc="Timestamp when cache expires")
+    cached_at = Column(TIMESTAMP(timezone=False),
+                       doc="Timestamp when Agent Card was cached")
+    cache_expires_at = Column(
+        TIMESTAMP(timezone=False), doc="Timestamp when cache expires")
 
     # Health check status
-    is_available = Column(Boolean, default=True, doc="Whether this agent is currently reachable")
-    last_check_at = Column(TIMESTAMP(timezone=False), doc="Last health check timestamp")
-    last_check_result = Column(String(50), doc="Last health check result: OK, ERROR, TIMEOUT")
+    is_available = Column(Boolean, default=True,
+                          doc="Whether this agent is currently reachable")
+    last_check_at = Column(TIMESTAMP(timezone=False),
+                           doc="Last health check timestamp")
+    last_check_result = Column(
+        String(50), doc="Last health check result: OK, ERROR, TIMEOUT")
 
 
 class A2AExternalAgentRelation(TableBase):
@@ -905,19 +1049,23 @@ class A2AExternalAgentRelation(TableBase):
         {"schema": SCHEMA},
     )
 
-    id = Column(BigInteger, primary_key=True, autoincrement=True, doc=_PRIMARY_KEY_DOC)
+    id = Column(BigInteger, primary_key=True,
+                autoincrement=True, doc=_PRIMARY_KEY_DOC)
 
     # Local agent (parent)
-    local_agent_id = Column(Integer, nullable=False, doc="Local parent agent ID")
+    local_agent_id = Column(Integer, nullable=False,
+                            doc="Local parent agent ID")
 
     # External A2A agent (sub-agent) - FK to ag_a2a_external_agent_t.id
-    external_agent_id = Column(BigInteger, nullable=False, doc="External A2A agent ID (FK to ag_a2a_external_agent_t.id)")
+    external_agent_id = Column(
+        BigInteger, nullable=False, doc="External A2A agent ID (FK to ag_a2a_external_agent_t.id)")
 
     # Tenant isolation
     tenant_id = Column(String(100), nullable=False, doc=_TENANT_ID_DOC)
 
     # Status
-    is_enabled = Column(Boolean, default=True, doc="Whether this relation is active")
+    is_enabled = Column(Boolean, default=True,
+                        doc="Whether this relation is active")
 
 
 class A2AServerAgent(TableBase):
@@ -928,7 +1076,8 @@ class A2AServerAgent(TableBase):
     __tablename__ = "ag_a2a_server_agent_t"
     __table_args__ = {"schema": SCHEMA}
 
-    id = Column(BigInteger, primary_key=True, autoincrement=True, doc=_PRIMARY_KEY_DOC)
+    id = Column(BigInteger, primary_key=True,
+                autoincrement=True, doc=_PRIMARY_KEY_DOC)
 
     # Link to local agent
     agent_id = Column(Integer, nullable=False, doc="Local agent ID")
@@ -938,35 +1087,44 @@ class A2AServerAgent(TableBase):
     tenant_id = Column(String(100), nullable=False, doc=_TENANT_ID_DOC)
 
     # Generated endpoint ID
-    endpoint_id = Column(String(64), unique=True, nullable=False, doc="Generated endpoint ID")
+    endpoint_id = Column(String(64), unique=True,
+                         nullable=False, doc="Generated endpoint ID")
 
     # Basic info (extracted from local agent, can be overridden)
-    name = Column(String(255), nullable=False, doc="Agent name exposed in Agent Card")
+    name = Column(String(255), nullable=False,
+                  doc="Agent name exposed in Agent Card")
     description = Column(Text, doc="Agent description exposed in Agent Card")
     version = Column(String(50), doc="Agent version exposed in Agent Card")
 
     # Primary endpoint URL (http-json-rpc by default)
-    agent_url = Column(String(512), doc="Primary A2A endpoint URL (http-json-rpc by default)")
+    agent_url = Column(
+        String(512), doc="Primary A2A endpoint URL (http-json-rpc by default)")
 
     # Capabilities
-    streaming = Column(Boolean, default=False, doc="Whether this agent supports SSE streaming")
+    streaming = Column(Boolean, default=False,
+                       doc="Whether this agent supports SSE streaming")
 
     # All supported interfaces (A2A 1.0 compliant)
     # Format: [{protocolBinding, url, protocolVersion}, ...]
-    supported_interfaces = Column(JSON, doc="All supported interfaces: [{protocolBinding, url, protocolVersion}, ...]")
+    supported_interfaces = Column(
+        JSON, doc="All supported interfaces: [{protocolBinding, url, protocolVersion}, ...]")
 
     # Agent Card customization (partial overrides only)
-    card_overrides = Column(JSON, doc="User customizations for Agent Card (partial override)")
+    card_overrides = Column(
+        JSON, doc="User customizations for Agent Card (partial override)")
 
     # A2A Server status
-    is_enabled = Column(Boolean, default=False, doc="Whether A2A Server is enabled for this agent")
+    is_enabled = Column(Boolean, default=False,
+                        doc="Whether A2A Server is enabled for this agent")
 
     # Raw Agent Card (generated from settings, for debugging)
     raw_card = Column(JSON, doc="Generated Agent Card JSON (for debugging)")
 
     # Publishing timestamps
-    published_at = Column(TIMESTAMP(timezone=False), doc="Timestamp when A2A Server was last enabled")
-    unpublished_at = Column(TIMESTAMP(timezone=False), doc="Timestamp when A2A Server was disabled")
+    published_at = Column(TIMESTAMP(timezone=False),
+                          doc="Timestamp when A2A Server was last enabled")
+    unpublished_at = Column(TIMESTAMP(timezone=False),
+                            doc="Timestamp when A2A Server was disabled")
 
 
 class A2ATask(SimpleTableBase):
@@ -979,7 +1137,8 @@ class A2ATask(SimpleTableBase):
 
     # Core identifiers (following A2A spec)
     id = Column(String(64), primary_key=True, doc="Task ID (A2A spec: taskId)")
-    context_id = Column(String(64), doc="Context ID for grouping related tasks")
+    context_id = Column(
+        String(64), doc="Context ID for grouping related tasks")
 
     # Endpoint and caller info
     endpoint_id = Column(String(64), nullable=False, doc="Endpoint ID")
@@ -990,16 +1149,21 @@ class A2ATask(SimpleTableBase):
     raw_request = Column(JSON, doc="Original A2A request payload")
 
     # Task state (following A2A TaskState enum)
-    task_state = Column(String(50), nullable=False, server_default="TASK_STATE_SUBMITTED", doc="Task state: TASK_STATE_SUBMITTED, TASK_STATE_WORKING, TASK_STATE_COMPLETED, TASK_STATE_FAILED, TASK_STATE_CANCELED, TASK_STATE_INPUT_REQUIRED, TASK_STATE_REJECTED, TASK_STATE_AUTH_REQUIRED")
-    state_timestamp = Column(TIMESTAMP(timezone=False), doc="Task state last update timestamp")
+    task_state = Column(String(50), nullable=False, server_default="TASK_STATE_SUBMITTED",
+                        doc="Task state: TASK_STATE_SUBMITTED, TASK_STATE_WORKING, TASK_STATE_COMPLETED, TASK_STATE_FAILED, TASK_STATE_CANCELED, TASK_STATE_INPUT_REQUIRED, TASK_STATE_REJECTED, TASK_STATE_AUTH_REQUIRED")
+    state_timestamp = Column(TIMESTAMP(timezone=False),
+                             doc="Task state last update timestamp")
 
     # Task result
     result_data = Column(JSON, doc="Task final result data")
 
     # Timestamps
-    create_time = Column(TIMESTAMP(timezone=False), server_default=func.now(), doc="Task creation timestamp")
-    update_time = Column(TIMESTAMP(timezone=False), server_default=func.now(), onupdate=func.now(), doc="Task last update timestamp")
-    completed_at = Column(TIMESTAMP(timezone=False), doc="Task completion timestamp")
+    create_time = Column(TIMESTAMP(timezone=False),
+                         server_default=func.now(), doc="Task creation timestamp")
+    update_time = Column(TIMESTAMP(timezone=False), server_default=func.now(
+    ), onupdate=func.now(), doc="Task last update timestamp")
+    completed_at = Column(TIMESTAMP(timezone=False),
+                          doc="Task completion timestamp")
 
 
 class A2AMessage(SimpleTableBase):
@@ -1011,23 +1175,30 @@ class A2AMessage(SimpleTableBase):
     __table_args__ = {"schema": SCHEMA}
 
     # Core identifiers (following A2A spec)
-    message_id = Column(String(64), primary_key=True, doc="Message ID (A2A spec: messageId)")
-    task_id = Column(String(64), nullable=True, doc="Task ID this message belongs to (nullable for standalone/simple requests)")
+    message_id = Column(String(64), primary_key=True,
+                        doc="Message ID (A2A spec: messageId)")
+    task_id = Column(String(64), nullable=True,
+                     doc="Task ID this message belongs to (nullable for standalone/simple requests)")
 
     # Message attributes
-    message_index = Column(Integer, nullable=False, doc="Order of message in the conversation")
-    role = Column(String(20), nullable=False, doc="Message sender role: user or agent")
+    message_index = Column(Integer, nullable=False,
+                           doc="Order of message in the conversation")
+    role = Column(String(20), nullable=False,
+                  doc="Message sender role: user or agent")
 
     # Message content (following A2A Part structure)
-    parts = Column(JSON, nullable=False, doc="Message parts following A2A Part structure")
+    parts = Column(JSON, nullable=False,
+                   doc="Message parts following A2A Part structure")
     meta_data = Column(JSON, doc="Optional metadata")
     extensions = Column(JSON, doc="Extension URI list")
 
     # References to other tasks (optional)
-    reference_task_ids = Column(JSON, doc="Referenced task IDs array for multi-turn scenarios")
+    reference_task_ids = Column(
+        JSON, doc="Referenced task IDs array for multi-turn scenarios")
 
     # Timestamp
-    create_time = Column(TIMESTAMP(timezone=False), server_default=func.now(), doc="Message creation timestamp")
+    create_time = Column(TIMESTAMP(
+        timezone=False), server_default=func.now(), doc="Message creation timestamp")
 
 
 class A2AArtifact(SimpleTableBase):
@@ -1039,15 +1210,19 @@ class A2AArtifact(SimpleTableBase):
 
     # Core identifiers (following A2A spec)
     id = Column(String(64), primary_key=True, doc="Internal primary key")
-    artifact_id = Column(String(64), nullable=False, doc="Artifact ID (A2A spec: artifactId)")
-    task_id = Column(String(64), nullable=False, doc="Task ID this artifact belongs to")
+    artifact_id = Column(String(64), nullable=False,
+                         doc="Artifact ID (A2A spec: artifactId)")
+    task_id = Column(String(64), nullable=False,
+                     doc="Task ID this artifact belongs to")
 
     # Artifact attributes
     name = Column(String(255), doc="Human-readable artifact name")
     description = Column(Text, doc="Artifact description")
-    parts = Column(JSON, nullable=False, doc="Artifact parts following A2A Part structure")
+    parts = Column(JSON, nullable=False,
+                   doc="Artifact parts following A2A Part structure")
     meta_data = Column(JSON, doc="Artifact metadata")
     extensions = Column(JSON, doc="Extension URI list")
 
     # Timestamp
-    create_time = Column(TIMESTAMP(timezone=False), server_default=func.now(), doc="Artifact creation timestamp")
+    create_time = Column(TIMESTAMP(
+        timezone=False), server_default=func.now(), doc="Artifact creation timestamp")
diff --git a/backend/database/knowledge_db.py b/backend/database/knowledge_db.py
index 9a8b1c8c1..8fc60d6bd 100644
--- a/backend/database/knowledge_db.py
+++ b/backend/database/knowledge_db.py
@@ -34,6 +34,7 @@ def create_knowledge_record(query: Dict[str, Any]) -> Dict[str, Any]:
             - user_id: Optional user ID for created_by and updated_by fields
             - tenant_id: Optional tenant ID for created_by and updated_by fields
             - embedding_model_name: embedding model name for the knowledge base
+            - preserve_source_file: whether to preserve uploaded source documents (optional)
 
     Returns:
         Dict[str, Any]: Dictionary with at least 'knowledge_id' and 'index_name'
@@ -57,6 +58,7 @@ def create_knowledge_record(query: Dict[str, Any]) -> Dict[str, Any]:
                 "knowledge_name": knowledge_name,
                 "group_ids": convert_list_to_string(group_ids) if isinstance(group_ids, list) else group_ids,
                 "ingroup_permission": query.get("ingroup_permission"),
+                "preserve_source_file": query.get("preserve_source_file", True),
             }
 
             # For backward compatibility: if caller explicitly provides index_name,
@@ -117,11 +119,16 @@ def upsert_knowledge_record(query: Dict[str, Any]) -> Dict[str, Any]:
 
             if existing_record:
                 # Update existing record
-                existing_record.knowledge_name = query.get('knowledge_name') or query.get('index_name')
-                existing_record.knowledge_describe = query.get('knowledge_describe', '')
-                existing_record.knowledge_sources = query.get('knowledge_sources', 'elasticsearch')
-                existing_record.embedding_model_name = query.get('embedding_model_name')
-                existing_record.embedding_model_id = query.get('embedding_model_id')
+                existing_record.knowledge_name = query.get(
+                    'knowledge_name') or query.get('index_name')
+                existing_record.knowledge_describe = query.get(
+                    'knowledge_describe', '')
+                existing_record.knowledge_sources = query.get(
+                    'knowledge_sources', 'elasticsearch')
+                existing_record.embedding_model_name = query.get(
+                    'embedding_model_name')
+                existing_record.embedding_model_id = query.get(
+                    'embedding_model_id')
                 existing_record.updated_by = query.get('user_id')
                 existing_record.update_time = func.current_timestamp()
 
@@ -183,7 +190,7 @@ def update_knowledge_record(query: Dict[str, Any]) -> bool:
             # Update group IDs
             if query.get("group_ids") is not None:
                 record.group_ids = query["group_ids"]
-            
+
             # Update timestamp and user
             if query.get("user_id"):
                 record.updated_by = query["user_id"]
@@ -251,15 +258,17 @@ def get_knowledge_record(query: Optional[Dict[str, Any]] = None) -> Dict[str, An
 
             # Support both index_name and knowledge_name queries
             if 'index_name' in query:
-                db_query = db_query.filter(KnowledgeRecord.index_name == query['index_name'])
+                db_query = db_query.filter(
+                    KnowledgeRecord.index_name == query['index_name'])
             elif 'knowledge_name' in query:
-                db_query = db_query.filter(KnowledgeRecord.knowledge_name == query['knowledge_name'])
+                db_query = db_query.filter(
+                    KnowledgeRecord.knowledge_name == query['knowledge_name'])
 
             # Add tenant_id filter only if it is provided in the query
             if 'tenant_id' in query and query['tenant_id'] is not None:
                 db_query = db_query.filter(
                     KnowledgeRecord.tenant_id == query['tenant_id'])
-            
+
             result = db_query.first()
 
             if result:
diff --git a/backend/database/user_tenant_db.py b/backend/database/user_tenant_db.py
index f1294f8a7..b147eac49 100644
--- a/backend/database/user_tenant_db.py
+++ b/backend/database/user_tenant_db.py
@@ -75,6 +75,37 @@ def insert_user_tenant(user_id: str, tenant_id: str, user_role: str = "USER", us
         session.add(user_tenant)
 
 
+def upsert_user_tenant(user_id: str, tenant_id: str, user_role: str = "USER", user_email: str = None) -> Dict[str, Any]:
+    """
+    Create or update the active user-tenant relationship for an external identity login.
+    """
+    with get_db_session() as session:
+        result = session.query(UserTenant).filter(
+            UserTenant.user_id == user_id,
+            UserTenant.delete_flag == "N"
+        ).first()
+
+        if result:
+            result.tenant_id = tenant_id
+            result.user_role = user_role
+            if user_email is not None:
+                result.user_email = user_email
+            result.updated_by = user_id
+        else:
+            result = UserTenant(
+                user_id=user_id,
+                tenant_id=tenant_id,
+                user_role=user_role,
+                user_email=user_email,
+                created_by=user_id,
+                updated_by=user_id
+            )
+            session.add(result)
+
+        session.flush()
+        return as_dict(result)
+
+
 def get_users_by_tenant_id(tenant_id: str, page: Optional[int] = 1, page_size: Optional[int] = 20,
                            sort_by: str = "created_at", sort_order: str = "desc") -> Dict[str, Any]:
     """
diff --git a/backend/mcp_service.py b/backend/mcp_service.py
index 0d8ab4c1b..4629d42ad 100644
--- a/backend/mcp_service.py
+++ b/backend/mcp_service.py
@@ -70,7 +70,7 @@ async def run(self, arguments: Dict[str, Any]) -> Any:
 
 
 nexent_mcp = FastMCP(name="nexent_mcp")
-nexent_mcp.mount(local_mcp_service.name, local_mcp_service)
+nexent_mcp.mount(local_mcp_service, local_mcp_service.name)
 
 _openapi_mcp_services: Dict[str, FastMCP] = {}
 
@@ -188,7 +188,8 @@ def _sanitize_function_name(name: str) -> str:
 def register_openapi_service(
     service_name: str,
     openapi_json: Dict[str, Any],
-    server_url: str
+    server_url: str,
+    headers_template: Dict[str, str],
 ) -> bool:
     """
     Register an OpenAPI service using FastMCP.from_openapi().
@@ -222,7 +223,7 @@ def register_openapi_service(
             openapi_spec["servers"] = [{"url": server_url}]
 
         # Create HTTP client for the underlying REST API
-        client = httpx.AsyncClient(base_url=server_url, timeout=30.0)
+        client = httpx.AsyncClient(base_url=server_url, timeout=120.0, headers=headers_template)
 
         # Create FastMCP instance from OpenAPI spec
         mcp_server = FastMCP.from_openapi(
@@ -239,7 +240,7 @@ def register_openapi_service(
         _openapi_mcp_services[service_name] = mcp_server
 
         # Mount to the main MCP server
-        nexent_mcp.mount(service_name, mcp_server)
+        nexent_mcp.mount(mcp_server, service_name)
 
         logger.info(f"Registered OpenAPI service: {service_name}")
         return True
@@ -320,13 +321,14 @@ def refresh_openapi_services_by_tenant(tenant_id: str) -> Dict[str, Any]:
         service_name = service.get("mcp_service_name")
         openapi_json = service.get("openapi_json")
         server_url = service.get("server_url")
+        headers_template = service.get("headers_template")
 
         if not openapi_json:
             logger.warning(f"Service '{service_name}' has no OpenAPI JSON, skipping")
             skipped_count += 1
             continue
 
-        if register_openapi_service(service_name, openapi_json, server_url):
+        if register_openapi_service(service_name, openapi_json, server_url, headers_template):
             registered_count += 1
         else:
             skipped_count += 1
@@ -394,6 +396,7 @@ def refresh_single_openapi_service(service_name: str, tenant_id: str) -> Dict[st
     # Re-register with fresh data
     openapi_json = service_data.get("openapi_json")
     server_url = service_data.get("server_url")
+    headers_template = service_data.get("headers_template")
 
     if not openapi_json:
         logger.warning(f"Service '{service_name}' has no OpenAPI JSON")
@@ -403,7 +406,7 @@ def refresh_single_openapi_service(service_name: str, tenant_id: str) -> Dict[st
             "error": "No OpenAPI JSON found"
         }
 
-    success = register_openapi_service(service_name, openapi_json, server_url)
+    success = register_openapi_service(service_name, openapi_json, server_url, headers_template)
     return {
         "status": "refreshed" if success else "error",
         "service_name": service_name,
diff --git a/backend/prompts/managed_system_prompt_template_en.yaml b/backend/prompts/managed_system_prompt_template_en.yaml
index 5c2893c39..62e16e946 100644
--- a/backend/prompts/managed_system_prompt_template_en.yaml
+++ b/backend/prompts/managed_system_prompt_template_en.yaml
@@ -1,6 +1,6 @@
 system_prompt: |-
   ### Basic Information
-  You are {{APP_NAME}}, {{APP_DESCRIPTION}}, it is {{time|default('current time')}} now
+  You are {{APP_NAME}}, {{APP_DESCRIPTION}}
 
   {%- if memory_list and memory_list|length > 0 %}
   ### Contextual Memory
@@ -66,6 +66,11 @@ system_prompt: |-
      - Note that executed code is not visible to users. If users need to see the code, use '<DISPLAY:language_type>code</DISPLAY>' for displaying code.
      - **IMPORTANT**: After code execution, the system will return content with "Observation:" marker (this is the real execution result). Please continue your next thinking based on these real results. **Do NOT fabricate observation results before code execution.**
 
+  3. Self-verification:
+     - After critical events (tool calls, retrieval results, code execution, and final-answer preparation), the system may run explicit verification.
+     - If verification reports errors, insufficient evidence, incomplete parameters, or unreliable results, you must repair the issue, gather more evidence, call tools again, or clearly state what cannot be completed.
+     - The final answer is shown to the user only after verification passes. If the system returns Verification feedback, treat it as a real observation and continue revising.
+
   After thinking, when you believe you can answer the user's question, you can generate a final answer directly to the user without generating code and stop the loop.
 
   When generating the final answer, you need to follow these specifications:
@@ -178,3 +183,13 @@ final_answer:
     Original task: {{task}}
 
     Please provide a clear and concise summary of the work completed so far.
+
+
+verification:
+  pre_messages: |-
+    You are a strict verifier for a ReAct agent. Judge reliability only from the task, candidate answer, tool outputs, and observations. Do not output hidden chain-of-thought.
+    You must output JSON only.
+
+  post_messages: |-
+    Verify whether the candidate answer covers the user's intent, is grounded in observations, handles tool errors, uses trustworthy citations, and is formatted for users.
+    Output fields: passed, score, status, failed_criteria, checks, revision_instruction, user_visible_note.
diff --git a/backend/prompts/managed_system_prompt_template_zh.yaml b/backend/prompts/managed_system_prompt_template_zh.yaml
index 291e336fb..da3d53469 100644
--- a/backend/prompts/managed_system_prompt_template_zh.yaml
+++ b/backend/prompts/managed_system_prompt_template_zh.yaml
@@ -2,7 +2,7 @@ system_prompt: |-
 
   ### 基本信息
 
-  你是{{APP_NAME}}，{{APP_DESCRIPTION}}，现在是{{time|default('当前时间')}}，用户ID为{{user_id}}
+  你是{{APP_NAME}}，{{APP_DESCRIPTION}}，用户ID为{{user_id}}
 
   {%- if memory_list and memory_list|length > 0 %}
   ### 上下文记忆
@@ -130,6 +130,11 @@ system_prompt: |-
      - 注意运行的代码不会被用户看到，所以如果用户需要看到代码，你需要使用'<DISPLAY:语言类型>代码</DISPLAY>'表达展示代码。
      - **重要**：代码执行后，系统会返回 "Observation:" 标记的内容（这是真实的执行结果）。请基于这些真实结果继续下一步思考，**不要在代码执行前自行编造观察结果**。
 
+  3. 自验证：
+     - 关键事件（工具调用、检索结果、代码执行、准备最终回答）后，系统会进行显式自验证。
+     - 如果自验证提示存在错误、证据不足、参数不完整或结果不可靠，必须优先修正、补充证据、重新调用工具，或清晰说明无法完成的部分。
+     - 最终回答只有在自验证通过后才会展示给用户；如果系统返回 Verification feedback，请把它视为真实观察结果继续修正，不要忽略。
+
   在思考结束后，当你认为可以回答用户问题，那么可以不生成代码，直接生成最终回答给到用户并停止循环。
 
   生成最终回答时，你需要遵循以下规范：
@@ -271,3 +276,13 @@ final_answer:
     原始任务：{{task}}
 
     请对迄今为止完成的工作进行清晰、简洁的总结。
+
+
+verification:
+  pre_messages: |-
+    你是 ReAct 智能体的严格验证器。请仅根据任务、候选答案、工具输出和观察结果判断答案是否可靠，不要输出隐藏思维链。
+    你必须只输出 JSON。
+
+  post_messages: |-
+    请验证候选答案是否覆盖用户意图、是否有观察结果支撑、是否处理了工具错误、引用是否可信、格式是否适合展示。
+    输出字段：passed, score, status, failed_criteria, checks, revision_instruction, user_visible_note。
diff --git a/backend/prompts/manager_system_prompt_template_en.yaml b/backend/prompts/manager_system_prompt_template_en.yaml
index 8ce58db29..d44ed9a71 100644
--- a/backend/prompts/manager_system_prompt_template_en.yaml
+++ b/backend/prompts/manager_system_prompt_template_en.yaml
@@ -1,6 +1,6 @@
 system_prompt: |-
   ### Basic Information
-  You are {{APP_NAME}}, {{APP_DESCRIPTION}}, it is {{time|default('current time')}} now
+  You are {{APP_NAME}}, {{APP_DESCRIPTION}}
 
   {%- if memory_list and memory_list|length > 0 %}
   ### Contextual Memory
@@ -67,6 +67,11 @@ system_prompt: |-
      - Note that executed code is not visible to users. If users need to see the code, use '<DISPLAY:language_type>code</DISPLAY>' for displaying code.
      - **IMPORTANT**: After code execution, the system will return content with "Observation:" marker (this is the real execution result). Please continue your next thinking based on these real results. **Do NOT fabricate observation results before code execution.**
 
+  3. Self-verification:
+     - After critical events (tool calls, retrieval results, code execution, agent handoffs, and final-answer preparation), the system may run explicit verification.
+     - If verification reports errors, insufficient evidence, incomplete parameters, or unreliable results, you must repair the issue, gather more evidence, call tools again, or clearly state what cannot be completed.
+     - The final answer is shown to the user only after verification passes. If the system returns Verification feedback, treat it as a real observation and continue revising.
+
   After thinking, when you believe you can answer the user's question, you can generate a final answer directly to the user without generating code and stop the loop.
 
   When generating the final answer, you need to follow these specifications:
@@ -222,3 +227,13 @@ final_answer:
     Original task: {{task}}
 
     Please provide a clear and concise summary of the work completed so far.
+
+
+verification:
+  pre_messages: |-
+    You are a strict verifier for a ReAct agent. Judge reliability only from the task, candidate answer, tool outputs, and observations. Do not output hidden chain-of-thought.
+    You must output JSON only.
+
+  post_messages: |-
+    Verify whether the candidate answer covers the user's intent, is grounded in observations, handles tool errors, uses trustworthy citations, and is formatted for users.
+    Output fields: passed, score, status, failed_criteria, checks, revision_instruction, user_visible_note.
diff --git a/backend/prompts/manager_system_prompt_template_zh.yaml b/backend/prompts/manager_system_prompt_template_zh.yaml
index fc4eb7c0c..a49ced82d 100644
--- a/backend/prompts/manager_system_prompt_template_zh.yaml
+++ b/backend/prompts/manager_system_prompt_template_zh.yaml
@@ -1,6 +1,6 @@
 system_prompt: |-
   ### 基本信息
-  你是{{APP_NAME}}，{{APP_DESCRIPTION}}，现在是{{time|default('当前时间')}}，用户ID为{{user_id}}
+  你是{{APP_NAME}}，{{APP_DESCRIPTION}}，用户ID为{{user_id}}
 
   {%- if memory_list and memory_list|length > 0 %}
   ### 上下文记忆
@@ -130,6 +130,11 @@ system_prompt: |-
      - 注意运行的代码不会被用户看到，所以如果用户需要看到代码，你需要使用'<DISPLAY:语言类型>代码</DISPLAY>'表达展示代码。
      - **重要**：代码执行后，系统会返回 "Observation:" 标记的内容（这是真实的执行结果）。请基于这些真实结果继续下一步思考，**不要在代码执行前自行编造观察结果**。
 
+  3. 自验证：
+     - 关键事件（工具调用、检索结果、代码执行、助手返回、准备最终回答）后，系统会进行显式自验证。
+     - 如果自验证提示存在错误、证据不足、参数不完整或结果不可靠，必须优先修正、补充证据、重新调用工具，或清晰说明无法完成的部分。
+     - 最终回答只有在自验证通过后才会展示给用户；如果系统返回 Verification feedback，请把它视为真实观察结果继续修正，不要忽略。
+
   在思考结束后，当你认为可以回答用户问题，那么可以不生成代码，直接生成最终回答给到用户并停止循环。
 
   生成最终回答时，你需要遵循以下规范：
@@ -299,3 +304,13 @@ final_answer:
     原始任务：{{task}}
 
     请对迄今为止完成的工作进行清晰、简洁的总结。
+
+
+verification:
+  pre_messages: |-
+    你是 ReAct 智能体的严格验证器。请仅根据任务、候选答案、工具输出和观察结果判断答案是否可靠，不要输出隐藏思维链。
+    你必须只输出 JSON。
+
+  post_messages: |-
+    请验证候选答案是否覆盖用户意图、是否有观察结果支撑、是否处理了工具错误、引用是否可信、格式是否适合展示。
+    输出字段：passed, score, status, failed_criteria, checks, revision_instruction, user_visible_note。
diff --git a/backend/prompts/utils/greeting_generate_en.yaml b/backend/prompts/utils/greeting_generate_en.yaml
new file mode 100644
index 000000000..31ea75632
--- /dev/null
+++ b/backend/prompts/utils/greeting_generate_en.yaml
@@ -0,0 +1,54 @@
+GREETING_SYSTEM_PROMPT: |-
+  ### You are an expert in generating agent greetings and example questions. You help users create engaging greetings and practical example questions for starting conversations with agents.
+  You are building an Agent application. The input includes: agent name, duty description, business description, and existing examples.
+  Generate a concise greeting and 3-5 example questions that help users quickly start a conversation with the agent.
+  The greeting should reflect the agent's positioning and capabilities.
+
+  ### Requirements:
+  1. The greeting should be concise and friendly, 1-2 sentences, introducing the agent's identity and core capabilities. Don't make it too long or too formal.
+  2. Example questions should be specific and practical, representing questions users might actually ask, showcasing the agent's core features.
+  3. If existing examples contain user query scenarios, prioritize extracting short user questions from them, keeping semantics consistent but simplified to natural conversational form.
+  4. Provide 3-5 example questions, each with a clear use case.
+  5. You MUST output strictly in JSON format, do not output any other content or formatting.
+
+  ### Output format:
+  ```json
+  {
+    "greeting_message": "greeting content",
+    "example_questions": ["example question 1", "example question 2", "example question 3"]
+  }
+  ```
+
+  ### Examples:
+  Example 1 (Travel Planning Assistant, existing examples contain "Help me plan a trip from Shanghai to Beijing" etc.):
+  ```json
+  {
+    "greeting_message": "Hello! I'm your travel planning assistant, I can help you plan trips, recommend attractions, and arrange travel routes.",
+    "example_questions": ["Help me plan a 3-day trip from Shanghai to Beijing", "Recommend some family-friendly attractions", "What's fun to do in Hangzhou tomorrow?"]
+  }
+  ```
+
+  Example 2 (Data Analysis Assistant):
+  ```json
+  {
+    "greeting_message": "Hello! I'm a data analysis assistant, I can help you process and analyze data, provide visual reports and insights.",
+    "example_questions": ["Help me analyze trends in this sales data", "Generate a quarterly performance comparison report", "Which products have the highest profit margins?"]
+  }
+  ```
+
+USER_PROMPT: |-
+  ### Agent Name:
+  {{display_name}}
+
+  ### Agent Duty Description:
+  {{duty_description}}
+
+  ### Business Description:
+  {{business_description}}
+
+  {% if few_shots %}
+  ### Existing Examples (extract user query scenarios from these as example questions):
+  {{few_shots}}
+  {% endif %}
+
+  Please generate the greeting and example questions based on the above information. Output strictly in JSON format.
\ No newline at end of file
diff --git a/backend/prompts/utils/greeting_generate_zh.yaml b/backend/prompts/utils/greeting_generate_zh.yaml
new file mode 100644
index 000000000..34b8d85d3
--- /dev/null
+++ b/backend/prompts/utils/greeting_generate_zh.yaml
@@ -0,0 +1,53 @@
+GREETING_SYSTEM_PROMPT: |-
+  ### 你是【智能体开场白和示例问题生成专家】，用于帮助用户创建高效、吸引人的智能体开场白和示例问题。
+  现在正在构建一个Agent应用，用户的输入包含：智能体名称、职责描述、业务描述、已有示例。
+  请根据智能体的定位和职责，生成一个简短的开场白和3~5个示例问题，帮助用户快速开始与智能体的对话。
+
+  ### 要求：
+  1.开场白要简洁友好，1-2句话即可，介绍智能体的身份和核心能力，不要过长或过于正式。
+  2.示例问题要具体、实用，是用户真实可能提出的问题，体现智能体的核心功能。
+  3.如果已有示例中包含用户的提问场景，请优先从中提炼简短的用户问题作为示例问题，保持语义一致但简化为自然对话形式。
+  4.示例问题数量为3~5个，每个问题要有明确的使用场景。
+  5.必须严格按照JSON格式输出，不要输出任何其他内容或格式。
+
+  ### 输出格式：
+  ```json
+  {
+    "greeting_message": "开场白内容",
+    "example_questions": ["示例问题1", "示例问题2", "示例问题3"]
+  }
+  ```
+
+  ### 参考示例：
+  示例1（旅行规划助手，已有示例包含"帮我规划明天从上海出发去北京的行程"等场景）：
+  ```json
+  {
+    "greeting_message": "你好！我是你的旅行规划助手，可以帮你规划行程、推荐景点和安排出行路线。",
+    "example_questions": ["帮我规划一个从上海到北京的三日旅行", "推荐一些适合家庭出游的景点", "明天去杭州有什么好玩的地方？"]
+  }
+  ```
+
+  示例2（数据分析助手）：
+  ```json
+  {
+    "greeting_message": "你好！我是数据分析助手，可以帮你处理和分析各种数据，提供可视化报告和洞察。",
+    "example_questions": ["帮我分析这组销售数据的趋势", "生成一份季度业绩对比报告", "哪些产品的利润率最高？"]
+  }
+  ```
+
+USER_PROMPT: |-
+  ### 智能体名称：
+  {{display_name}}
+
+  ### 智能体职责描述：
+  {{duty_description}}
+
+  ### 业务描述：
+  {{business_description}}
+
+  {% if few_shots %}
+  ### 已有示例（请从中提炼用户提问场景作为示例问题）：
+  {{few_shots}}
+  {% endif %}
+
+  请根据以上信息生成开场白和示例问题。严格按JSON格式输出。
\ No newline at end of file
diff --git a/backend/pyproject.toml b/backend/pyproject.toml
index dff0e8693..b8f51dd4c 100644
--- a/backend/pyproject.toml
+++ b/backend/pyproject.toml
@@ -1,7 +1,7 @@
 [project]
 name = "backend"
 version = "0.1.0"
-requires-python = "==3.10.*"
+requires-python = ">=3.11,<3.12"
 dependencies = [
     "aiofiles>=0.8.0",
     "uvicorn>=0.34.0",
@@ -11,7 +11,7 @@ dependencies = [
     "aiohttp>=3.8.0",
     "authlib>=1.3.0",
     "cryptography>=42.0.0",
-    "psycopg2-binary==2.9.10",
+    "psycopg2-binary>=2.9.9",
     "PyJWT>=2.8.0",
     "sqlalchemy~=2.0.37",
     "greenlet<3.5.0",
@@ -21,10 +21,14 @@ dependencies = [
     "jsonref>=1.1.0",
     "ruamel-yaml==0.19.1",
     "redis>=5.0.0",
-    "fastmcp==2.12.0",
+    "fastmcp>=2.14.2,<3.0",
     "langchain>=0.3.26",
     "scikit-learn>=1.0.0",
     "numpy>=1.24.0",
+    "defusedxml>=0.7.1",
+    "openjiuwen>=0.1.0",
+    "pydantic-settings>=2.0.0",
+    "python-docx>=1.1.0",
 ]
 
 [project.optional-dependencies]
@@ -34,7 +38,7 @@ data-process = [
     "flower>=2.0.1",
     "nest_asyncio>=1.5.6",
     "unstructured[csv,docx,pdf,pptx,xlsx,md]==0.18.14",
-    "huggingface_hub>=0.19.0,<0.21.0"
+    "huggingface_hub>=0.30.0,<1.0"
 ]
 test = [
     "pytest",
diff --git a/backend/services/agent_repository_service.py b/backend/services/agent_repository_service.py
new file mode 100644
index 000000000..87649bcd1
--- /dev/null
+++ b/backend/services/agent_repository_service.py
@@ -0,0 +1,306 @@
+import logging
+from typing import Any, Dict, Optional
+
+from consts.const import ASSET_OWNER_TENANT_ID
+from consts.model import AgentRepositorySnapshot
+from database.agent_db import search_agent_info_by_agent_id
+from database.agent_version_db import search_version_by_version_no
+from database.agent_repository_db import (
+    STATUS_PENDING_REVIEW,
+    VALID_REPOSITORY_STATUSES,
+    get_agent_repository_by_agent_id,
+    get_agent_repository_by_id,
+    insert_agent_repository_record,
+    list_agent_repository_summaries,
+    update_agent_repository_by_id,
+    update_agent_repository_status_by_id,
+)
+from services.agent_service import (
+    collect_skill_zip_entries,
+    export_agent_dict_for_repository_impl,
+    import_agent_impl,
+    import_agent_with_skills_impl,
+)
+
+logger = logging.getLogger("agent_repository_service")
+
+_UPDATE_SNAPSHOT_FIELDS = (
+    "display_name",
+    "description",
+    "author",
+    "category_id",
+    "tags",
+    "tool_count",
+    "version_label",
+    "source_version_no",
+    "agent_info_json",
+    "status",
+)
+
+
+def _to_summary_item(record: Dict[str, Any]) -> Dict[str, Any]:
+    """Map a DB record to a lightweight marketplace summary item."""
+    return {
+        "agent_repository_id": record.get("agent_repository_id"),
+        "author": record.get("author"),
+        "name": record.get("name"),
+        "display_name": record.get("display_name"),
+        "description": record.get("description"),
+        "status": record.get("status"),
+    }
+
+
+def list_agent_repository_listings_impl(
+    *,
+    status: Optional[str] = None,
+) -> Dict[str, Any]:
+    """List all repository listings with optional status filter."""
+    if status is not None and status not in VALID_REPOSITORY_STATUSES:
+        raise ValueError(
+            f"Invalid status '{status}'; must be one of: "
+            f"{', '.join(sorted(VALID_REPOSITORY_STATUSES))}"
+        )
+    records = list_agent_repository_summaries(status=status)
+    return {"items": [_to_summary_item(record) for record in records]}
+
+
+def update_agent_repository_status_impl(
+    *,
+    agent_repository_id: int,
+    status: str,
+    user_id: str,
+) -> Dict[str, Any]:
+    """Update a repository listing status by primary key."""
+    if status not in VALID_REPOSITORY_STATUSES:
+        raise ValueError(
+            f"Invalid status '{status}'; must be one of: "
+            f"{', '.join(sorted(VALID_REPOSITORY_STATUSES))}"
+        )
+
+    record = get_agent_repository_by_id(agent_repository_id)
+    if not record:
+        raise ValueError("Repository listing not found")
+
+    rows_affected = update_agent_repository_status_by_id(
+        repository_id=agent_repository_id,
+        status=status,
+        user_id=user_id,
+    )
+    if rows_affected == 0:
+        raise ValueError("Repository listing not found")
+
+    updated = get_agent_repository_by_id(agent_repository_id)
+    if not updated:
+        raise ValueError("Failed to load repository listing after update")
+    return _to_summary_item(updated)
+
+
+def _to_list_item(record: Dict[str, Any]) -> Dict[str, Any]:
+    """Map a DB record to a marketplace list item (without heavy JSON blobs)."""
+    return {
+        "id": record.get("agent_repository_id"),
+        "agent_repository_id": record.get("agent_repository_id"),
+        "agent_id": record.get("agent_id"),
+        "name": record.get("name"),
+        "display_name": record.get("display_name"),
+        "description": record.get("description"),
+        "author": record.get("author"),
+        "category_id": record.get("category_id"),
+        "tags": record.get("tags") or [],
+        "tool_count": record.get("tool_count"),
+        "version_label": record.get("version_label"),
+        "status": record.get("status"),
+        "source_version_no": record.get("source_version_no"),
+        "publisher_tenant_id": record.get("publisher_tenant_id"),
+        "created_at": record.get("create_time"),
+        "updated_at": record.get("update_time"),
+    }
+
+
+def _to_detail_item(
+    record: Dict[str, Any],
+    *,
+    include_bundles: bool = True,
+    is_updated: Optional[bool] = None,
+) -> Dict[str, Any]:
+    """Map a DB record to a marketplace detail payload."""
+    detail = _to_list_item(record)
+    if include_bundles:
+        detail["agent_info_json"] = record.get("agent_info_json")
+    if is_updated is not None:
+        detail["is_updated"] = is_updated
+    return detail
+
+
+def _validate_create_payload(repository_data: Dict[str, Any]) -> None:
+    """Validate required fields before inserting a repository listing."""
+    required_fields = (
+        "agent_id",
+        "source_version_no",
+        "name",
+        "agent_info_json",
+    )
+    missing = [
+        field for field in required_fields
+        if field not in repository_data or repository_data[field] is None
+    ]
+    if missing:
+        raise ValueError(f"Missing required repository fields: {', '.join(missing)}")
+    if not repository_data.get("name"):
+        raise ValueError("name must be a non-empty string")
+
+    agent_info_json = repository_data.get("agent_info_json")
+    if not isinstance(agent_info_json, dict):
+        raise ValueError("agent_info_json must be a JSON object")
+    for key in ("agent_id", "agent_info", "mcp_info"):
+        if key not in agent_info_json:
+            raise ValueError(f"agent_info_json must contain '{key}'")
+
+
+def _validate_agent_info_json_shareable(agent_info_json: dict) -> None:
+    """Reject marketplace share when any agent in the tree belongs to ASSET_OWNER tenant."""
+    agent_info_map = agent_info_json.get("agent_info")
+    if not isinstance(agent_info_map, dict):
+        return
+    for entry in agent_info_map.values():
+        if not isinstance(entry, dict):
+            continue
+        if entry.get("tenant_id") == ASSET_OWNER_TENANT_ID:
+            raise ValueError("租户管理员智能体无法共享")
+
+
+async def _build_agent_info_json(
+    agent_id: int,
+    tenant_id: str,
+    user_id: str,
+    version_no: int,
+) -> dict:
+    """Build marketplace snapshot JSON via the agent export pipeline."""
+    export_dict = await export_agent_dict_for_repository_impl(
+        agent_id=agent_id,
+        tenant_id=tenant_id,
+        user_id=user_id,
+        version_no=version_no,
+    )
+    skills = collect_skill_zip_entries(
+        agent_id=agent_id,
+        tenant_id=tenant_id,
+        version_no=version_no,
+    )
+    snapshot = AgentRepositorySnapshot(
+        **export_dict,
+        skills=skills or None,
+    )
+    return snapshot.model_dump()
+
+
+async def _build_repository_data_from_agent(
+    agent_id: int,
+    tenant_id: str,
+    user_id: str,
+    version_no: int,
+) -> Dict[str, Any]:
+    """Build a repository upsert payload from a published agent version snapshot."""
+    agent_info = search_agent_info_by_agent_id(agent_id, tenant_id, version_no)
+    agent_info_json = await _build_agent_info_json(
+        agent_id=agent_id,
+        tenant_id=tenant_id,
+        user_id=user_id,
+        version_no=version_no,
+    )
+    _validate_agent_info_json_shareable(agent_info_json)
+
+    version_meta = search_version_by_version_no(agent_id, tenant_id, version_no)
+    version_label = (
+        version_meta.get("version_name")
+        if version_meta and version_meta.get("version_name")
+        else f"v{version_no}"
+    )
+
+    return {
+        "agent_id": agent_id,
+        "source_version_no": version_no,
+        "name": agent_info["name"],
+        "display_name": agent_info.get("display_name"),
+        "description": agent_info.get("description"),
+        "author": agent_info.get("author"),
+        "version_label": version_label,
+        "agent_info_json": agent_info_json,
+        "status": STATUS_PENDING_REVIEW,
+    }
+
+
+async def create_agent_repository_listing_impl(
+    agent_id: int,
+    tenant_id: str,
+    user_id: str,
+    version_no: int,
+) -> Dict[str, Any]:
+    """Create or update a repository listing from a published agent version.
+
+    Loads agent metadata and builds agent_info_json via the export pipeline,
+    then inserts or updates the marketplace table.
+
+    When a listing for the same agent_id already exists, snapshot fields are
+    updated via update_agent_repository_by_id.
+    """
+    if version_no < 0:
+        raise ValueError("version_no must be >= 0")
+
+    repository_data = await _build_repository_data_from_agent(
+        agent_id, tenant_id, user_id, version_no
+    )
+    _validate_create_payload(repository_data)
+
+    existing = get_agent_repository_by_agent_id(agent_id)
+    if not existing:
+        repository_id = insert_agent_repository_record(
+            repository_data=repository_data,
+            publisher_tenant_id=tenant_id,
+            publisher_user_id=user_id,
+        )
+        is_updated = False
+    else:
+        repository_id = int(existing["agent_repository_id"])
+        updates = {
+            key: repository_data[key]
+            for key in _UPDATE_SNAPSHOT_FIELDS
+            if key in repository_data
+        }
+        affected = update_agent_repository_by_id(
+            repository_id=repository_id,
+            publisher_tenant_id=tenant_id,
+            user_id=user_id,
+            updates=updates,
+        )
+        if affected == 0:
+            raise ValueError("Failed to update repository listing")
+        is_updated = True
+
+    record = get_agent_repository_by_id(repository_id)
+    if not record:
+        raise ValueError("Failed to load repository listing after write")
+    return _to_detail_item(record, is_updated=is_updated)
+
+
+async def import_agent_from_repository_impl(
+    agent_repository_id: int,
+    authorization: str,
+) -> Dict[int, int]:
+    """Import an agent tree from a marketplace repository listing into the current tenant."""
+    record = get_agent_repository_by_id(agent_repository_id)
+    if not record:
+        raise ValueError("Repository listing not found")
+
+    agent_info_json = record.get("agent_info_json")
+    if not isinstance(agent_info_json, dict):
+        raise ValueError("Repository listing has no agent snapshot")
+
+    snapshot = AgentRepositorySnapshot.model_validate(agent_info_json)
+    if snapshot.skills:
+        return await import_agent_with_skills_impl(
+            snapshot,
+            snapshot.skills,
+            authorization,
+        )
+    return await import_agent_impl(snapshot, authorization)
diff --git a/backend/services/agent_service.py b/backend/services/agent_service.py
index 5a340b1d6..643d1995e 100644
--- a/backend/services/agent_service.py
+++ b/backend/services/agent_service.py
@@ -22,7 +22,8 @@
 from utils.prompt_template_utils import normalize_prompt_generate_template_content
 from consts.const import MEMORY_SEARCH_START_MSG, MEMORY_SEARCH_DONE_MSG, MEMORY_SEARCH_FAIL_MSG, TOOL_TYPE_MAPPING, \
     LANGUAGE, MESSAGE_ROLE, MODEL_CONFIG_MAPPING, CAN_EDIT_ALL_USER_ROLES, PERMISSION_EDIT, PERMISSION_READ, PERMISSION_PRIVATE
-from consts.exceptions import MemoryPreparationException, SkillDuplicateError
+from consts.exceptions import AppException, MemoryPreparationException, SkillDuplicateError
+from consts.error_code import ErrorCode
 from consts.agent_unavailable_reasons import AgentUnavailableReason
 from consts.model import (
     AgentInfoRequest,
@@ -45,7 +46,9 @@
     delete_related_agent,
     insert_related_agent,
     query_all_agent_info_by_tenant_id,
+    query_sub_agent_relations,
     query_sub_agents_id_list,
+    resolve_sub_agent_version_no,
     search_agent_id_by_agent_name,
     search_agent_info_by_agent_id,
     search_blank_sub_agent_by_main_agent_id,
@@ -67,8 +70,10 @@
     search_tools_for_sub_agent
 )
 from database import skill_db
+from database.attachment_db import upload_fileobj
 from services.skill_service import SkillService
-from database.agent_version_db import query_version_list
+from services.file_management_service import is_allowed_skill_upload_path
+from database.agent_version_db import query_version_list, query_current_version_no
 from database.group_db import query_group_ids_by_user
 from database.user_tenant_db import get_user_tenant_by_user_id
 from database.a2a_agent_db import get_server_agent_ids, query_external_sub_agents
@@ -78,7 +83,7 @@
     get_prompt_template_summary,
 )
 from utils.str_utils import convert_list_to_string, convert_string_to_list
-from services.conversation_management_service import save_conversation_assistant, save_conversation_user
+from services.conversation_management_service import save_conversation_assistant, save_conversation_user, save_skill_files_to_conversation
 from services.memory_config_service import build_memory_context
 from utils.auth_utils import get_current_user_info, get_user_language
 from utils.config_utils import tenant_config_manager
@@ -97,9 +102,139 @@
 SAFE_AGENT_STREAM_ERROR_MESSAGE = "Agent execution failed. Please try again later."
 
 
-# -------------------------------------------------------------
-# Internal helper functions
-# -------------------------------------------------------------
+def _extract_json_objects_from_text(text: str) -> list[dict]:
+    """Extract all JSON objects embedded in a text blob."""
+    if not text:
+        return []
+
+    decoder = json.JSONDecoder()
+    results: list[dict] = []
+    index = 0
+
+    while index < len(text):
+        start_index = text.find("{", index)
+        if start_index < 0:
+            break
+
+        try:
+            payload, end_index = decoder.raw_decode(text, start_index)
+        except json.JSONDecodeError:
+            index = start_index + 1
+            continue
+
+        if isinstance(payload, dict):
+            results.append(payload)
+        index = max(end_index, start_index + 1)
+
+    return results
+
+
+def _extract_skill_file_upload_payloads(content: str) -> list[dict]:
+    """Extract JSON payloads containing absolute_path from streamed tool output."""
+    payloads: list[dict] = []
+    for payload in _extract_json_objects_from_text(content):
+        if payload.get("absolute_path"):
+            payloads.append(payload)
+    return payloads
+
+
+def _transform_skill_files_to_standard_format(upload_results: list[dict]) -> list[dict]:
+    """
+    Transform skill file upload results to match the frontend attachment format.
+
+    Skill upload format:
+        {file_name, absolute_path, object_name, preview_url, url, presigned_url, mime_type, file_size, status}
+    Frontend format:
+        {object_name, name, type, size, url, presigned_url, description}
+    """
+    frontend_files = []
+    for result in upload_results:
+        frontend_files.append({
+            "object_name": result.get("object_name", ""),
+            "name": result.get("file_name", result.get("name", "")),
+            "type": "file",
+            "size": result.get("file_size", result.get("size", 0)),
+            "url": result.get("url", ""),
+            "presigned_url": result.get("presigned_url", result.get("preview_url", "")),
+            "description": "",
+        })
+    return frontend_files
+
+
+async def _process_skill_file_uploads(
+    content: str,
+    user_id: str,
+    tenant_id: str,
+) -> list[dict]:
+    """Upload generated skill files to storage and return upload metadata."""
+
+    upload_results: list[dict] = []
+    for payload in _extract_skill_file_upload_payloads(content):
+        absolute_path = str(payload.get("absolute_path") or "").strip()
+        file_name = str(
+            payload.get("file_name")
+            or payload.get("file_path")
+            or os.path.basename(absolute_path)
+        )
+        mime_type = str(payload.get("mime_type") or payload.get("content_type") or "application/octet-stream")
+        if not absolute_path:
+            continue
+
+        if not is_allowed_skill_upload_path(absolute_path):
+            logger.warning(
+                "[skill-file] rejected unsafe path absolute_path=%s",
+                absolute_path,
+            )
+            continue
+
+        if not file_name:
+            file_name = os.path.basename(absolute_path)
+
+        if not os.path.exists(absolute_path):
+            continue
+
+        try:
+            file_size = os.path.getsize(absolute_path)
+            actual_prefix = f"skill-files/{user_id}" if user_id else "skill-files"
+            with open(absolute_path, "rb") as file_obj:
+                upload_result = upload_fileobj(
+                    file_obj=file_obj,
+                    file_name=file_name,
+                    prefix=actual_prefix,
+                    generate_presigned_url=True,
+                    file_size=file_size,
+                )
+
+            if upload_result.get("success"):
+                upload_results.append(
+                    {
+                        "status": "success",
+                        "file_name": file_name,
+                        "absolute_path": absolute_path,
+                        "object_name": upload_result.get("object_name"),
+                        "preview_url": upload_result.get("presigned_url") or upload_result.get("url"),
+                        "url": upload_result.get("url"),
+                        "presigned_url": upload_result.get("presigned_url"),
+                        "mime_type": mime_type,
+                        "file_size": upload_result.get("file_size", file_size),
+                    }
+                )
+            else:
+                error_message = upload_result.get("error") or "Upload failed"
+                logger.warning(
+                    "[skill-file] upload failed file_name=%s absolute_path=%s error=%s",
+                    file_name,
+                    absolute_path,
+                    error_message,
+                )
+        except Exception as exc:
+            logger.exception(
+                "[skill-file] failed to upload file file_name=%s absolute_path=%s",
+                file_name,
+                absolute_path,
+            )
+
+    return upload_results
 
 
 def _safe_agent_stream_error_chunk() -> str:
@@ -647,23 +782,53 @@ async def _stream_agent_chunks(
     agent_run_info,
     memory_ctx,
 ):
-    """Yield SSE chunks from agent_run while persisting messages & cleanup.
-
-    This utility centralizes the common streaming logic used by both
-    generate_stream_with_memory and generate_stream_no_memory so that the code
-    is easier to maintain and less error-prone.
-    """
+    """Yield SSE chunks from agent_run while persisting messages and cleanup."""
 
     local_messages = []
     captured_final_answer = None
+    captured_skill_files: dict[str, dict] = {}
+    skill_file_uploads: list[dict] = []
     try:
         async for chunk in agent_run(agent_run_info):
             local_messages.append(chunk)
-            # Try to capture the final answer as it streams by in order to start memory addition
             try:
                 data = json.loads(chunk)
-                if data.get("type") == "final_answer":
+                chunk_type = data.get("type")
+                if chunk_type == "final_answer":
                     captured_final_answer = data.get("content")
+
+                should_parse_skill_file = chunk_type in {"execution_logs", "parse"} or data.get("role") == "tool-response"
+                if should_parse_skill_file:
+                    extracted_payload_count = 0
+                    content_value = data.get("content")
+                    if isinstance(content_value, list):
+                        content_items = content_value
+                    elif content_value:
+                        content_items = [{"type": "text", "text": str(content_value)}]
+                    else:
+                        content_items = []
+
+                    for item in content_items:
+                        if isinstance(item, dict) and item.get("type") == "text":
+                            text_value = item.get("text")
+                            if text_value:
+                                extracted_payloads = _extract_json_objects_from_text(text_value)
+                                for payload in extracted_payloads:
+                                    absolute_path = str(payload.get("absolute_path") or "").strip()
+                                    if not absolute_path:
+                                        continue
+                                    if absolute_path in captured_skill_files:
+                                        continue
+                                    if not os.path.exists(absolute_path):
+                                        continue
+                                    captured_skill_files[absolute_path] = payload
+                                    extracted_payload_count += 1
+                    if extracted_payload_count:
+                        logger.info(
+                            "[skill-file] captured payloads count=%s current_total=%s",
+                            extracted_payload_count,
+                            len(captured_skill_files),
+                        )
             except Exception:
                 pass
             yield f"data: {chunk}\n\n"
@@ -671,7 +836,6 @@ async def _stream_agent_chunks(
         logger.error("Agent run error: %r", run_exc, exc_info=True)
         yield _safe_agent_stream_error_chunk()
     finally:
-        # Persist assistant messages for non-debug runs
         if not agent_request.is_debug:
             save_messages(
                 agent_request,
@@ -680,11 +844,54 @@ async def _stream_agent_chunks(
                 tenant_id=tenant_id,
                 user_id=user_id,
             )
-        # Always unregister the run to release resources
         agent_run_manager.unregister_agent_run(
             agent_request.conversation_id, user_id)
 
-        # Schedule memory addition in background to avoid blocking SSE termination
+        try:
+            skill_file_content_local = "\n".join(
+                json.dumps(payload, ensure_ascii=False)
+                for payload in captured_skill_files.values()
+            )
+            if skill_file_content_local:
+                skill_file_uploads = await _process_skill_file_uploads(
+                    content=skill_file_content_local,
+                    user_id=user_id,
+                    tenant_id=tenant_id,
+                )
+                logger.info(
+                    "[skill-file] upload finished conversation=%s result_count=%s results=%s",
+                    agent_request.conversation_id,
+                    len(skill_file_uploads), skill_file_uploads
+                )
+                if skill_file_uploads:
+                    # Keep original format for real-time SSE display
+                    skill_files_payload = json.dumps(
+                        {"skill_file_uploads": skill_file_uploads},
+                        ensure_ascii=False,
+                    )
+                    try:
+                        yield f"data: {json.dumps({'type': 'skill_files', 'content': skill_files_payload}, ensure_ascii=False)}\n\n"
+                    except RuntimeError:
+                        # Stream is closing (e.g., client disconnect). Avoid raising during generator teardown.
+                        pass
+                    # Persist skill file uploads to the conversation history so they
+                    # appear in subsequent GET /conversation/{id} calls.
+                    # Transform to frontend attachment format (object_name, name, type, size, etc.)
+                    try:
+                        frontend_files = _transform_skill_files_to_standard_format(skill_file_uploads)
+                        save_skill_files_to_conversation(
+                            conversation_id=agent_request.conversation_id,
+                            skill_file_uploads=frontend_files,
+                            user_id=user_id,
+                        )
+                    except Exception:
+                        logger.exception(
+                            "[skill-file] failed to persist skill file uploads to conversation=%s",
+                            agent_request.conversation_id,
+                        )
+        except Exception:
+            logger.exception("Failed to process skill file uploads")
+
         async def _add_memory_background():
             try:
                 # Skip if memory recording is disabled
@@ -779,14 +986,13 @@ async def get_agent_info_impl(agent_id: int, tenant_id: str, version_no: int = 0
             user_role = str(user_tenant_record.get("user_role") or "").upper()
             can_edit_all = user_role in CAN_EDIT_ALL_USER_ROLES
 
-            # Permission logic (same as agent list):
-            # - If creator or can_edit_all: PERMISSION_EDIT
-            # - Otherwise: use ingroup_permission, default to PERMISSION_READ if None
-            if can_edit_all or str(agent_info.get("created_by")) == str(user_id):
-                agent_info["permission"] = PERMISSION_EDIT
-            else:
-                ingroup_permission = agent_info.get("ingroup_permission")
-                agent_info["permission"] = ingroup_permission if ingroup_permission is not None else PERMISSION_READ
+            # Permission logic (same as agent list, including ASSET_OWNER read-only override)
+            agent_info["permission"] = resolve_agent_list_permission(
+                user_role=user_role,
+                agent=agent_info,
+                user_id=user_id,
+                can_edit_all=can_edit_all,
+            )
         except Exception as e:
             logger.warning(f"Failed to calculate agent permission: {str(e)}")
 
@@ -862,6 +1068,12 @@ async def get_agent_info_impl(agent_id: int, tenant_id: str, version_no: int = 0
     agent_info["is_available"] = is_available
     agent_info["unavailable_reasons"] = unavailable_reasons
 
+    # Set current_version_no from draft record (version_no=0)
+    # This ensures the returned data always has the current published version info
+    if version_no > 0:
+        draft_version_no = query_current_version_no(agent_id, tenant_id)
+        agent_info["current_version_no"] = draft_version_no
+
     return agent_info
 
 
@@ -906,6 +1118,10 @@ async def get_creating_sub_agent_info_impl(authorization: str = Header(None)):
 
 async def update_agent_info_impl(request: AgentInfoRequest, authorization: str = Header(None)):
     user_id, tenant_id, _ = get_current_user_info(authorization)
+
+    if request.example_questions is not None and len(request.example_questions) > 6:
+        raise AppException(ErrorCode.COMMON_PARAMETER_INVALID, "example_questions cannot exceed 6 items")
+
     prompt_template_id, prompt_template_name = get_prompt_template_summary(
         template_id=request.prompt_template_id,
         tenant_id=tenant_id,
@@ -932,9 +1148,12 @@ async def update_agent_info_impl(request: AgentInfoRequest, authorization: str =
                 "prompt_template_name": prompt_template_name,
                 "max_steps": request.max_steps,
                 "provide_run_summary": request.provide_run_summary,
+                "verification_config": request.verification_config,
                 "duty_prompt": request.duty_prompt,
                 "constraint_prompt": request.constraint_prompt,
                 "few_shots_prompt": request.few_shots_prompt,
+                "greeting_message": request.greeting_message,
+                "example_questions": request.example_questions,
                 "enabled": request.enabled if request.enabled is not None else True,
                 "group_ids": convert_list_to_string(request.group_ids) if request.group_ids else user_group_ids,
                 "ingroup_permission": request.ingroup_permission
@@ -1202,76 +1421,216 @@ async def clear_agent_memory(agent_id: int, tenant_id: str, user_id: str):
         # Silently fail to maintain agent deletion process
 
 
-async def export_agent_impl(agent_id: int, authorization: str = Header(None)) -> str:
-    """
-    Export the configuration information of the specified agent and all its sub-agents.
-
-    Args:
-        agent_id (int): The ID of the agent to export.
-        authorization (str): User authentication information, obtained from the Header.
-
-    Returns:
-        str: A formatted JSON string containing the configuration information of the agent and all its sub-agents.
-
-    Data Structure Example:
-        model.py  ExportAndImportDataFormat
-
-    Note:
-        This function recursively finds all managed sub-agents and exports the detailed configuration of each agent (including tools, prompts, etc.) as a dictionary, and finally returns it as a formatted JSON string for frontend download and backup.
-    """
-
-    user_id, tenant_id, _ = get_current_user_info(authorization)
-
+async def _export_agent_dict_core(
+    root_agent_id: int,
+    tenant_id: str,
+    user_id: str,
+    version_no: int = 0,
+) -> dict:
+    """Build ExportAndImportDataFormat dict for an agent tree at the given version."""
     export_agent_dict = {}
-    search_list = deque([agent_id])
-    agent_id_set = set()
+    search_list: deque = deque([(root_agent_id, version_no)])
+    visited: set = set()
 
     mcp_info_set = set()
 
-    while len(search_list):
-        left_ele = search_list.popleft()
-        if left_ele in agent_id_set:
+    while search_list:
+        current_agent_id, current_version_no = search_list.popleft()
+        visit_key = (current_agent_id, current_version_no)
+        if visit_key in visited:
             continue
+        visited.add(visit_key)
 
-        agent_id_set.add(left_ele)
-        agent_info = await export_agent_by_agent_id(agent_id=left_ele, tenant_id=tenant_id, user_id=user_id)
+        agent_info = await export_agent_by_agent_id(
+            agent_id=current_agent_id,
+            tenant_id=tenant_id,
+            user_id=user_id,
+            version_no=current_version_no,
+        )
 
-        # collect mcp name
         for tool in agent_info.tools:
             if tool.source == "mcp" and tool.usage:
                 mcp_info_set.add(tool.usage)
 
-        search_list.extend(agent_info.managed_agents)
+        relations = query_sub_agent_relations(
+            main_agent_id=current_agent_id,
+            tenant_id=tenant_id,
+            version_no=current_version_no,
+        )
+        for rel in relations:
+            child_id = rel["selected_agent_id"]
+            child_version = resolve_sub_agent_version_no(
+                child_id,
+                rel.get("selected_agent_version_no"),
+                tenant_id,
+            )
+            search_list.append((child_id, child_version))
+
         export_agent_dict[str(agent_info.agent_id)] = agent_info
 
-    # convert mcp info to MCPInfo list
     mcp_info_list = []
     for mcp_server_name in mcp_info_set:
-        # get mcp url by mcp_server_name and tenant_id
         mcp_url = get_mcp_server_by_name_and_tenant(mcp_server_name, tenant_id)
         mcp_info_list.append(
             MCPInfo(mcp_server_name=mcp_server_name, mcp_url=mcp_url))
 
     export_data = ExportAndImportDataFormat(
-        agent_id=agent_id, agent_info=export_agent_dict, mcp_info=mcp_info_list)
-    return json.dumps(export_data.model_dump())
+        agent_id=root_agent_id,
+        agent_info=export_agent_dict,
+        mcp_info=mcp_info_list,
+    )
+    return export_data.model_dump()
 
 
-async def export_agent_by_agent_id(agent_id: int, tenant_id: str, user_id: str) -> ExportAndImportAgentInfo:
+async def export_agent_dict_impl(
+    agent_id: int,
+    authorization: str = Header(None),
+    version_no: int = 0,
+) -> dict:
     """
-    Export a single agent's information based on agent_id
+    Export the configuration information of the specified agent and all its sub-agents.
+
+    Args:
+        agent_id (int): The ID of the agent to export.
+        authorization (str): User authentication information, obtained from the Header.
+        version_no (int): Version to export. Default 0 = draft.
+
+    Returns:
+        dict: ExportAndImportDataFormat as a plain dict (via model_dump).
     """
+    user_id, tenant_id, _ = get_current_user_info(authorization)
+    return await _export_agent_dict_core(
+        root_agent_id=agent_id,
+        tenant_id=tenant_id,
+        user_id=user_id,
+        version_no=version_no,
+    )
+
+
+async def export_agent_dict_for_repository_impl(
+    agent_id: int,
+    tenant_id: str,
+    user_id: str,
+    version_no: int,
+) -> dict:
+    """Export agent tree for marketplace repository storage (no HTTP auth header)."""
+    return await _export_agent_dict_core(
+        root_agent_id=agent_id,
+        tenant_id=tenant_id,
+        user_id=user_id,
+        version_no=version_no,
+    )
+
+
+async def export_agent_impl(
+    agent_id: int,
+    authorization: str = Header(None),
+    version_no: int = 0,
+) -> str:
+    """Serialize export_agent_dict_impl output to a JSON string for download or ZIP embedding."""
+    agent_dict = await export_agent_dict_impl(
+        agent_id, authorization, version_no=version_no
+    )
+    return json.dumps(agent_dict)
+
+
+def _collect_skill_names_from_tree(
+    agent_id: int,
+    tenant_id: str,
+    version_no: int,
+    visited: Optional[set] = None,
+) -> List[str]:
+    """Collect unique skill names from an agent tree at the given version."""
+    if visited is None:
+        visited = set()
+
+    skill_names: List[str] = []
+    seen_names: set = set()
+
+    def _walk(current_agent_id: int, current_version_no: int) -> None:
+        visit_key = (current_agent_id, current_version_no)
+        if visit_key in visited:
+            return
+        visited.add(visit_key)
+
+        skill_instances = skill_db.query_skill_instances_by_agent_id(
+            agent_id=current_agent_id,
+            tenant_id=tenant_id,
+            version_no=current_version_no,
+        )
+        for inst in skill_instances:
+            skill_id = inst.get("skill_id")
+            skill = skill_db.get_skill_by_id(skill_id, tenant_id)
+            if skill:
+                name = skill.get("name")
+                if name and name not in seen_names:
+                    seen_names.add(name)
+                    skill_names.append(name)
+
+        relations = query_sub_agent_relations(
+            main_agent_id=current_agent_id,
+            tenant_id=tenant_id,
+            version_no=current_version_no,
+        )
+        for rel in relations:
+            child_id = rel["selected_agent_id"]
+            child_version = resolve_sub_agent_version_no(
+                child_id,
+                rel.get("selected_agent_version_no"),
+                tenant_id,
+            )
+            _walk(child_id, child_version)
+
+    _walk(agent_id, version_no)
+    return skill_names
+
+
+def collect_skill_zip_entries(
+    agent_id: int,
+    tenant_id: str,
+    version_no: int = 0,
+) -> List[SkillZipEntry]:
+    """Export skill ZIP payloads for all skills in an agent tree."""
+    skill_names = _collect_skill_names_from_tree(agent_id, tenant_id, version_no)
+    if not skill_names:
+        return []
+
+    skill_service = SkillService(tenant_id=tenant_id)
+    exported = skill_service.export_skills_by_names(skill_names, tenant_id)
+    return [
+        SkillZipEntry(
+            skill_name=entry["skill_name"],
+            skill_zip_base64=entry["skill_zip_base64"],
+        )
+        for entry in exported
+    ]
+
+
+async def export_agent_by_agent_id(
+    agent_id: int,
+    tenant_id: str,
+    user_id: str,
+    version_no: int = 0,
+) -> ExportAndImportAgentInfo:
+    """Export a single agent's information based on agent_id and version_no."""
     agent_info = search_agent_info_by_agent_id(
-        agent_id=agent_id, tenant_id=tenant_id)
+        agent_id=agent_id, tenant_id=tenant_id, version_no=version_no
+    )
     agent_relation_in_db = query_sub_agents_id_list(
-        main_agent_id=agent_id, tenant_id=tenant_id)
-    tool_list = await create_tool_config_list(agent_id=agent_id, tenant_id=tenant_id, user_id=user_id)
+        main_agent_id=agent_id, tenant_id=tenant_id, version_no=version_no
+    )
+    tool_list = await create_tool_config_list(
+        agent_id=agent_id,
+        tenant_id=tenant_id,
+        user_id=user_id,
+        version_no=version_no,
+    )
 
     # Collect skill names from skill instances
     skill_names: List[str] = []
     try:
         skill_instances = skill_db.query_skill_instances_by_agent_id(
-            agent_id=agent_id, tenant_id=tenant_id, version_no=0
+            agent_id=agent_id, tenant_id=tenant_id, version_no=version_no
         )
         for inst in skill_instances:
             skill_id = inst.get("skill_id")
@@ -1307,6 +1666,7 @@ async def export_agent_by_agent_id(agent_id: int, tenant_id: str, user_id: str)
             "display_name") if business_logic_model_info is not None else None
 
     agent_info = ExportAndImportAgentInfo(agent_id=agent_id,
+                                          tenant_id=agent_info["tenant_id"],
                                           name=agent_info["name"],
                                           display_name=agent_info["display_name"],
                                           description=agent_info["description"],
@@ -1314,6 +1674,7 @@ async def export_agent_by_agent_id(agent_id: int, tenant_id: str, user_id: str)
                                           author=agent_info.get("author"),
                                           max_steps=agent_info["max_steps"],
                                           provide_run_summary=agent_info["provide_run_summary"],
+                                          verification_config=agent_info.get("verification_config"),
                                           duty_prompt=agent_info.get(
                                               "duty_prompt"),
                                           constraint_prompt=agent_info.get(
@@ -1468,6 +1829,7 @@ async def import_agent_by_agent_id(
                                          "prompt_template_name": import_agent_info.prompt_template_name or SYSTEM_PROMPT_TEMPLATE_NAME,
                                          "max_steps": import_agent_info.max_steps,
                                          "provide_run_summary": import_agent_info.provide_run_summary,
+                                         "verification_config": getattr(import_agent_info, "verification_config", None),
                                          "duty_prompt": import_agent_info.duty_prompt,
                                          "constraint_prompt": import_agent_info.constraint_prompt,
                                          "few_shots_prompt": import_agent_info.few_shots_prompt,
@@ -1835,6 +2197,7 @@ async def prepare_agent_run(
         is_debug=agent_request.is_debug,
         override_version_no=agent_request.version_no,
         override_model_id=agent_request.model_id,
+        tool_params=agent_request.tool_params,
     )
 
     # Mount conversation-level reusable ContextManager if enabled
@@ -2280,52 +2643,45 @@ def get_sub_agents_recursive(parent_agent_id: int, depth: int = 0, max_depth: in
         raise ValueError(f"Failed to get agent call relationship: {str(e)}")
 
 
-async def export_agent_with_skills_impl(agent_id: int, authorization: str) -> dict:
-    """Export an agent, returning a ZIP if it has skill instances, otherwise plain JSON.
+async def export_agent_with_skills_impl(
+    agent_id: int,
+    authorization: str,
+    version_no: int = 0,
+) -> dict:
+    """Export an agent, returning a ZIP if it has skill instances, otherwise a plain dict.
 
     The response is either:
       - A dict with {"_zip": True, "data": bytes, "filename": str} when the agent has skills
-      - A plain dict (JSON string) when the agent has no skills
+      - ExportAndImportDataFormat as a plain dict when the agent has no skills
     """
-    from services.skill_service import SkillService
-
     user_id, tenant_id, _ = get_current_user_info(authorization)
 
-    skill_instances = skill_db.query_skill_instances_by_agent_id(
-        agent_id=agent_id, tenant_id=tenant_id, version_no=0
+    skill_zip_entries = collect_skill_zip_entries(
+        agent_id=agent_id, tenant_id=tenant_id, version_no=version_no
     )
 
-    if not skill_instances:
-        return await export_agent_impl(agent_id, authorization)
-
-    skill_names = []
-    for inst in skill_instances:
-        skill_id = inst.get("skill_id")
-        skill = skill_db.get_skill_by_id(skill_id, tenant_id)
-        if skill:
-            skill_names.append(skill.get("name"))
-
-    if not skill_names:
-        return await export_agent_impl(agent_id, authorization)
-
-    agent_json_str = await export_agent_impl(agent_id, authorization)
+    if not skill_zip_entries:
+        return await export_agent_dict_impl(
+            agent_id, authorization, version_no=version_no
+        )
 
-    skill_service = SkillService(tenant_id=tenant_id)
-    skill_zip_entries = skill_service.export_skills_by_names(
-        skill_names, tenant_id)
+    agent_json_str = await export_agent_impl(
+        agent_id, authorization, version_no=version_no
+    )
 
     zip_buffer = io.BytesIO()
     with zipfile.ZipFile(zip_buffer, "w", zipfile.ZIP_DEFLATED) as zf:
         zf.writestr("agent.json", agent_json_str)
         for entry in skill_zip_entries:
-            skill_zip_bytes = base64.b64decode(entry["skill_zip_base64"])
-            zf.writestr(f"skills/{entry['skill_name']}.zip", skill_zip_bytes)
+            skill_zip_bytes = base64.b64decode(entry.skill_zip_base64)
+            zf.writestr(f"skills/{entry.skill_name}.zip", skill_zip_bytes)
 
     zip_buffer.seek(0)
     zip_data = zip_buffer.read()
 
     agent_info = search_agent_info_by_agent_id(
-        agent_id=agent_id, tenant_id=tenant_id)
+        agent_id=agent_id, tenant_id=tenant_id, version_no=version_no
+    )
     agent_name = agent_info.get(
         "name", "anonymous") if agent_info else "anonymous"
 
diff --git a/backend/services/agent_version_service.py b/backend/services/agent_version_service.py
index d7096727b..8ed6e14d4 100644
--- a/backend/services/agent_version_service.py
+++ b/backend/services/agent_version_service.py
@@ -49,6 +49,17 @@ def _remove_audit_fields_for_insert(data: dict) -> None:
     data.pop('delete_flag', None)
 
 
+def _build_sub_agent_relations(relations: List[dict]) -> List[dict]:
+    """Map relation snapshots to sub-agent relation payloads for API responses."""
+    return [
+        {
+            'agent_id': r['selected_agent_id'],
+            'version_no': r.get('selected_agent_version_no'),
+        }
+        for r in relations
+    ]
+
+
 def publish_version_impl(
     agent_id: int,
     tenant_id: str,
@@ -92,11 +103,18 @@ def publish_version_impl(
         _remove_audit_fields_for_insert(tool_snapshot)
         insert_tool_snapshot(tool_snapshot)
 
-    # Insert relation snapshots
+    # Insert relation snapshots with pinned child agent versions
     for rel in relations_draft:
+        child_id = rel['selected_agent_id']
+        child_version = query_current_version_no(child_id, tenant_id)
+        if child_version is None:
+            raise ValueError(
+                f"Sub-agent {child_id} has no published version; publish the sub-agent first."
+            )
         rel_snapshot = rel.copy()
         rel_snapshot.pop('version_no', None)
         rel_snapshot['version_no'] = new_version_no
+        rel_snapshot['selected_agent_version_no'] = child_version
         _remove_audit_fields_for_insert(rel_snapshot)
         insert_relation_snapshot(rel_snapshot)
 
@@ -271,6 +289,7 @@ def get_version_detail_impl(
 
     # Extract sub_agent_id_list from relations
     result['sub_agent_id_list'] = [r['selected_agent_id'] for r in relations_snapshot]
+    result['sub_agent_relations'] = _build_sub_agent_relations(relations_snapshot)
 
     # Get skill instances for this version (from ag_skill_instance_t with version_no)
     from database import skill_db as skill_db_module
@@ -710,6 +729,7 @@ def _get_version_detail_or_draft(
         # Add tools (only enabled tools)
         result['tools'] = [t for t in tools_draft if t.get('enabled', True)]
         result['sub_agent_id_list'] = [r['selected_agent_id'] for r in relations_draft]
+        result['sub_agent_relations'] = _build_sub_agent_relations(relations_draft)
 
         # Get draft skill instances (version_no=0)
         skills_draft = skill_db_module.query_skill_instances_by_agent_id(
@@ -783,12 +803,11 @@ async def list_published_agents_impl(
             CAN_EDIT_ALL_USER_ROLES,
             get_user_tenant_by_user_id,
             query_group_ids_by_user,
-            PERMISSION_EDIT,
-            PERMISSION_READ,
             get_model_by_model_id,
             check_agent_availability,
             _apply_duplicate_name_availability_rules,
         )
+        from services.asset_owner_visibility import resolve_agent_list_permission
         from database.agent_version_db import query_agent_snapshot
 
         # Get user role for permission check
@@ -858,9 +877,10 @@ async def list_published_agents_impl(
 
             # Extract sub_agent_id_list from relations
             agent_info['sub_agent_id_list'] = [r['selected_agent_id'] for r in relations_snapshot]
+            agent_info['sub_agent_relations'] = _build_sub_agent_relations(relations_snapshot)
 
-            # Add published version info
-            agent_info['published_version_no'] = current_version_no
+            # Add current version info
+            agent_info['current_version_no'] = current_version_no
 
             # Check agent availability using the shared function
             _, unavailable_reasons = check_agent_availability(
@@ -893,7 +913,12 @@ async def list_published_agents_impl(
                     model_cache[model_id] = get_model_by_model_id(model_id, tenant_id)
                 model_info = model_cache.get(model_id)
 
-            permission = PERMISSION_EDIT if can_edit_all or str(agent.get("created_by")) == str(user_id) else PERMISSION_READ
+            permission = resolve_agent_list_permission(
+                user_role=user_role,
+                agent=agent,
+                user_id=user_id,
+                can_edit_all=can_edit_all,
+            )
 
             simple_agent_list.append({
                 "agent_id": agent.get("agent_id"),
@@ -909,7 +934,9 @@ async def list_published_agents_impl(
                 "is_new": agent.get("is_new", False),
                 "group_ids": agent.get("group_ids", []),
                 "permission": permission,
-                "published_version_no": agent.get("published_version_no"),
+                "current_version_no": agent.get("current_version_no"),
+                "greeting_message": agent.get("greeting_message"),
+                "example_questions": agent.get("example_questions"),
             })
 
         return simple_agent_list
diff --git a/backend/services/cas_service.py b/backend/services/cas_service.py
new file mode 100644
index 000000000..7db3fce1a
--- /dev/null
+++ b/backend/services/cas_service.py
@@ -0,0 +1,424 @@
+import json
+import logging
+import os
+import secrets
+import ssl
+import urllib.parse
+import urllib.request
+from xml.etree.ElementTree import Element
+from dataclasses import dataclass
+from datetime import datetime, timedelta
+from typing import Any, Dict, Optional
+
+import defusedxml.ElementTree as ET
+from defusedxml.common import DefusedXmlException
+
+from consts.const import (
+    CAS_CA_BUNDLE,
+    CAS_CALLBACK_BASE_URL,
+    CAS_EMAIL_ATTRIBUTE,
+    CAS_ENABLED,
+    CAS_LOGIN_MODE,
+    CAS_LOGOUT_URL,
+    CAS_RENEW_BEFORE_SECONDS,
+    CAS_RENEW_TIMEOUT_SECONDS,
+    CAS_ROLE_ATTRIBUTE,
+    CAS_ROLE_MAP_JSON,
+    CAS_SERVER_URL,
+    CAS_SESSION_MAX_AGE_SECONDS,
+    CAS_SSL_VERIFY,
+    CAS_SYNTHETIC_EMAIL_DOMAIN,
+    CAS_TENANT_ATTRIBUTE,
+    CAS_USER_ATTRIBUTE,
+    CAS_VALIDATE_PATH,
+    DEFAULT_TENANT_ID,
+    LOCAL_SESSION_MAX_AGE_SECONDS,
+)
+from database.cas_session_db import (
+    create_cas_session,
+    revoke_cas_session_by_index,
+    revoke_cas_sessions_by_user_id,
+)
+from database.oauth_account_db import get_oauth_account_by_provider
+from database.user_tenant_db import get_user_tenant_by_user_id, upsert_user_tenant
+from services.oauth_service import (
+    create_or_update_oauth_account,
+    find_supabase_user_id_by_email,
+)
+from services.skill_service import init_skill_list_for_tenant
+from services.tool_configuration_service import init_tool_list_for_tenant
+from utils.auth_utils import calculate_expires_at, generate_session_jwt, get_supabase_admin_client
+
+logger = logging.getLogger(__name__)
+
+CAS_PROVIDER = "cas"
+VALID_ROLES = {"SU", "ADMIN", "DEV", "USER"}
+
+
+class CasAuthenticationError(Exception):
+    pass
+
+
+@dataclass
+class CasPrincipal:
+    cas_user_id: str
+    email: str
+    username: str
+    role: str
+    tenant_id: str
+    session_index: str
+    expires_at: datetime
+
+
+def get_cas_config() -> Dict[str, Any]:
+    mode = CAS_LOGIN_MODE if CAS_LOGIN_MODE in {"button", "force", "disabled"} else "disabled"
+    enabled = CAS_ENABLED and bool(CAS_SERVER_URL)
+    if not enabled:
+        mode = "disabled"
+    return {
+        "enabled": enabled,
+        "login_mode": mode,
+        "renew_before_seconds": CAS_RENEW_BEFORE_SECONDS,
+        "renew_timeout_seconds": CAS_RENEW_TIMEOUT_SECONDS,
+        "display_name": "CAS",
+    }
+
+
+def build_login_url(redirect: str = "/") -> str:
+    _ensure_enabled()
+    service_url = _build_callback_url("/api/user/cas/callback", {"redirect": _normalize_redirect(redirect)})
+    return f"{CAS_SERVER_URL}/login?service={service_url}"
+
+
+def build_renew_url() -> str:
+    _ensure_enabled()
+    service_url = _build_callback_url("/api/user/cas/renew_callback", {})
+    return f"{CAS_SERVER_URL}/login?service={service_url}&gateway=true"
+
+
+def build_logout_url() -> str:
+    _ensure_enabled()
+    configured_logout_url = CAS_LOGOUT_URL.strip()
+    if not configured_logout_url:
+        return ""
+
+    parsed_config = urllib.parse.urlsplit(configured_logout_url)
+    if parsed_config.scheme and parsed_config.netloc:
+        logout_url = configured_logout_url
+    else:
+        logout_url = f"{CAS_SERVER_URL}/{configured_logout_url.lstrip('/')}"
+
+    parsed = urllib.parse.urlsplit(logout_url)
+    if parsed.query:
+        return logout_url
+
+    query = f"service={CAS_CALLBACK_BASE_URL}"
+    return urllib.parse.urlunsplit((parsed.scheme, parsed.netloc, parsed.path, query, parsed.fragment))
+
+
+async def login_with_ticket(ticket: str, redirect: str = "/") -> Dict[str, Any]:
+    redirect = _normalize_redirect(redirect)
+    service_url = _build_callback_url("/api/user/cas/callback", {"redirect": redirect})
+    principal = validate_service_ticket(ticket, service_url)
+    return await _create_project_session(principal, redirect=redirect)
+
+
+async def renew_with_ticket(ticket: str) -> Dict[str, Any]:
+    service_url = _build_callback_url("/api/user/cas/renew_callback", {})
+    principal = validate_service_ticket(ticket, service_url)
+    return await _create_project_session(principal, redirect="/", renew=True)
+
+
+def validate_service_ticket(ticket: str, service_url: str) -> CasPrincipal:
+    _ensure_enabled()
+    if not ticket:
+        raise CasAuthenticationError("CAS ticket is missing")
+
+    validate_path = CAS_VALIDATE_PATH if CAS_VALIDATE_PATH.startswith("/") else f"/{CAS_VALIDATE_PATH}"
+    validate_url = f"{CAS_SERVER_URL}{validate_path}"
+    xml_text = _http_get_text(f"{validate_url}?service={service_url}&ticket={ticket}")
+    logger.info("CAS serviceValidate response: %s", xml_text)
+    return parse_service_validate_response(xml_text, fallback_session_index=ticket)
+
+
+def parse_service_validate_response(xml_text: str, fallback_session_index: str = "") -> CasPrincipal:
+    try:
+        root = ET.fromstring(xml_text)
+    except (ET.ParseError, DefusedXmlException) as exc:
+        raise CasAuthenticationError("Invalid CAS validation response") from exc
+
+    failure = _find_first(root, "authenticationFailure")
+    if failure is not None:
+        raise CasAuthenticationError((failure.text or "CAS authentication failed").strip())
+
+    success = _find_first(root, "authenticationSuccess")
+    if success is None:
+        raise CasAuthenticationError("CAS authentication failed")
+
+    user = _get_child_text(success, "user")
+    attrs_node = _find_first(success, "attributes")
+    attrs = _extract_attributes(attrs_node) if attrs_node is not None else {}
+
+    cas_user_id = _attribute_or_default(attrs, CAS_USER_ATTRIBUTE, user) or user
+    if not cas_user_id:
+        raise CasAuthenticationError("CAS user id is missing")
+
+    email = _attribute_or_default(attrs, CAS_EMAIL_ATTRIBUTE, "")
+    username = attrs.get("displayName") or attrs.get("name") or cas_user_id
+    role = _map_role(_attribute_or_default(attrs, CAS_ROLE_ATTRIBUTE, "USER"))
+    tenant_id = _attribute_or_default(attrs, CAS_TENANT_ATTRIBUTE, DEFAULT_TENANT_ID) or DEFAULT_TENANT_ID
+    session_index = attrs.get("SessionIndex") or attrs.get("sessionIndex") or fallback_session_index
+    expires_at = _resolve_expires_at(attrs)
+
+    if not email:
+        safe_user = "".join(c if c.isalnum() or c in ("-", "_", ".") else "_" for c in cas_user_id)
+        email = f"{safe_user}@{CAS_SYNTHETIC_EMAIL_DOMAIN}"
+
+    return CasPrincipal(
+        cas_user_id=str(cas_user_id),
+        email=str(email).lower(),
+        username=str(username),
+        role=role,
+        tenant_id=str(tenant_id),
+        session_index=str(session_index or ""),
+        expires_at=expires_at,
+    )
+
+
+def parse_logout_request(logout_request: str) -> Dict[str, str]:
+    if not logout_request:
+        return {"cas_user_id": "", "session_index": ""}
+    try:
+        root = ET.fromstring(logout_request)
+    except (ET.ParseError, DefusedXmlException):
+        logger.warning("Invalid CAS logoutRequest XML")
+        return {"cas_user_id": "", "session_index": ""}
+
+    session_index = _get_child_text(root, "SessionIndex")
+    cas_user_id = (
+        _get_child_text(root, "NameID")
+        or _get_child_text(root, "nameID")
+        or _get_child_text(root, "user")
+        or _get_child_text(root, "casUserId")
+    )
+    return {"cas_user_id": cas_user_id or "", "session_index": session_index or ""}
+
+
+def revoke_from_logout_request(logout_request: str) -> Dict[str, Any]:
+    parsed = parse_logout_request(logout_request)
+    revoked = 0
+    if parsed["cas_user_id"]:
+        revoked = revoke_cas_sessions_by_user_id(parsed["cas_user_id"])
+        logger.info(
+            "CAS SLO revoke by cas_user_id: cas_user_id=%s revoked=%s",
+            parsed["cas_user_id"],
+            revoked,
+        )
+    if revoked == 0 and parsed["session_index"]:
+        revoked = revoke_cas_session_by_index(parsed["session_index"])
+        logger.info(
+            "CAS SLO revoke by session_index: session_index=%s revoked=%s",
+            parsed["session_index"],
+            revoked,
+        )
+    if revoked == 0:
+        logger.warning("CAS SLO did not revoke any session: %s", parsed)
+    return {"revoked": revoked, **parsed}
+
+
+async def _create_project_session(principal: CasPrincipal, redirect: str = "/", renew: bool = False) -> Dict[str, Any]:
+    user_id = _resolve_project_user(principal)
+    existing_tenant = get_user_tenant_by_user_id(user_id)
+    user_tenant = upsert_user_tenant(
+        user_id=user_id,
+        tenant_id=principal.tenant_id,
+        user_role=principal.role,
+        user_email=principal.email,
+    )
+    if not existing_tenant:
+        await init_tool_list_for_tenant(principal.tenant_id, user_id)
+        await init_skill_list_for_tenant(principal.tenant_id, user_id)
+
+    now = datetime.now()
+    max_local_expiry = now + timedelta(seconds=LOCAL_SESSION_MAX_AGE_SECONDS)
+    expires_at_dt = min(principal.expires_at, max_local_expiry)
+    expires_in_seconds = max(1, int((expires_at_dt - now).total_seconds()))
+
+    session_id = secrets.token_urlsafe(32)
+    create_cas_session(
+        session_id=session_id,
+        user_id=user_id,
+        cas_user_id=principal.cas_user_id,
+        cas_session_index=principal.session_index,
+        expires_at=expires_at_dt,
+    )
+
+    jwt_token = generate_session_jwt(user_id, expires_in=expires_in_seconds, session_id=session_id)
+
+    return {
+        "user": {
+            "id": str(user_id),
+            "email": principal.email,
+            "role": user_tenant.get("user_role", principal.role),
+        },
+        "session": {
+            "access_token": jwt_token,
+            "refresh_token": "",
+            "expires_at": calculate_expires_at(jwt_token),
+            "expires_in_seconds": expires_in_seconds,
+        },
+        "redirect_url": redirect,
+        "renew": renew,
+    }
+
+
+def _resolve_project_user(principal: CasPrincipal) -> str:
+    existing = get_oauth_account_by_provider(CAS_PROVIDER, principal.cas_user_id)
+    if existing:
+        create_or_update_oauth_account(
+            user_id=existing["user_id"],
+            provider=CAS_PROVIDER,
+            provider_user_id=principal.cas_user_id,
+            email=principal.email,
+            username=principal.username,
+            tenant_id=principal.tenant_id,
+        )
+        return existing["user_id"]
+
+    admin_client = get_supabase_admin_client()
+    if not admin_client:
+        raise RuntimeError("Supabase admin client not available")
+
+    user_id = find_supabase_user_id_by_email(admin_client, principal.email)
+    if not user_id:
+        create_resp = admin_client.auth.admin.create_user(
+            {
+                "email": principal.email,
+                "password": secrets.token_urlsafe(32),
+                "email_confirm": True,
+                "user_metadata": {
+                    "full_name": principal.username,
+                    "provider": CAS_PROVIDER,
+                    "cas_user_id": principal.cas_user_id,
+                },
+            }
+        )
+        user_id = create_resp.user.id
+
+    create_or_update_oauth_account(
+        user_id=user_id,
+        provider=CAS_PROVIDER,
+        provider_user_id=principal.cas_user_id,
+        email=principal.email,
+        username=principal.username,
+        tenant_id=principal.tenant_id,
+    )
+    return user_id
+
+
+def _ensure_enabled() -> None:
+    if not CAS_ENABLED or not CAS_SERVER_URL:
+        raise CasAuthenticationError("CAS is not configured")
+
+
+def _build_callback_url(path: str, params: Dict[str, str]) -> str:
+    if not CAS_CALLBACK_BASE_URL:
+        raise CasAuthenticationError("CAS callback base URL is not configured")
+    query = _build_callback_query(params)
+    suffix = f"?{query}" if query else ""
+    return f"{CAS_CALLBACK_BASE_URL}{path}{suffix}"
+
+
+def _build_callback_query(params: Dict[str, str]) -> str:
+    return "&".join(f"{key}={value}" for key, value in params.items())
+
+
+def _normalize_redirect(redirect: str) -> str:
+    if not redirect or not redirect.startswith("/") or redirect.startswith("//"):
+        return "/"
+    return redirect
+
+
+def _build_ssl_context() -> ssl.SSLContext:
+    if CAS_CA_BUNDLE and os.path.isfile(CAS_CA_BUNDLE):
+        return ssl.create_default_context(cafile=CAS_CA_BUNDLE)
+    if not CAS_SSL_VERIFY:
+        ctx = ssl.create_default_context()
+        ctx.check_hostname = False
+        ctx.verify_mode = ssl.CERT_NONE
+        return ctx
+    return ssl.create_default_context()
+
+
+def _http_get_text(url: str) -> str:
+    req = urllib.request.Request(url, headers={"Accept": "application/xml,text/xml,*/*"})
+    with urllib.request.urlopen(req, timeout=15, context=_build_ssl_context()) as resp:
+        return resp.read().decode("utf-8")
+
+
+def _local_name(tag: str) -> str:
+    return tag.rsplit("}", 1)[-1]
+
+
+def _find_first(node: Element, name: str) -> Optional[Element]:
+    for child in node.iter():
+        if _local_name(child.tag) == name:
+            return child
+    return None
+
+
+def _get_child_text(node: Element, name: str) -> str:
+    found = _find_first(node, name)
+    return (found.text or "").strip() if found is not None else ""
+
+
+def _extract_attributes(attrs_node: Element) -> Dict[str, str]:
+    attrs: Dict[str, str] = {}
+    for child in list(attrs_node):
+        value = (child.text or "").strip()
+        if value:
+            attrs[_local_name(child.tag)] = value
+    return attrs
+
+
+def _attribute_or_default(attrs: Dict[str, str], key: str, default: str) -> str:
+    if key and key in attrs:
+        return attrs[key]
+    return default
+
+
+def _map_role(raw_role: str) -> str:
+    role = (raw_role or "USER").upper()
+    try:
+        role_map = json.loads(CAS_ROLE_MAP_JSON) if CAS_ROLE_MAP_JSON else {}
+        role = str(role_map.get(raw_role, role_map.get(role, role))).upper()
+    except Exception:
+        logger.warning("Invalid CAS_ROLE_MAP_JSON; falling back to raw role")
+    return role if role in VALID_ROLES else "USER"
+
+
+def _resolve_expires_at(attrs: Dict[str, str]) -> datetime:
+    for key in ("expiresAt", "expirationDate", "validUntil", "notOnOrAfter"):
+        value = attrs.get(key)
+        if not value:
+            continue
+        parsed = _parse_datetime(value)
+        if parsed:
+            return parsed
+    return datetime.now() + timedelta(seconds=CAS_SESSION_MAX_AGE_SECONDS)
+
+
+def _parse_datetime(value: str) -> Optional[datetime]:
+    try:
+        if value.isdigit():
+            timestamp = int(value)
+            if timestamp > 10_000_000_000:
+                timestamp = timestamp / 1000
+            return datetime.fromtimestamp(timestamp)
+        normalized = value.replace("Z", "+00:00")
+        parsed = datetime.fromisoformat(normalized)
+        if parsed.tzinfo:
+            parsed = parsed.astimezone().replace(tzinfo=None)
+        return parsed
+    except Exception:
+        return None
diff --git a/backend/services/conversation_management_service.py b/backend/services/conversation_management_service.py
index 302ec63a8..0b7345461 100644
--- a/backend/services/conversation_management_service.py
+++ b/backend/services/conversation_management_service.py
@@ -8,6 +8,7 @@
 
 from consts.const import LANGUAGE, MODEL_CONFIG_MAPPING, MESSAGE_ROLE, DEFAULT_EN_TITLE, DEFAULT_ZH_TITLE
 from consts.model import AgentRequest, ConversationResponse, MessageRequest, MessageUnit
+from consts.exceptions import ConversationNotFoundError
 from database.conversation_db import (
     create_conversation,
     create_conversation_message,
@@ -18,12 +19,14 @@
     get_conversation,
     get_conversation_history,
     get_conversation_list,
+    get_latest_assistant_message_id,
     get_message_id_by_index,
     get_source_images_by_conversation,
     get_source_images_by_message,
     get_source_searches_by_conversation,
     get_source_searches_by_message,
     rename_conversation,
+    update_message_minio_files,
     update_message_opinion
 )
 from nexent.core.utils.observer import MessageObserver, ProcessType
@@ -224,7 +227,7 @@ def save_conversation_assistant(request: AgentRequest, messages: List[str], user
             message_list.append(message)
 
     conversation_req = MessageRequest(conversation_id=request.conversation_id, message_idx=user_role_count * 2 + 1,
-                                      role=MESSAGE_ROLE["ASSISTANT"], message=message_list, minio_files=request.minio_files)
+                                      role=MESSAGE_ROLE["ASSISTANT"], message=message_list, minio_files=None)
     save_message(conversation_req, user_id=user_id, tenant_id=tenant_id)
 
 
@@ -296,7 +299,9 @@ def update_conversation_title(conversation_id: int, title: str, user_id: str = N
     """
     success = rename_conversation(conversation_id, title, user_id)
     if not success:
-        raise Exception(f"Conversation {conversation_id} does not exist or has been deleted")
+        raise ConversationNotFoundError(
+            f"Conversation {conversation_id} does not exist or has been deleted"
+        )
     return success
 
 
@@ -509,6 +514,10 @@ def get_conversation_history_service(conversation_id: int, user_id: str) -> List
                     'opinion_flag': msg['opinion_flag']
                 }
 
+                # Add minio_files field (if any, e.g., skill-generated attachments)
+                if 'minio_files' in msg and msg['minio_files']:
+                    message_item['minio_files'] = msg['minio_files']
+
             # Add image content (if any)
             if message_id in image_by_message:
                 message_item['picture'] = image_by_message[message_id]
@@ -701,3 +710,52 @@ async def get_message_id_by_index_impl(conversation_id: int, message_index: int)
     if message_id is None:
         raise Exception("Message not found.")
     return message_id
+
+
+def save_skill_files_to_conversation(
+    conversation_id: int,
+    skill_file_uploads: List[Dict[str, Any]],
+    user_id: str,
+) -> bool:
+    """
+    Append skill file upload records to the latest assistant message in a conversation.
+
+    This persists generated documents (e.g., DOCX, XLSX created by skills) to the
+    conversation history so they appear in subsequent GET /conversation/{id} calls.
+
+    Args:
+        conversation_id: Target conversation ID
+        skill_file_uploads: List of upload metadata dicts (e.g., from upload_fileobj)
+        user_id: User ID for ownership validation
+
+    Returns:
+        bool: True if files were saved, False if no assistant message was found
+    """
+    if not skill_file_uploads:
+        return False
+
+    try:
+        message_id = get_latest_assistant_message_id(conversation_id, user_id)
+        if message_id is None:
+            logging.warning(
+                "[skill-file] no assistant message found for conversation=%s, "
+                "cannot persist skill file uploads",
+                conversation_id,
+            )
+            return False
+
+        success = update_message_minio_files(message_id, skill_file_uploads)
+        if success:
+            logging.info(
+                "[skill-file] persisted %d file(s) to message_id=%s conversation=%s",
+                len(skill_file_uploads),
+                message_id,
+                conversation_id,
+            )
+        return success
+    except Exception as exc:
+        logging.exception(
+            "[skill-file] failed to persist skill file uploads for conversation=%s",
+            conversation_id,
+        )
+        return False
diff --git a/backend/services/data_process_service.py b/backend/services/data_process_service.py
index ae3d35dcd..a7529127c 100644
--- a/backend/services/data_process_service.py
+++ b/backend/services/data_process_service.py
@@ -15,7 +15,7 @@
 import redis
 import torch
 from PIL import Image
-from celery import states, chain
+from celery import states
 from transformers import CLIPProcessor, CLIPModel
 from nexent.data_process.core import DataProcessCore
 
@@ -25,7 +25,7 @@
 from database.attachment_db import delete_file, file_exists, get_file_size_from_minio, get_file_stream, upload_file
 from utils.file_management_utils import convert_office_to_pdf
 from data_process.app import app as celery_app
-from data_process.tasks import process, forward
+from data_process.tasks import submit_process_forward_chain
 from data_process.utils import get_task_info, get_all_task_ids_from_redis
 
 # Limit concurrent LibreOffice processes to avoid resource exhaustion
@@ -54,7 +54,8 @@ def __init__(self):
 
         self._inspector = None
         self._inspector_last_time = 0
-        self._inspector_ttl = 300  # 5 minutes - inspector is expensive to create (ping all workers)
+        # 5 minutes - inspector is expensive to create (ping all workers)
+        self._inspector_ttl = 300
         self._inspector_lock = None
         self._inspector_lock = threading.Lock()
 
@@ -152,7 +153,8 @@ async def get_all_tasks(self, filter: bool = True) -> List[Dict[str, Any]]:
 
             def _normalize_runtime_meta(task: Dict[str, Any]) -> Dict[str, Any]:
                 task_name_full = task.get('name', '') or ''
-                task_name = task_name_full.split('.')[-1] if task_name_full else ''
+                task_name = task_name_full.split(
+                    '.')[-1] if task_name_full else ''
                 kwargs = task.get('kwargs') or {}
                 if isinstance(kwargs, str):
                     try:
@@ -178,35 +180,43 @@ def _normalize_runtime_meta(task: Dict[str, Any]) -> Dict[str, Any]:
             def get_active():
                 t = time.time()
                 # Create fresh inspector with short timeout for each call
-                short_inspector = celery_app.control.inspect(timeout=short_timeout)
+                short_inspector = celery_app.control.inspect(
+                    timeout=short_timeout)
                 result = short_inspector.active()
                 elapsed = time.time() - t
-                logger.info(f"[get_all_tasks] inspector.active() took {elapsed:.3f}s")
+                logger.info(
+                    f"[get_all_tasks] inspector.active() took {elapsed:.3f}s")
                 return result if result else {}
 
             def get_reserved():
                 t = time.time()
-                short_inspector = celery_app.control.inspect(timeout=short_timeout)
+                short_inspector = celery_app.control.inspect(
+                    timeout=short_timeout)
                 result = short_inspector.reserved()
                 elapsed = time.time() - t
-                logger.info(f"[get_all_tasks] inspector.reserved() took {elapsed:.3f}s")
+                logger.info(
+                    f"[get_all_tasks] inspector.reserved() took {elapsed:.3f}s")
                 return result if result else {}
 
             with concurrent.futures.ThreadPoolExecutor(max_workers=2) as executor:
                 future_active = executor.submit(get_active)
                 future_reserved = executor.submit(get_reserved)
-                active_tasks_dict = future_active.result(timeout=short_timeout + 0.5)
-                reserved_tasks_dict = future_reserved.result(timeout=short_timeout + 0.5)
+                active_tasks_dict = future_active.result(
+                    timeout=short_timeout + 0.5)
+                reserved_tasks_dict = future_reserved.result(
+                    timeout=short_timeout + 0.5)
             celery_duration = time.time() - celery_start
             if celery_duration > 0.5:
-                logger.warning(f"[get_all_tasks] Inspector took {celery_duration:.3f}s (expected <0.5s)")
+                logger.warning(
+                    f"[get_all_tasks] Inspector took {celery_duration:.3f}s (expected <0.5s)")
             if active_tasks_dict:
                 for worker, tasks in active_tasks_dict.items():
                     for task in tasks:
                         task_id = task.get('id')
                         if task_id:
                             task_ids.add(task_id)
-                            runtime_task_meta[task_id] = _normalize_runtime_meta(task)
+                            runtime_task_meta[task_id] = _normalize_runtime_meta(
+                                task)
             if reserved_tasks_dict:
                 for worker, tasks in reserved_tasks_dict.items():
                     for task in tasks:
@@ -214,7 +224,8 @@ def get_reserved():
                         if task_id:
                             task_ids.add(task_id)
                             # Keep active metadata if already present
-                            runtime_task_meta.setdefault(task_id, _normalize_runtime_meta(task))
+                            runtime_task_meta.setdefault(
+                                task_id, _normalize_runtime_meta(task))
 
             # Get task IDs from Redis backend (covers completed/failed tasks within expiry)
             try:
@@ -241,11 +252,14 @@ def get_reserved():
                     if not task_info.get('task_name') and runtime_meta.get('task_name'):
                         task_info['task_name'] = runtime_meta.get('task_name')
                     if not task_info.get('index_name') and runtime_meta.get('index_name'):
-                        task_info['index_name'] = runtime_meta.get('index_name')
+                        task_info['index_name'] = runtime_meta.get(
+                            'index_name')
                     if not task_info.get('path_or_url') and runtime_meta.get('path_or_url'):
-                        task_info['path_or_url'] = runtime_meta.get('path_or_url')
+                        task_info['path_or_url'] = runtime_meta.get(
+                            'path_or_url')
                     if not task_info.get('original_filename') and runtime_meta.get('original_filename'):
-                        task_info['original_filename'] = runtime_meta.get('original_filename')
+                        task_info['original_filename'] = runtime_meta.get(
+                            'original_filename')
 
                 if filter and not (task_info.get('index_name') and task_info.get('task_name')):
                     # Keep user-visible queued tasks even before worker updates task meta.
@@ -538,30 +552,23 @@ async def create_batch_tasks_impl(self, authorization: Optional[str], request: B
                     f"Missing required field 'index_name' in source config: {source_config}")
                 continue
 
-            # Create and submit a chain: process -> forward
-            task_chain = chain(
-                process.s(
-                    source=source,
-                    source_type=source_type,
-                    chunking_strategy=chunking_strategy,
-                    index_name=index_name,
-                    original_filename=original_filename,
-                    embedding_model_id=embedding_model_id,
-                    tenant_id=tenant_id
-                ).set(queue='process_q'),
-                forward.s(
-                    index_name=index_name,
-                    source=source,
-                    source_type=source_type,
-                    original_filename=original_filename,
-                    authorization=authorization
-                ).set(queue='forward_q')
+            chain_id = submit_process_forward_chain(
+                source=source,
+                source_type=source_type,
+                chunking_strategy=chunking_strategy,
+                index_name=index_name,
+                original_filename=original_filename,
+                authorization=authorization,
+                embedding_model_id=embedding_model_id,
+                tenant_id=tenant_id,
             )
+            if not chain_id:
+                logger.error(
+                    f"Failed to enqueue process-forward chain for source: {source}")
+                continue
 
-            task_result = task_chain.apply_async()
-
-            task_ids.append(task_result.id)
-            logger.debug(f"Created task {task_result.id} for source: {source}")
+            task_ids.append(chain_id)
+            logger.debug(f"Created task {chain_id} for source: {source}")
         logger.info(
             f"Created {len(task_ids)} individual tasks for batch processing")
         return task_ids
@@ -593,7 +600,7 @@ async def process_uploaded_text_file(self, file_content: bytes, filename: str, c
             f"Processing uploaded file: {filename} using SDK DataProcessCore")
 
         data_processor = DataProcessCore()
-        chunks = data_processor.file_process(
+        chunks, _ = data_processor.file_process(
             file_data=file_content,
             filename=filename,
             chunking_strategy=chunking_strategy
@@ -642,7 +649,8 @@ async def convert_office_to_pdf_impl(self, object_name: str, pdf_object_name: st
                 # Step 1: Download original Office file from MinIO
                 original_stream = get_file_stream(object_name)
                 if original_stream is None:
-                    raise OfficeConversionException(f"Source file not found in storage: {object_name}")
+                    raise OfficeConversionException(
+                        f"Source file not found in storage: {object_name}")
 
                 original_filename = os.path.basename(object_name)
                 input_path = os.path.join(temp_dir, original_filename)
@@ -654,10 +662,12 @@ async def convert_office_to_pdf_impl(self, object_name: str, pdf_object_name: st
                 try:
                     pdf_path = await convert_office_to_pdf(input_path, temp_dir, timeout=30)
                 except Exception as exc:
-                    raise OfficeConversionException(f"LibreOffice conversion failed: {exc}") from exc
+                    raise OfficeConversionException(
+                        f"LibreOffice conversion failed: {exc}") from exc
 
                 # Step 3: Upload converted PDF to MinIO
-                result = upload_file(file_path=pdf_path, object_name=pdf_object_name)
+                result = upload_file(file_path=pdf_path,
+                                     object_name=pdf_object_name)
                 if not result.get('success'):
                     raise OfficeConversionException(
                         f"Failed to upload PDF to MinIO: {result.get('error', 'Unknown error')}"
@@ -666,14 +676,16 @@ async def convert_office_to_pdf_impl(self, object_name: str, pdf_object_name: st
                 # Step 4: Validate the uploaded PDF (header check + minimum size)
                 remote_size = get_file_size_from_minio(pdf_object_name)
                 if remote_size <= 0:
-                    raise OfficeConversionException("PDF validation failed: cannot read remote file size")
+                    raise OfficeConversionException(
+                        "PDF validation failed: cannot read remote file size")
                 if remote_size < 100:
                     raise OfficeConversionException(
                         f"PDF validation failed: file too small ({remote_size} bytes)"
                     )
                 remote_stream = get_file_stream(pdf_object_name)
                 if remote_stream is None:
-                    raise OfficeConversionException("PDF validation failed: cannot read uploaded file")
+                    raise OfficeConversionException(
+                        "PDF validation failed: cannot read uploaded file")
                 try:
                     header = remote_stream.read(5)
                 finally:
@@ -682,7 +694,8 @@ async def convert_office_to_pdf_impl(self, object_name: str, pdf_object_name: st
                     except Exception:
                         pass
                 if not header.startswith(b'%PDF-'):
-                    raise OfficeConversionException("PDF validation failed: invalid PDF header")
+                    raise OfficeConversionException(
+                        "PDF validation failed: invalid PDF header")
 
             except OfficeConversionException:
                 # Clean up any partially-uploaded remote PDF so a future retry starts clean
@@ -690,14 +703,16 @@ async def convert_office_to_pdf_impl(self, object_name: str, pdf_object_name: st
                     delete_file(pdf_object_name)
                 raise
             except Exception as exc:
-                raise OfficeConversionException(f"Unexpected error during conversion: {exc}") from exc
+                raise OfficeConversionException(
+                    f"Unexpected error during conversion: {exc}") from exc
             finally:
                 # Step 5: Clean up local temporary directory
                 if temp_dir and os.path.exists(temp_dir):
                     try:
                         shutil.rmtree(temp_dir)
                     except Exception as cleanup_err:
-                        logger.warning(f"Failed to cleanup temp dir '{temp_dir}': {cleanup_err}")
+                        logger.warning(
+                            f"Failed to cleanup temp dir '{temp_dir}': {cleanup_err}")
 
     def convert_celery_states_to_custom(self, process_celery_state: Optional[str], forward_celery_state: Optional[str]) -> str:
         """Map Celery task states to a custom frontend state string.
diff --git a/backend/services/file_management_service.py b/backend/services/file_management_service.py
index b2850403d..585669c0c 100644
--- a/backend/services/file_management_service.py
+++ b/backend/services/file_management_service.py
@@ -52,6 +52,27 @@
 
 logger = logging.getLogger("file_management_service")
 
+ALLOWED_SKILL_UPLOAD_ROOT = Path("/mnt/nexent").resolve()
+
+
+def is_allowed_skill_upload_path(file_path: str) -> bool:
+    """Return True when a local file path is under the allowed skill upload root."""
+    if not file_path:
+        return False
+
+    try:
+        candidate_path = Path(file_path).resolve()
+    except Exception:
+        return False
+
+    try:
+        candidate_path.relative_to(ALLOWED_SKILL_UPLOAD_ROOT)
+        return True
+    except ValueError:
+        return False
+
+
+
 
 def resolve_minio_upload_folder(
     folder: Optional[str],
@@ -83,6 +104,11 @@ def resolve_minio_upload_folder(
     if folder == "knowledge_base":
         return "knowledge_base"
 
+    if folder == "skill-files":
+        if user_id:
+            return f"skill-files/{user_id}"
+        return "skill-files"
+
     if user_id:
         return f"attachments/{user_id}"
 
@@ -101,7 +127,6 @@ def check_file_access(
     - knowledge_base/*: All authenticated users can access
     - attachments/{user_id}/*: Only the owner (user_id) can access
     - images_in_attachments/*: All authenticated users can access
-    - preview/*: Accessible if the original file is accessible
 
     Args:
         object_name: File object name in storage
@@ -125,6 +150,10 @@ def check_file_access(
         # Keep them readable for authenticated users to avoid broken image citations.
         return True
 
+    if object_name.startswith("skill-files/"):
+        # Generated documents are private to the uploader and must stay user-scoped.
+        return object_name.startswith(f"skill-files/{user_id}/")
+
     # Check if file is in user's attachments folder
     # Pattern: attachments/{user_id}/*
     if object_name.startswith(f"attachments/{user_id}/"):
@@ -357,14 +386,20 @@ async def upload_to_minio(
             # Convert file content to BytesIO object
             file_obj = BytesIO(file_content)
 
+            # Store original filename before upload
+            original_filename = f.filename or ""
+
             # Upload file
             result = upload_fileobj(
                 file_obj=file_obj,
-                file_name=f.filename or "",
+                file_name=original_filename,
                 prefix=actual_folder,
                 file_size=len(file_content)
             )
 
+            # Preserve original filename in result (upload_fileobj uses it for object name generation)
+            result["original_file_name"] = original_filename
+
             # Reset file pointer for potential re-reading
             await f.seek(0)
             results.append(result)
@@ -376,6 +411,7 @@ async def upload_to_minio(
             results.append({
                 "success": False,
                 "file_name": f.filename,
+                "original_file_name": f.filename,
                 "error": "An error occurred while processing the file."
             })
     return results
diff --git a/backend/services/northbound_service.py b/backend/services/northbound_service.py
index a6eaed77d..c5493a551 100644
--- a/backend/services/northbound_service.py
+++ b/backend/services/northbound_service.py
@@ -1,31 +1,40 @@
 import asyncio
 import hashlib
+import json
 import logging
 import time
 from dataclasses import dataclass
-from typing import Any, Dict, Optional
+from os.path import basename
+from typing import Any, Dict, List, Optional
 
+from fastapi import HTTPException, UploadFile
 from fastapi.responses import StreamingResponse
 
+
+from consts.const import ASSET_OWNER_TENANT_ID
 from consts.exceptions import (
     LimitExceededError,
     UnauthorizedError,
+    ConversationNotFoundError,
 )
-from consts.model import AgentRequest
-from database.conversation_db import get_conversation_messages
+from consts.model import AgentRequest, ToolParamsRequest
+from database.conversation_db import get_conversation_messages, get_source_searches_by_message
 from database.token_db import log_token_usage, get_latest_usage_metadata
 from services.agent_service import (
     run_agent_stream,
     stop_agent_tasks,
-    list_all_agent_info_impl,
     get_agent_id_by_name
 )
+from services.agent_version_service import list_published_agents_impl
 from services.conversation_management_service import (
     save_conversation_user,
     get_conversation_list_service,
     create_new_conversation,
     update_conversation_title as update_conversation_title_service,
 )
+from services.file_management_service import upload_to_minio, resolve_minio_upload_folder, validate_urls_access
+from database.attachment_db import get_file_url, get_file_size_from_minio
+from nexent.multi_modal.utils import parse_s3_url
 
 logger = logging.getLogger("northbound_service")
 
@@ -39,6 +48,188 @@ class NorthboundContext:
     token_id: int = 0
 
 
+def _build_northbound_file_descriptor(
+    upload_result: Dict[str, Any],
+    original_file_name: str = "",
+    file_type: Optional[str] = None,
+    file_size: Optional[int] = None,
+) -> Dict[str, Any]:
+    """Normalize upload metadata for northbound API consumers."""
+    object_name = str(upload_result.get("object_name") or "").strip()
+    # Use original filename if provided, otherwise fall back to upload result or object name
+    if original_file_name:
+        file_name = original_file_name
+    else:
+        file_name = str(upload_result.get("file_name") or basename(object_name) or "")
+    # Frontend-compatible field order
+    descriptor = {
+        "object_name": object_name,
+        "name": file_name,
+        "type": file_type or "file",
+        # Use provided file_size, or from upload_result, or 0 as fallback
+        "size": file_size if file_size is not None else upload_result.get("file_size", 0),
+        # Use relative URL format matching frontend: /nexent/{object_name}
+        "url": f"/nexent/{object_name}",
+        "description": "",
+    }
+    presigned_url = upload_result.get("presigned_url")
+    if presigned_url:
+        descriptor["presigned_url"] = presigned_url
+    return descriptor
+
+
+async def upload_files_for_northbound(
+    ctx: NorthboundContext,
+    files: List[UploadFile],
+    folder: str = "attachments",
+) -> Dict[str, Any]:
+    """Upload files for northbound callers and return reusable storage references."""
+    if not files:
+        raise ValueError("No files in the request")
+
+    actual_folder = resolve_minio_upload_folder(folder, ctx.user_id, ctx.tenant_id)
+    results = await upload_to_minio(files=files, folder=actual_folder)
+    normalized_files = []
+    for result, upload_file in zip(results, files):
+        if result.get("success") and result.get("object_name"):
+            content_type = result.get("content_type", "")
+            file_type = "image" if content_type.startswith("image/") else "file"
+            # Extract original filename - use upload result first, then fallback to UploadFile
+            # The upload result contains the original filename passed to upload_fileobj
+            original_file_name = result.get("original_file_name") or upload_file.filename or ""
+            file_size = result.get("file_size", 0)
+            # If file_size is 0 but we have the UploadFile, try to get size from headers
+            if file_size == 0 and hasattr(upload_file, 'size') and upload_file.size:
+                file_size = upload_file.size
+            descriptor = _build_northbound_file_descriptor(
+                result,
+                original_file_name=original_file_name,
+                file_type=file_type,
+                file_size=file_size,
+            )
+            normalized_files.append(descriptor)
+
+    if not normalized_files:
+        raise ValueError("No valid files uploaded")
+
+    success_count = sum(1 for result in results if result.get("success", False))
+    failed_count = sum(1 for result in results if not result.get("success", False))
+
+    return {
+        "message": f"Processed {len(results)} files",
+        "requestId": ctx.request_id,
+        "summary": {
+            "total": len(results),
+            "uploaded": success_count,
+            "failed": failed_count,
+        },
+        "files": normalized_files,
+    }
+
+
+def _normalize_northbound_attachments(
+    attachments: Optional[List[Any]],
+    user_id: str,
+    tenant_id: str,
+) -> Optional[List[Dict[str, Any]]]:
+    """Convert northbound attachment references into internal minio_files objects.
+    
+    Supports two formats:
+    1. List of S3 URL strings (backward compatible): ["s3://nexent/...", "/nexent/...", "attachments/..."]
+    2. List of attachment objects (full metadata): [{"object_name": "...", "name": "...", ...}]
+    """
+    from database.attachment_db import _build_mcp_presigned_url
+
+    if attachments is None:
+        return None
+    if not isinstance(attachments, list):
+        raise ValueError("attachments must be an array")
+
+    normalized_files: List[Dict[str, Any]] = []
+    for attachment in attachments:
+        # Handle dict format (full attachment object)
+        if isinstance(attachment, dict):
+            # Use the attachment dict directly, just ensure required fields
+            normalized_file = {
+                "object_name": attachment.get("object_name", ""),
+                "name": attachment.get("name", basename(attachment.get("object_name", ""))),
+                "type": attachment.get("type", "file"),
+                "size": attachment.get("size", 0),
+                "url": attachment.get("url", ""),
+                "description": attachment.get("description", ""),
+            }
+            # Add presigned_url if available, or generate one if we have object_name
+            if "presigned_url" in attachment:
+                normalized_file["presigned_url"] = attachment["presigned_url"]
+            elif normalized_file.get("object_name"):
+                try:
+                    presigned_result = get_file_url(object_name=normalized_file["object_name"], expires=86400)
+                    if presigned_result.get("success") and presigned_result.get("url"):
+                        normalized_file["presigned_url"] = _build_mcp_presigned_url(presigned_result["url"])
+                except Exception:
+                    pass
+            normalized_files.append(normalized_file)
+            continue
+
+        # Handle string format (S3 URL)
+        if not isinstance(attachment, str) or not attachment.strip():
+            raise ValueError("attachments must contain non-empty S3 URLs or object paths")
+
+        attachment_url = attachment.strip()
+
+        # Support multiple URL formats:
+        # 1. s3://nexent/attachments/xxx.md
+        # 2. /nexent/attachments/xxx.md
+        # 3. attachments/xxx.md (relative path)
+        if attachment_url.startswith("s3://"):
+            try:
+                _, object_name = parse_s3_url(attachment_url)
+            except ValueError as exc:
+                raise ValueError(f"Invalid S3 URL format: {attachment_url}") from exc
+            validate_url = attachment_url
+        elif attachment_url.startswith("/nexent/"):
+            object_name = attachment_url[len("/nexent/"):]
+            validate_url = f"s3://nexent/{object_name}"
+        elif attachment_url.startswith("attachments/") or attachment_url.startswith("nexent/"):
+            object_name = attachment_url if attachment_url.startswith("nexent/") else attachment_url
+            validate_url = f"s3://nexent/{object_name}"
+        else:
+            raise ValueError(f"Invalid attachment format: {attachment_url}. Expected s3:// URL, /nexent/ path, or attachments/ path")
+
+        try:
+            validate_urls_access([validate_url], user_id, tenant_id)
+            presigned_result = get_file_url(object_name=object_name, expires=86400)
+        except PermissionError as exc:
+            detail = str(exc)
+            if "Invalid S3 URL format" in detail:
+                raise ValueError(detail) from exc
+            raise PermissionError(detail) from exc
+
+        # Get file size from MinIO
+        try:
+            file_size = get_file_size_from_minio(object_name)
+        except Exception:
+            file_size = 0
+
+        # Build frontend-compatible minio_files format
+        file_name = basename(object_name.rstrip("/"))
+        normalized_file = {
+            "object_name": object_name,
+            "name": file_name,
+            "type": "file",
+            "size": file_size,
+            # Use relative URL format matching frontend: /nexent/{object_name}
+            "url": f"/nexent/{object_name}",
+            "description": "",
+        }
+        # Use MCP proxy URL for presigned_url (same as frontend format)
+        if presigned_result.get("success") and presigned_result.get("url"):
+            normalized_file["presigned_url"] = _build_mcp_presigned_url(presigned_result["url"])
+        normalized_files.append(normalized_file)
+
+    return normalized_files
+
+
 # -----------------------------
 # In-memory idempotency and rate limit placeholders
 # -----------------------------
@@ -111,6 +302,12 @@ def _build_idempotency_key(*parts: Any) -> str:
     return ":".join(processed)
 
 
+def _build_title_update_idempotency_key(tenant_id: str, conversation_id: int, title: str) -> str:
+    """Build an ASCII-safe idempotency key for title updates."""
+    title_hash = hashlib.sha256(title.encode("utf-8")).hexdigest()
+    return _build_idempotency_key(tenant_id, str(conversation_id), title_hash)
+
+
 # -----------------------------
 # Agent resolver
 # -----------------------------
@@ -126,7 +323,9 @@ async def start_streaming_chat(
     conversation_id: Optional[int],
     agent_name: str,
     query: str,
+    attachments: Optional[List[Any]] = None,
     meta_data: Optional[Dict[str, Any]] = None,
+    tool_params: Optional[ToolParamsRequest] = None,
     idempotency_key: Optional[str] = None
 ) -> StreamingResponse:
     try:
@@ -145,6 +344,11 @@ async def start_streaming_chat(
         # Get history according to internal_conversation_id
         history_resp = await get_conversation_history_internal(ctx, internal_conversation_id)
         agent_id = await get_agent_id_by_name(agent_name=agent_name, tenant_id=ctx.tenant_id)
+        normalized_attachments = _normalize_northbound_attachments(
+            attachments=attachments,
+            user_id=ctx.user_id,
+            tenant_id=ctx.tenant_id,
+        )
         # Idempotency: only prevent concurrent duplicate starts
         composed_key = idempotency_key or _build_idempotency_key(ctx.tenant_id, str(conversation_id), agent_id, query)
         await idempotency_start(composed_key)
@@ -153,8 +357,9 @@ async def start_streaming_chat(
             agent_id=agent_id,
             query=query,
             history=(history_resp.get("data", {})).get("history", []),
-            minio_files=None,
+            minio_files=normalized_attachments,
             is_debug=False,
+            tool_params=tool_params,
         )
 
         # Synchronously persist the user message before starting the stream to avoid race conditions
@@ -257,15 +462,58 @@ async def list_conversations(ctx: NorthboundContext) -> Dict[str, Any]:
     return {"message": "success", "data": conversations, "requestId": ctx.request_id}
 
 
+def _format_search_record(record: Dict[str, Any]) -> Dict[str, Any]:
+    """Format a search source record for API response."""
+    search_item = {
+        "title": record.get("source_title", ""),
+        "text": record.get("source_content", ""),
+        "source_type": record.get("source_type", ""),
+        "url": record.get("source_location", ""),
+        "filename": record.get("source_title", "") if record.get("source_type") == "file" else None,
+        "published_date": None,
+        "score": float(record["score_overall"]) if record.get("score_overall") is not None else None,
+        "tool_sign": record.get("tool_sign", ""),
+        "cite_index": record.get("cite_index")
+    }
+
+    if record.get("published_date"):
+        if hasattr(record["published_date"], "strftime"):
+            search_item["published_date"] = record["published_date"].strftime("%Y-%m-%d")
+        else:
+            search_item["published_date"] = str(record["published_date"])[:10]
+
+    return search_item
+
+
 async def get_conversation_history_internal(ctx: NorthboundContext, conversation_id: int) -> Dict[str, Any]:
     """Internal helper to get conversation history without logging."""
     history = get_conversation_messages(conversation_id)
-    # Remove unnecessary fields
     result = []
     for message in history:
+        # Parse minio_files from database (stored as JSON string)
+        minio_files = []
+        raw_minio_files = message.get("minio_files")
+        if raw_minio_files:
+            try:
+                minio_files = json.loads(raw_minio_files) if isinstance(raw_minio_files, str) else raw_minio_files
+            except (json.JSONDecodeError, TypeError):
+                logger.warning(f"Failed to parse minio_files for message {message.get('message_id')}")
+
+        # Fetch search results for this message
+        message_id = message.get("message_id")
+        search_results = []
+        if message_id:
+            try:
+                search_records = get_source_searches_by_message(message_id, user_id=ctx.user_id)
+                search_results = [_format_search_record(r) for r in search_records]
+            except Exception as e:
+                logger.warning(f"Failed to get search records for message {message_id}: {str(e)}")
+
         result.append({
             "role": message["message_role"],
-            "content": message["message_content"]
+            "content": message["message_content"],
+            "minio_files": minio_files,
+            "search": search_results
         })
 
     response = {
@@ -284,7 +532,18 @@ async def get_conversation_history(ctx: NorthboundContext, conversation_id: int)
 
 async def get_agent_info_list(ctx: NorthboundContext) -> Dict[str, Any]:
     try:
-        agent_info_list = await list_all_agent_info_impl(tenant_id=ctx.tenant_id, user_id=ctx.user_id)
+        agent_info_list = await list_published_agents_impl(
+            tenant_id=ctx.tenant_id,
+            user_id=ctx.user_id,
+        )
+        # Match the same scope as /agent/published_list: non-asset-owner tenants
+        # also get the asset owner's published agents merged in.
+        if ctx.tenant_id != ASSET_OWNER_TENANT_ID:
+            asset_agent_list = await list_published_agents_impl(
+                tenant_id=ASSET_OWNER_TENANT_ID,
+                user_id=ctx.user_id,
+            )
+            agent_info_list.extend(asset_agent_list)
         # Remove internal information that partner don't need
         for agent_info in agent_info_list:
             agent_info.pop("agent_id", None)
@@ -298,7 +557,11 @@ async def update_conversation_title(ctx: NorthboundContext, conversation_id: int
     composed_key: Optional[str] = None
     try:
         # Idempotency: avoid concurrent duplicate title update for same conversation
-        composed_key = idempotency_key or _build_idempotency_key(ctx.tenant_id, str(conversation_id), title)
+        composed_key = idempotency_key or _build_title_update_idempotency_key(
+            ctx.tenant_id,
+            conversation_id,
+            title,
+        )
         await idempotency_start(composed_key)
 
         update_conversation_title_service(conversation_id, title, ctx.user_id)
@@ -324,6 +587,8 @@ async def update_conversation_title(ctx: NorthboundContext, conversation_id: int
         }
     except LimitExceededError as _:
         raise LimitExceededError("Duplicate request is still running, please wait.")
+    except ConversationNotFoundError:
+        raise
     except Exception as e:
         raise Exception(f"Failed to update conversation title for conversation_id {conversation_id}: {str(e)}")
     finally:
diff --git a/backend/services/prompt_service.py b/backend/services/prompt_service.py
index ee9704302..f1564cdbc 100644
--- a/backend/services/prompt_service.py
+++ b/backend/services/prompt_service.py
@@ -1,15 +1,17 @@
 import json
 import logging
 import queue
+import sys
 import threading
 from typing import Optional, List
 
 from jinja2 import StrictUndefined, Template
 
-from consts.const import LANGUAGE
+from consts.const import LANGUAGE, ENABLE_JIUWEN_SDK
 from consts.error_code import ErrorCode
 from consts.error_message import ErrorMessage
 from consts.exceptions import AppException
+from consts.model import AgentInfoRequest
 from database.agent_db import search_agent_info_by_agent_id, query_all_agent_info_by_tenant_id, \
     query_sub_agents_id_list
 from database.model_management_db import get_model_by_model_id
@@ -22,15 +24,31 @@
     _regenerate_agent_name_with_llm,
     _regenerate_agent_display_name_with_llm,
     _generate_unique_agent_name_with_suffix,
-    _generate_unique_display_name_with_suffix
+    _generate_unique_display_name_with_suffix,
+    update_agent,
 )
 from services.prompt_template_service import resolve_prompt_generate_template
 from utils.llm_utils import call_llm_for_system_prompt
 from utils.prompt_template_utils import (
-    get_prompt_generate_prompt_template,
     get_prompt_optimize_prompt_template,
+    get_prompt_template,
 )
 
+from dataclasses import dataclass, field
+from typing import Optional as Opt
+
+from adapters.exception import JiuwenSDKError, NexentCapabilityError
+
+
+def _get_jiuwen_adapter_class():
+    """Import Jiuwen adapter only when optimization paths need it."""
+    try:
+        from adapters import JiuwenSDKAdapter
+    except ModuleNotFoundError:
+        return None
+    return JiuwenSDKAdapter
+
+
 # Configure logging
 logger = logging.getLogger("prompt_service")
 
@@ -105,14 +123,16 @@ def generate_and_save_system_prompt_impl(agent_id: int,
     # Get knowledge base display names for few-shot examples
     # Priority: frontend-provided > database query
     if knowledge_base_display_names:
-        logger.debug(f"Using frontend-provided knowledge base display names: {knowledge_base_display_names}")
+        logger.debug(
+            f"Using frontend-provided knowledge base display names: {knowledge_base_display_names}")
     else:
         knowledge_base_display_names = get_knowledge_base_display_names(
             tool_info_list=tool_info_list,
             agent_id=agent_id,
             tenant_id=tenant_id
         )
-        logger.debug(f"Using database query for knowledge base display names: {knowledge_base_display_names}")
+        logger.debug(
+            f"Using database query for knowledge base display names: {knowledge_base_display_names}")
 
     # Handle sub-agent IDs
     if sub_agent_ids and len(sub_agent_ids) > 0:
@@ -146,7 +166,7 @@ def generate_and_save_system_prompt_impl(agent_id: int,
 
     # 1. Real-time streaming push
     final_results = {"duty": "", "constraint": "", "few_shots": "", "agent_var_name": "", "agent_display_name": "",
-                     "agent_description": ""}
+                     "agent_description": "", "greeting_message": "", "example_questions": ""}
 
     # Get all existing agent names and display names for duplicate checking (only if not in create mode)
     all_agents = query_all_agent_info_by_tenant_id(tenant_id)
@@ -192,7 +212,8 @@ def generate_and_save_system_prompt_impl(agent_id: int,
                         exclude_agent_id=agent_id,
                         agents_cache=all_agents
                     ):
-                        logger.info(f"Agent name '{agent_name}' already exists, regenerating with LLM")
+                        logger.info(
+                            f"Agent name '{agent_name}' already exists, regenerating with LLM")
                         try:
                             agent_name = _regenerate_agent_name_with_llm(
                                 original_name=agent_name,
@@ -206,10 +227,12 @@ def generate_and_save_system_prompt_impl(agent_id: int,
                                 prompt_template_id=prompt_template_id,
                                 user_id=user_id,
                             )
-                            logger.info(f"Regenerated agent name: '{agent_name}'")
+                            logger.info(
+                                f"Regenerated agent name: '{agent_name}'")
                             final_results["agent_var_name"] = agent_name
                         except Exception as e:
-                            logger.error(f"Failed to regenerate agent name with LLM: {str(e)}, using fallback")
+                            logger.error(
+                                f"Failed to regenerate agent name with LLM: {str(e)}, using fallback")
                             # Fallback: add suffix
                             agent_name = _generate_unique_agent_name_with_suffix(
                                 agent_name,
@@ -235,7 +258,8 @@ def generate_and_save_system_prompt_impl(agent_id: int,
                         exclude_agent_id=agent_id,
                         agents_cache=all_agents
                     ):
-                        logger.info(f"Agent display_name '{agent_display_name}' already exists, regenerating with LLM")
+                        logger.info(
+                            f"Agent display_name '{agent_display_name}' already exists, regenerating with LLM")
                         try:
                             agent_display_name = _regenerate_agent_display_name_with_llm(
                                 original_display_name=agent_display_name,
@@ -249,10 +273,12 @@ def generate_and_save_system_prompt_impl(agent_id: int,
                                 prompt_template_id=prompt_template_id,
                                 user_id=user_id,
                             )
-                            logger.info(f"Regenerated agent display_name: '{agent_display_name}'")
+                            logger.info(
+                                f"Regenerated agent display_name: '{agent_display_name}'")
                             final_results["agent_display_name"] = agent_display_name
                         except Exception as e:
-                            logger.error(f"Failed to regenerate agent display_name with LLM: {str(e)}, using fallback")
+                            logger.error(
+                                f"Failed to regenerate agent display_name with LLM: {str(e)}, using fallback")
                             # Fallback: add suffix
                             agent_display_name = _generate_unique_display_name_with_suffix(
                                 agent_display_name,
@@ -285,6 +311,68 @@ def generate_and_save_system_prompt_impl(agent_id: int,
     if not has_content:
         raise Exception("Failed to generate prompt content.")
 
+    # 3. Generate greeting message and example questions
+    try:
+        greeting_template = get_prompt_template('greeting_generate', language)
+        greeting_system_prompt = greeting_template.get("GREETING_SYSTEM_PROMPT", "")
+        greeting_user_prompt_template = greeting_template.get("USER_PROMPT", "")
+
+        greeting_user_prompt = Template(greeting_user_prompt_template, undefined=StrictUndefined).render({
+            "display_name": final_results.get("agent_display_name", ""),
+            "duty_description": final_results.get("duty", ""),
+            "business_description": task_description,
+            "few_shots": final_results.get("few_shots", ""),
+        })
+
+        greeting_result = call_llm_for_system_prompt(
+            model_id=model_id,
+            user_prompt=greeting_user_prompt,
+            system_prompt=greeting_system_prompt,
+            tenant_id=tenant_id,
+        )
+
+        parsed = None
+        try:
+            json_start = greeting_result.find("{")
+            json_end = greeting_result.rfind("}") + 1
+            if json_start >= 0 and json_end > json_start:
+                parsed = json.loads(greeting_result[json_start:json_end])
+        except json.JSONDecodeError:
+            logger.warning(f"Failed to parse greeting JSON from LLM output: {greeting_result}")
+
+        if parsed and "greeting_message" in parsed and "example_questions" in parsed:
+            greeting_message = parsed["greeting_message"]
+            example_questions = parsed["example_questions"]
+            if isinstance(example_questions, list) and len(example_questions) > 6:
+                example_questions = example_questions[:6]
+        else:
+            greeting_message = greeting_result.strip() if greeting_result else ""
+            example_questions = []
+
+        yield {
+            "type": "greeting_message",
+            "content": greeting_message,
+            "is_complete": True
+        }
+        yield {
+            "type": "example_questions",
+            "content": json.dumps(example_questions, ensure_ascii=False),
+            "is_complete": True
+        }
+
+        final_results["greeting_message"] = greeting_message
+        final_results["example_questions"] = json.dumps(example_questions, ensure_ascii=False)
+
+        # Update agent with greeting (skip in create mode)
+        if agent_id != 0:
+            update_agent(agent_id, AgentInfoRequest(
+                agent_id=agent_id,
+                greeting_message=greeting_message,
+                example_questions=example_questions,
+            ), user_id)
+    except Exception as e:
+        logger.warning(f"Greeting generation failed: {str(e)}, skipping greeting")
+
 def optimize_prompt_section_impl(
     agent_id: int,
     model_id: int,
@@ -339,7 +427,8 @@ def optimize_prompt_section_impl(
     prompt_context = join_info_for_optimize_prompt_section(
         prompt_for_optimize=prompt_template,
         section_type=normalized_section_type,
-        section_title=section_title or _default_prompt_section_title(normalized_section_type, language),
+        section_title=section_title or _default_prompt_section_title(
+            normalized_section_type, language),
         task_description=task_description,
         current_content=current_content,
         feedback=feedback,
@@ -398,7 +487,8 @@ def generate_system_prompt(sub_agent_info_list, task_description, tool_info_list
     # If None or >= 6, no limit (all 6 calls run concurrently)
     # If < 6, use semaphore to limit concurrent calls
     model_config = get_model_by_model_id(model_id, tenant_id)
-    concurrency_limit = model_config.get("concurrency_limit") if model_config else None
+    concurrency_limit = model_config.get(
+        "concurrency_limit") if model_config else None
 
     # Start all generation threads with concurrency control
     threads, error_holder = _start_generation_threads(
@@ -443,7 +533,8 @@ def _resolve_knowledge_base_display_names(
         agent_id=agent_id,
         tenant_id=tenant_id
     )
-    logger.debug(f"Using database query for knowledge base display names: {resolved_names}")
+    logger.debug(
+        f"Using database query for knowledge base display names: {resolved_names}")
     return resolved_names
 
 
@@ -471,8 +562,9 @@ def _resolve_prompt_generation_sub_agents(
         tenant_id=tenant_id, agent_id=agent_id
     )
 
+
 def _start_generation_threads(content, prompt_for_generate, produce_queue, latest, stop_flags, tenant_id, model_id,
-                                has_selected_resources = True, concurrency_limit: Optional[int] = None):
+                              has_selected_resources=True, concurrency_limit: Optional[int] = None):
     """Start all prompt generation threads with optional concurrency control."""
     # Shared error tracking across threads
     error_holder = {"error": None}
@@ -488,9 +580,11 @@ def _start_generation_threads(content, prompt_for_generate, produce_queue, lates
         effective_limit = concurrency_limit
 
     # Use semaphore if concurrency is limited
-    semaphore = threading.Semaphore(effective_limit) if effective_limit else None
+    semaphore = threading.Semaphore(
+        effective_limit) if effective_limit else None
     if semaphore:
-        logger.info(f"Using concurrency limit of {effective_limit} for prompt generation (total tasks: {total_tasks})")
+        logger.info(
+            f"Using concurrency limit of {effective_limit} for prompt generation (total tasks: {total_tasks})")
     else:
         logger.info("Using unlimited concurrency for prompt generation")
 
@@ -539,7 +633,8 @@ def run_and_flag(tag, sys_prompt):
             ("few_shots", prompt_for_generate["few_shots_system_prompt"]),
         ])
     else:
-        logger.info("Skipping constraint and few_shots generation: no tools or sub-agents selected")
+        logger.info(
+            "Skipping constraint and few_shots generation: no tools or sub-agents selected")
         # Mark these sections as already complete with empty content
         stop_flags["constraint"] = True
         stop_flags["few_shots"] = True
@@ -638,13 +733,15 @@ def join_info_for_generate_system_prompt(prompt_for_generate, sub_agent_info_lis
     # This is necessary because Jinja2 StrictUndefined raises an error for any
     # undefined variable, even inside an {% if %} block.
     if knowledge_base_display_names:
-        kb_names_str = ", ".join(f'"{name}"' for name in knowledge_base_display_names)
+        kb_names_str = ", ".join(
+            f'"{name}"' for name in knowledge_base_display_names)
     else:
         kb_names_str = ""
     template_context["knowledge_base_names"] = kb_names_str
 
     # Generate content using template
-    content = Template(prompt_for_generate["user_prompt"], undefined=StrictUndefined).render(template_context)
+    content = Template(
+        prompt_for_generate["user_prompt"], undefined=StrictUndefined).render(template_context)
     return content
 
 
@@ -672,7 +769,8 @@ def join_info_for_optimize_prompt_section(
     )
 
     if knowledge_base_display_names:
-        kb_names_str = ", ".join(f'"{name}"' for name in knowledge_base_display_names)
+        kb_names_str = ", ".join(
+            f'"{name}"' for name in knowledge_base_display_names)
     else:
         kb_names_str = ""
 
@@ -724,7 +822,8 @@ def get_knowledge_base_display_names(tool_info_list: List[dict], agent_id: int,
         List of knowledge base display names if knowledge_base_search tool is configured, None otherwise
     """
     # Check if knowledge_base_search tool is in the list
-    kb_tool_ids = [tool['tool_id'] for tool in tool_info_list if tool.get('name') == 'knowledge_base_search']
+    kb_tool_ids = [tool['tool_id'] for tool in tool_info_list if tool.get(
+        'name') == 'knowledge_base_search']
     if not kb_tool_ids:
         logger.debug("No knowledge_base_search tool found in tool list")
         return None
@@ -747,19 +846,23 @@ def get_knowledge_base_display_names(tool_info_list: List[dict], agent_id: int,
                     try:
                         all_index_names.extend(json.loads(index_names))
                     except json.JSONDecodeError:
-                        logger.warning(f"Failed to parse index_names JSON: {index_names}")
+                        logger.warning(
+                            f"Failed to parse index_names JSON: {index_names}")
         except Exception as e:
-            logger.warning(f"Failed to get tool instance for tool_id {kb_tool_id}: {e}")
+            logger.warning(
+                f"Failed to get tool instance for tool_id {kb_tool_id}: {e}")
 
     if not all_index_names:
-        logger.debug("No index_names configured for knowledge_base_search tool")
+        logger.debug(
+            "No index_names configured for knowledge_base_search tool")
         return None
 
     # Remove duplicates while preserving order
     unique_index_names = list(dict.fromkeys(all_index_names))
 
     # Convert to display names
-    knowledge_name_map = get_knowledge_name_map_by_index_names(unique_index_names)
+    knowledge_name_map = get_knowledge_name_map_by_index_names(
+        unique_index_names)
 
     # Return list of display names (knowledge_name) for each configured index_name
     display_names = []
@@ -768,7 +871,8 @@ def get_knowledge_base_display_names(tool_info_list: List[dict], agent_id: int,
         if display_name and display_name not in display_names:
             display_names.append(display_name)
 
-    logger.debug(f"Converted index_names {unique_index_names} to display_names: {display_names}")
+    logger.debug(
+        f"Converted index_names {unique_index_names} to display_names: {display_names}")
     return display_names if display_names else None
 
 
@@ -785,3 +889,299 @@ def get_enabled_sub_agent_description_for_generate_prompt(agent_id: int, tenant_
 
         sub_agent_info_list.append(sub_agent_info)
     return sub_agent_info_list
+
+
+# ── Jiuwen SDK 集成 ───────────────────────────────────────────────────────────
+
+
+@dataclass
+class OptimizeRequest:
+    """优化请求的统一数据结构"""
+    agent_id: int
+    model_id: int
+    task_description: str
+    section_type: str
+    section_title: str
+    current_content: str
+    feedback: str
+    mode: str = "general"
+    start_pos: Opt[int] = None
+    end_pos: Opt[int] = None
+    tool_ids: Opt[list[int]] = None
+    sub_agent_ids: Opt[list[int]] = None
+    knowledge_base_display_names: Opt[list[str]] = None
+
+
+@dataclass
+class OptimizeResult:
+    """优化结果的统一数据结构"""
+    optimized_content: str
+    source: str
+    section_type: str = ""
+    section_title: str = ""
+    original_content: str = ""
+
+
+class PromptOptimizationService:
+    """提示词优化服务 — 统一入口，模式二选一"""
+
+    def optimize_from_debug(self, agent_id: int, feedback: str, selected, history=None) -> OptimizeResult:
+        """基于调试对话自动优化整个 system prompt（完整模板）。
+
+        Args:
+            selected: OptimizeFromDebugSelected (pydantic model) or any object with user_question/assistant_answer.
+            history: Optional[List[HistoryItem]]
+        """
+        if not (feedback or "").strip():
+            raise AppException(
+                ErrorCode.COMMON_MISSING_REQUIRED_FIELD,
+                "Optimization feedback is required.",
+            )
+
+        if not self.is_jiuwen_mode_available():
+            raise NexentCapabilityError(
+                "Auto optimize from debug requires Jiuwen SDK to be enabled."
+            )
+
+        agent_info = search_agent_info_by_agent_id(
+            agent_id=agent_id, tenant_id=self.tenant_id, version_no=0)
+
+        duty = (agent_info.get("duty_prompt") or "").strip()
+        constraint = (agent_info.get("constraint_prompt") or "").strip()
+        few_shots = (agent_info.get("few_shots_prompt") or "").strip()
+
+        original_full_prompt = "\n\n".join(
+            [
+                "# Duty\n" + duty,
+                "# Constraint\n" + constraint,
+                "# FewShots\n" + few_shots,
+            ]
+        ).strip()
+
+        if not original_full_prompt:
+            raise AppException(
+                ErrorCode.COMMON_MISSING_REQUIRED_FIELD,
+                "Agent system prompt is empty.",
+            )
+
+        user_question = getattr(selected, "user_question", None) or (
+            selected.get("user_question") if isinstance(selected, dict) else "")
+        assistant_answer = getattr(selected, "assistant_answer", None) or (
+            selected.get("assistant_answer") if isinstance(selected, dict) else "")
+
+        bad_case_obj = type("_BadCase", (), {})
+        bc = bad_case_obj()
+        bc.question = user_question or ""
+        bc.answer = assistant_answer or ""
+        bc.label = ""
+        bc.reason = feedback
+
+        adapter_cls = _get_jiuwen_adapter_class()
+        if adapter_cls is None:
+            raise JiuwenSDKError("Jiuwen SDK adapter is unavailable")
+
+        adapter = adapter_cls(
+            model_id=self.model_id, tenant_id=self.tenant_id)
+
+        optimized_full_prompt = adapter.optimize_badcase(
+            prompt=original_full_prompt,
+            bad_cases=[bc],
+            language=self.language,
+        )
+
+        return OptimizeResult(
+            optimized_content=optimized_full_prompt,
+            source="jiuwen",
+            section_type="full_prompt",
+            section_title="system_prompt",
+            original_content=original_full_prompt,
+        )
+
+    def __init__(self, model_id: int, tenant_id: str, language: str):
+        self.model_id = model_id
+        self.tenant_id = tenant_id
+        self.language = language
+
+    def is_jiuwen_mode_available(self) -> bool:
+        """判断 Jiuwen SDK 模式是否可用"""
+        if not ENABLE_JIUWEN_SDK:
+            return False
+
+        return _get_jiuwen_adapter_class() is not None
+
+    def optimize(self, request: OptimizeRequest) -> OptimizeResult:
+        """统一优化入口 — 优先 Jiuwen SDK，失败则降级 nexent 原生"""
+        if self.is_jiuwen_mode_available():
+            logger.info(
+                f"[prompt-optimize] mode={request.mode}, using Jiuwen SDK")
+            try:
+                return self._optimize_with_jiuwen(request)
+            except JiuwenSDKError as e:
+                logger.warning(f"Jiuwen SDK 模式失败，降级到 nexent 原生: {e}")
+                return self._optimize_with_nexent(request)
+        else:
+            return self._optimize_with_nexent(request)
+
+    def _optimize_with_jiuwen(self, request: OptimizeRequest) -> OptimizeResult:
+        """Jiuwen SDK 模式"""
+        logger.info(
+            f"[jiuwen-optimize] mode={request.mode}, start_pos={request.start_pos}, "
+            f"end_pos={request.end_pos}, prompt_len={len(request.current_content)}, "
+            f"feedback_len={len(request.feedback)}"
+        )
+        adapter_cls = _get_jiuwen_adapter_class()
+        if adapter_cls is None:
+            raise JiuwenSDKError("Jiuwen SDK adapter is unavailable")
+
+        adapter = adapter_cls(
+            model_id=self.model_id,
+            tenant_id=self.tenant_id,
+        )
+        result = adapter.optimize(
+            prompt=request.current_content,
+            feedback=request.feedback,
+            mode=request.mode,
+            start_pos=request.start_pos,
+            end_pos=request.end_pos,
+            language=self.language,
+        )
+
+        # Jiuwen insert/select mode returns a fragment by design.
+        # We reassemble the full prompt here so frontend always receives full optimized content.
+        if request.mode == "insert":
+            if request.start_pos is None or not isinstance(request.start_pos, int):
+                raise JiuwenSDKError("insert mode requires start_pos")
+            if request.start_pos < 0 or request.start_pos > len(request.current_content):
+                raise JiuwenSDKError("insert mode start_pos out of bounds")
+            optimized_full = (
+                request.current_content[: request.start_pos]
+                + result
+                + request.current_content[request.start_pos:]
+            )
+        elif request.mode == "select":
+            if request.start_pos is None or request.end_pos is None:
+                raise JiuwenSDKError(
+                    "select mode requires start_pos and end_pos")
+            if not isinstance(request.start_pos, int) or not isinstance(request.end_pos, int):
+                raise JiuwenSDKError(
+                    "select mode start_pos/end_pos must be int")
+            if request.start_pos < 0 or request.end_pos < 0 or request.start_pos >= request.end_pos:
+                raise JiuwenSDKError("select mode start_pos/end_pos invalid")
+            if request.end_pos > len(request.current_content):
+                raise JiuwenSDKError("select mode end_pos out of bounds")
+            optimized_full = (
+                request.current_content[: request.start_pos]
+                + result
+                + request.current_content[request.end_pos:]
+            )
+        else:
+            optimized_full = result
+
+        return OptimizeResult(
+            optimized_content=optimized_full,
+            source="jiuwen",
+            section_type=request.section_type,
+            section_title=request.section_title,
+            original_content=request.current_content,
+        )
+
+    def _optimize_with_nexent(self, request: OptimizeRequest) -> OptimizeResult:
+        """nexent 原生模式 — 只支持 general 模式"""
+        if request.mode != "general":
+            raise NexentCapabilityError(
+                f"nexent 原生模式只支持 general 模式，"
+                f"当前请求 mode={request.mode} 不支持，请启用 Jiuwen SDK"
+            )
+
+        result = optimize_prompt_section_impl(
+            agent_id=request.agent_id,
+            model_id=self.model_id,
+            task_description=request.task_description,
+            tenant_id=self.tenant_id,
+            language=self.language,
+            section_type=request.section_type,
+            section_title=request.section_title,
+            current_content=request.current_content,
+            feedback=request.feedback,
+            tool_ids=request.tool_ids,
+            sub_agent_ids=request.sub_agent_ids,
+            knowledge_base_display_names=request.knowledge_base_display_names,
+        )
+        return OptimizeResult(
+            optimized_content=result["optimized_content"],
+            source="nexent",
+            section_type=result["section_type"],
+            section_title=result["section_title"],
+            original_content=result["original_content"],
+        )
+
+    def optimize_badcase(
+        self,
+        current_content: str,
+        bad_cases: list,
+        agent_id: int,
+        section_type: str,
+        section_title: str,
+        tool_ids: Opt[list[int]] = None,
+        sub_agent_ids: Opt[list[int]] = None,
+        knowledge_base_display_names: Opt[list[str]] = None,
+    ) -> OptimizeResult:
+        """坏案例优化入口 — 优先 Jiuwen SDK，失败则降级"""
+        if self.is_jiuwen_mode_available():
+            logger.info("[prompt-badcase] using Jiuwen SDK")
+            try:
+                return self._optimize_badcase_with_jiuwen(
+                    current_content, bad_cases, section_type, section_title
+                )
+            except JiuwenSDKError as e:
+                logger.warning(f"Jiuwen SDK badcase 模式失败，降级到 nexent 原生: {e}")
+                return self._optimize_badcase_with_nexent(
+                    current_content, bad_cases, agent_id, section_type, section_title,
+                    tool_ids, sub_agent_ids, knowledge_base_display_names,
+                )
+        else:
+            return self._optimize_badcase_with_nexent(
+                current_content, bad_cases, agent_id, section_type, section_title,
+                tool_ids, sub_agent_ids, knowledge_base_display_names,
+            )
+
+    def _optimize_badcase_with_jiuwen(
+        self, current_content: str, bad_cases: list, section_type: str, section_title: str
+    ) -> OptimizeResult:
+        """Jiuwen SDK 坏案例优化"""
+        adapter_cls = _get_jiuwen_adapter_class()
+        if adapter_cls is None:
+            raise JiuwenSDKError("Jiuwen SDK adapter is unavailable")
+
+        adapter = adapter_cls(
+            model_id=self.model_id,
+            tenant_id=self.tenant_id,
+        )
+        result = adapter.optimize_badcase(
+            prompt=current_content,
+            bad_cases=bad_cases,
+            language=self.language,
+        )
+        return OptimizeResult(
+            optimized_content=result,
+            source="jiuwen",
+            section_type=section_type,
+            section_title=section_title,
+            original_content=current_content,
+        )
+
+    def _optimize_badcase_with_nexent(
+        self,
+        current_content: str,
+        bad_cases: list,
+        agent_id: int,
+        section_type: str,
+        section_title: str,
+        tool_ids: Opt[list[int]] = None,
+        sub_agent_ids: Opt[list[int]] = None,
+        knowledge_base_display_names: Opt[list[str]] = None,
+    ) -> OptimizeResult:
+        """nexent 原生模式不支持坏案例优化"""
+        raise NexentCapabilityError(
+            "nexent 原生模式不支持 badcase 优化，请启用 Jiuwen SDK"
+        )
diff --git a/backend/services/remote_mcp_service.py b/backend/services/remote_mcp_service.py
index 56a73fb4b..7e77a9c43 100644
--- a/backend/services/remote_mcp_service.py
+++ b/backend/services/remote_mcp_service.py
@@ -230,7 +230,7 @@ async def add_mcp_service(
     server_url: str,
     tags: list | None,
     authorization_token: str | None,
-    custom_headers: dict | None,
+    custom_headers: dict | None = None,
     container_config: dict | None,
     registry_json: dict | None,
     enabled: bool = False,
diff --git a/backend/services/tool_configuration_service.py b/backend/services/tool_configuration_service.py
index ba51567dc..3cbf5edc5 100644
--- a/backend/services/tool_configuration_service.py
+++ b/backend/services/tool_configuration_service.py
@@ -782,6 +782,8 @@ def _validate_local_tool(
                 'embedding_model': embedding_model,
                 'rerank_model': rerank_model,
                 'display_name_to_index_map': display_name_to_index_map,
+                # Internal access control: restrict results to specific document paths (path_or_urls)
+                'document_paths': instantiation_params.get('document_paths'),
             }
             tool_instance = tool_class(**params)
         elif tool_name in ["dify_search", "datamate_search"]:
@@ -982,6 +984,7 @@ def import_openapi_service(
     tenant_id: str,
     user_id: str,
     service_description: str = None,
+    headers_template: Dict[str, Any] = None,
     force_update: bool = False
 ) -> Dict[str, Any]:
     """
@@ -995,6 +998,7 @@ def import_openapi_service(
         tenant_id: Tenant ID for multi-tenancy
         user_id: User ID for audit
         service_description: Optional service description (if not provided, reads from openapi_json.info.description)
+        headers_template: Optional default headers template
         force_update: If True, replace all existing tools for this service
 
     Returns:
@@ -1015,7 +1019,8 @@ def import_openapi_service(
         server_url=server_url,
         tenant_id=tenant_id,
         user_id=user_id,
-        description=service_description
+        description=service_description,
+        headers_template=headers_template,
     )
 
     logger.info(f"Imported service '{service_name}' for tenant {tenant_id}")
diff --git a/backend/services/user_management_service.py b/backend/services/user_management_service.py
index a983b25d3..0b38a76bc 100644
--- a/backend/services/user_management_service.py
+++ b/backend/services/user_management_service.py
@@ -18,6 +18,7 @@
     get_supabase_admin_client,
     calculate_expires_at,
     get_jwt_expiry_seconds,
+    ensure_cas_session_active_from_authorization,
     resolve_tenant_id_from_user_tenant_record,
 )
 from consts.const import (
@@ -107,6 +108,7 @@ def validate_token(token: str) -> Tuple[bool, Optional[Any]]:
     try:
         user = get_current_user_from_client(client, token)
         if user:
+            ensure_cas_session_active_from_authorization(token)
             return True, user
         return False, None
     except Exception as e:
diff --git a/backend/services/vectordatabase_service.py b/backend/services/vectordatabase_service.py
index 11c5fd9bf..dd2f6e51a 100644
--- a/backend/services/vectordatabase_service.py
+++ b/backend/services/vectordatabase_service.py
@@ -10,6 +10,7 @@
 4. Health check interface
 """
 import asyncio
+import hashlib
 import json
 import logging
 import os
@@ -28,7 +29,7 @@
 
 from consts.const import DATAMATE_URL, ES_API_KEY, ES_HOST, LANGUAGE, VectorDatabaseType, IS_SPEED_MODE, PERMISSION_EDIT, PERMISSION_READ, ASSET_OWNER_TENANT_ID
 from consts.model import ChunkCreateRequest, ChunkUpdateRequest
-from database.attachment_db import delete_file, get_file_stream
+from database.attachment_db import delete_file, file_exists, get_file_stream
 from database.knowledge_db import (
     create_knowledge_record,
     delete_knowledge_record,
@@ -353,15 +354,18 @@ def get_embedding_model(
         tenant_id: Tenant ID
         model_name: Optional display name of the embedding model to use.
                    If provided, will find the model by display_name in the tenant's model list.
+        model_type: Optional model type filter. When model_name is omitted, queries tenant
+                   model records by this type; when model_type is also omitted, prefers
+                   embedding models, then multi_embedding models.
 
     Returns:
         Tuple of (embedding model instance or None, model_id or None)
     """
     if model_name:
         try:
-            normalized_model_type = _normalize_model_type(model_type)
-            if normalized_model_type:
-                model = get_model_by_display_name(model_name, tenant_id, normalized_model_type)
+            model_type = _normalize_model_type(model_type)
+            if model_type:
+                model = get_model_by_display_name(model_name, tenant_id, model_type)
             else:
                 model = get_model_by_display_name(model_name, tenant_id)
 
@@ -372,8 +376,25 @@ def get_embedding_model(
             return _create_embedding_model(model), model.get("model_id")
         except Exception as e:
             logger.warning(f"Failed to get embedding model by name {model_name}: {e}")
+    else:
+        try:
+            if model_type:
+                records = get_model_records({"model_type": model_type}, tenant_id)
+            else:
+                records = get_model_records({"model_type": "embedding"}, tenant_id)
+                if not records:
+                    records = get_model_records({"model_type": "multi_embedding"}, tenant_id)
+
+            if records:
+                model = records[0]
+                if model.get("model_type") in ["embedding", "multi_embedding"]:
+                    return _create_embedding_model(model), model.get("model_id")
+                logger.warning(
+                    f"Resolved model is not an embedding model: {model.get('model_type')}"
+                )
+        except Exception as e:
+            logger.warning(f"Failed to get default embedding model for tenant {tenant_id}: {e}")
 
-    # No default fallback - return None, None when no model is specified or found
     return None, None
 
 
@@ -636,6 +657,7 @@ def create_knowledge_base(
             group_ids: Optional[List[int]] = None,
             embedding_model_name: Optional[str] = None,
             is_multimodal: Optional[bool] = None,
+            preserve_source_file: Optional[bool] = None,
     ):
         """
         Create a new knowledge base with a user-facing name and an internal Elasticsearch index name.
@@ -655,6 +677,8 @@ def create_knowledge_base(
             group_ids: List of group IDs (optional)
             embedding_model_name: Specific embedding model name to use (optional).
                                    If provided, will use this model instead of tenant default.
+            preserve_source_file: Whether to preserve uploaded source documents after
+                                   vectorization (optional; defaults to True when omitted).
 
         For backward compatibility, legacy callers can still use create_index() directly
         with an explicit index_name.
@@ -694,6 +718,8 @@ def create_knowledge_base(
                 knowledge_data["ingroup_permission"] = ingroup_permission
             if group_ids is not None:
                 knowledge_data["group_ids"] = group_ids
+            if preserve_source_file is not None:
+                knowledge_data["preserve_source_file"] = preserve_source_file
 
             record_info = create_knowledge_record(knowledge_data)
             index_name = record_info["index_name"]
@@ -1091,6 +1117,7 @@ def list_indices(
                         # Auto-summary settings
                         "summary_frequency": record.get("summary_frequency"),
                         "last_summary_time": record.get("last_summary_time"),
+                        "preserve_source_file": record.get("preserve_source_file", True),
                         "stats": index_stats,
                     })
 
@@ -1488,6 +1515,11 @@ async def list_files(
                     # chunk_count is already set from ES aggregation (doc_count)
                     file_data['chunk_count'] = file_data.get('chunk_count', 0)
 
+            for file_data in files:
+                file_data["source_available"] = (
+                    ElasticSearchService._compute_source_available(file_data)
+                )
+
             total_duration = time.time() - total_start_time
             logger.info(f"[list_files:complete] index={index_name}, total_files={len(files)}, "
                        f"total_duration={total_duration:.3f}s")
@@ -1498,6 +1530,100 @@ async def list_files(
             raise Exception(
                 f"Error getting file list for index {index_name}: {str(e)}")
 
+    DOCUMENT_DELETE_SCOPES = ("source_only", "full")
+
+    @staticmethod
+    def _preview_pdf_cache_object_name(object_name: str) -> str:
+        """Object key for Office-to-PDF preview cache (matches file_management_service)."""
+        name_without_ext = (
+            object_name.rsplit(".", 1)[0] if "." in object_name else object_name
+        )
+        hash_suffix = hashlib.md5(object_name.encode()).hexdigest()[:8]
+        return f"preview/converted/{name_without_ext}_{hash_suffix}.pdf"
+
+    @staticmethod
+    def _compute_source_available(file_data: Dict[str, Any]) -> bool:
+        path_or_url = file_data.get("path_or_url") or ""
+        status = file_data.get("status", "")
+        if status != "COMPLETED":
+            return True
+        if path_or_url.startswith("knowledge_base/"):
+            return file_exists(path_or_url)
+        return True
+
+    @staticmethod
+    def delete_source_file(path_or_url: str) -> Dict[str, Any]:
+        """Remove MinIO source (and preview cache); does not touch Elasticsearch."""
+        minio_result = delete_file(path_or_url)
+        deleted_minio = bool(minio_result.get("success"))
+
+        if path_or_url.startswith("knowledge_base/"):
+            preview_key = ElasticSearchService._preview_pdf_cache_object_name(
+                path_or_url
+            )
+            try:
+                if file_exists(preview_key):
+                    delete_file(preview_key)
+            except Exception as exc:
+                logger.warning(
+                    "Failed to delete preview cache for '%s': %s",
+                    path_or_url,
+                    exc,
+                )
+
+        return {"deleted_minio": deleted_minio}
+
+    @staticmethod
+    async def _assert_source_only_deletable(
+            index_name: str, path_or_url: str
+    ) -> None:
+        celery_task_files = await get_all_files_status(index_name)
+        status_info = celery_task_files.get(path_or_url)
+        if not status_info or not isinstance(status_info, dict):
+            return
+        state = status_info.get("state") or ""
+        if state and state != "COMPLETED":
+            raise ValueError(
+                f"Cannot delete source file while document is in state '{state}'. "
+                "Wait until processing completes or use scope=full to remove the document."
+            )
+
+    @staticmethod
+    async def delete_document_by_scope(
+            index_name: str,
+            path_or_url: str,
+            scope: str,
+            vdb_core: VectorDatabaseCore,
+    ) -> Dict[str, Any]:
+        if scope not in ElasticSearchService.DOCUMENT_DELETE_SCOPES:
+            raise ValueError(
+                f"Invalid scope '{scope}'. "
+                f"Must be one of: {ElasticSearchService.DOCUMENT_DELETE_SCOPES}"
+            )
+
+        if scope == "source_only":
+            await ElasticSearchService._assert_source_only_deletable(
+                index_name, path_or_url
+            )
+            minio_part = ElasticSearchService.delete_source_file(path_or_url)
+            return {
+                "status": "success",
+                "scope": scope,
+                "deleted_es_count": 0,
+                "deleted_minio": minio_part.get("deleted_minio", False),
+                "source_available": False,
+                "message": (
+                    "Source file deleted; index chunks and vectors preserved."
+                ),
+            }
+
+        result = ElasticSearchService.delete_documents(
+            index_name, path_or_url, vdb_core
+        )
+        result["scope"] = scope
+        result["source_available"] = False
+        return result
+
     @staticmethod
     def delete_documents(
             index_name: str = Path(..., description="Name of the index"),
diff --git a/backend/utils/auth_utils.py b/backend/utils/auth_utils.py
index 04e81e6e3..a7194f050 100644
--- a/backend/utils/auth_utils.py
+++ b/backend/utils/auth_utils.py
@@ -326,16 +326,13 @@ def calculate_expires_at(token: Optional[str] = None) -> int:
     return int((datetime.now() + timedelta(seconds=expiry_seconds)).timestamp())
 
 
-def _extract_user_id_from_jwt_token(authorization: str) -> Optional[str]:
+def _decode_jwt_token(authorization: str) -> dict:
     """
     Extract user ID from JWT token after verifying signature and expiration.
 
     Args:
         authorization: Authorization header value
 
-    Returns:
-        Optional[str]: User ID, return None if parsing fails
-
     Raises:
         UnauthorizedError: If token is invalid, expired, or signature verification fails
     """
@@ -355,17 +352,12 @@ def _extract_user_id_from_jwt_token(authorization: str) -> Optional[str]:
 
         # Decode and verify JWT (signature + expiration)
         # verify_aud=False: allow tokens with aud claim (e.g. test JWT, Supabase) without strict audience check
-        decoded = jwt.decode(
+        return jwt.decode(
             token,
             SUPABASE_JWT_SECRET,
             algorithms=["HS256"],
             options={"verify_exp": True, "verify_aud": False},
         )
-
-        # Extract user ID from JWT claims
-        user_id = decoded.get("sub")
-
-        return user_id
     except jwt.ExpiredSignatureError:
         logging.warning("Token expired")
         raise UnauthorizedError("Token has expired")
@@ -378,10 +370,47 @@ def _extract_user_id_from_jwt_token(authorization: str) -> Optional[str]:
     except UnauthorizedError:
         raise
     except Exception as e:
-        logging.error(f"Failed to extract user ID from token: {str(e)}")
+        logging.error(f"Failed to decode token: {str(e)}")
         raise UnauthorizedError("Invalid or expired authentication token")
 
 
+def _extract_user_id_from_jwt_token(authorization: str) -> Optional[str]:
+    """
+    Extract user ID from JWT token after verifying signature and expiration.
+    """
+    decoded = _decode_jwt_token(authorization)
+    return decoded.get("sub")
+
+
+def extract_session_id_from_authorization(authorization: Optional[str]) -> Optional[str]:
+    """Extract the sid claim without enforcing token validity, for idempotent logout."""
+    if not authorization:
+        return None
+    try:
+        token = (
+            authorization.replace("Bearer ", "")
+            if authorization.startswith("Bearer ")
+            else authorization
+        )
+        decoded = jwt.decode(token, options={"verify_signature": False})
+        sid = decoded.get("sid")
+        return str(sid) if sid else None
+    except Exception:
+        return None
+
+
+def ensure_cas_session_active_from_authorization(authorization: Optional[str]) -> None:
+    """Reject CAS-issued JWTs whose server-side session is expired or revoked."""
+    session_id = extract_session_id_from_authorization(authorization)
+    if not session_id:
+        return
+
+    from database.cas_session_db import is_cas_session_active
+
+    if not is_cas_session_active(str(session_id)):
+        raise UnauthorizedError("CAS session has expired or been revoked")
+
+
 def get_current_user_id(authorization: Optional[str] = None) -> tuple[str, str]:
     """
     Get current user ID and tenant ID from authorization token
@@ -405,10 +434,13 @@ def get_current_user_id(authorization: Optional[str] = None) -> tuple[str, str]:
         raise UnauthorizedError("No authorization header provided")
 
     try:
-        user_id = _extract_user_id_from_jwt_token(authorization)
+        decoded = _decode_jwt_token(authorization)
+        user_id = decoded.get("sub")
         if not user_id:
             raise UnauthorizedError("Invalid or expired authentication token")
 
+        ensure_cas_session_active_from_authorization(authorization)
+
         user_tenant_record = get_user_tenant_by_user_id(user_id)
         if user_tenant_record and user_tenant_record.get("tenant_id"):
             tenant_id = user_tenant_record["tenant_id"]
@@ -421,6 +453,8 @@ def get_current_user_id(authorization: Optional[str] = None) -> tuple[str, str]:
 
         return user_id, tenant_id
 
+    except UnauthorizedError:
+        raise
     except Exception as e:
         logging.error(f"Failed to get user ID and tenant ID: {str(e)}")
         raise UnauthorizedError("Invalid or expired authentication token")
@@ -472,7 +506,7 @@ def generate_test_jwt(user_id: str, expires_in: int = 3600) -> str:
     return jwt.encode(payload, MOCK_JWT_SECRET_KEY, algorithm="HS256")
 
 
-def generate_session_jwt(user_id: str, expires_in: int = 3600) -> str:
+def generate_session_jwt(user_id: str, expires_in: int = 3600, session_id: str = None) -> str:
     """Generate a signed JWT compatible with the existing auth verification flow."""
     now = int(time.time())
     payload = {
@@ -483,6 +517,8 @@ def generate_session_jwt(user_id: str, expires_in: int = 3600) -> str:
         "exp": now + expires_in,
         "iss": SUPABASE_URL,
     }
+    if session_id:
+        payload["sid"] = session_id
     return jwt.encode(payload, SUPABASE_JWT_SECRET, algorithm="HS256")
 
 
diff --git a/backend/utils/context_utils.py b/backend/utils/context_utils.py
index 740bf66df..0c3af8915 100644
--- a/backend/utils/context_utils.py
+++ b/backend/utils/context_utils.py
@@ -8,7 +8,6 @@
 allowing ContextManager to assemble them in the correct order.
 """
 
-from datetime import datetime
 from typing import TYPE_CHECKING, Any, Dict, List, Optional
 
 if TYPE_CHECKING:
@@ -508,13 +507,12 @@ def _format_agent_fallback(
     return "- 当前没有可用的助手" if language == "zh" else "- No agents are currently available"
 
 
-def _format_app_context(app_name: str, app_description: str, user_id: str, time_str: str) -> str:
+def _format_app_context(app_name: str, app_description: str, user_id: str) -> str:
     """Format application context for system prompt injection."""
     lines = [
         f"Application: {app_name}",
         f"Description: {app_description}",
         f"Current user: {user_id}",
-        f"Current time: {time_str}",
     ]
     return "\n".join(lines)
 
@@ -528,7 +526,6 @@ def _format_app_context(app_name: str, app_description: str, user_id: str, time_
 def build_skeleton_header_component(
     app_name: str,
     app_description: str,
-    time_str: str,
     user_id: str,
     language: str = "zh",
     priority: int = 100,
@@ -536,14 +533,17 @@ def build_skeleton_header_component(
     """Build SystemPromptComponent for the header section.
 
     Section: "### 基本信息" / "### Basic Information"
-    Content: Agent identity, app name/description, time, user_id
+    Content: Agent identity, app name/description, user_id.
+    Note: Current time is intentionally excluded from the system prompt so the
+    static system prefix can hit the LLM KV/prompt cache across requests. The
+    current time is injected on the user-message side instead (see CoreAgent.run).
     """
     from nexent.core.agents.agent_model import SystemPromptComponent
 
     if language == "zh":
-        content = f"### 基本信息\n你是{app_name}，{app_description}，现在是{time_str}，用户ID为{user_id}"
+        content = f"### 基本信息\n你是{app_name}，{app_description}，用户ID为{user_id}"
     else:
-        content = f"### Basic Information\nYou are {app_name}, {app_description}, it is {time_str} now"
+        content = f"### Basic Information\nYou are {app_name}, {app_description}"
 
     return SystemPromptComponent(
         content=content,
@@ -611,6 +611,11 @@ def build_skeleton_execution_flow_component(
         lines.append("   - 注意运行的代码不会被用户看到，所以如果用户需要看到代码，你需要使用'<DISPLAY:语言类型>代码</DISPLAY>'表达展示代码。")
         lines.append("   - **重要**：代码执行后，系统会返回 \"Observation:\" 标记的内容（这是真实的执行结果）。请基于这些真实结果继续下一步思考，**不要在代码执行前自行编造观察结果**。")
         lines.append("")
+        lines.append("3. 自验证：")
+        lines.append("   - 关键事件（工具调用、检索结果、代码执行、助手返回、准备最终回答）后，系统会进行显式自验证。")
+        lines.append("   - 如果自验证提示存在错误、证据不足、参数不完整或结果不可靠，必须优先修正、补充证据、重新调用工具，或清晰说明无法完成的部分。")
+        lines.append("   - 最终回答只有在自验证通过后才会展示给用户；如果系统返回 Verification feedback，请把它视为真实观察结果继续修正，不要忽略。")
+        lines.append("")
         lines.append("在思考结束后，当你认为可以回答用户问题，那么可以不生成代码，直接生成最终回答给到用户并停止循环。")
         lines.append("")
         lines.append("生成最终回答时，你需要遵循以下规范：")
@@ -652,6 +657,11 @@ def build_skeleton_execution_flow_component(
         lines.append("   - Note that executed code is not visible to users. If users need to see the code, use '<DISPLAY:language_type>code</DISPLAY>' for displaying code.")
         lines.append("   - **IMPORTANT**: After code execution, the system will return content with \"Observation:\" marker (this is the real execution result). Please continue your next thinking based on these real results. **Do NOT fabricate observation results before code execution.**")
         lines.append("")
+        lines.append("3. Self-verification:")
+        lines.append("   - After critical events (tool calls, retrieval results, code execution, agent handoffs, and final-answer preparation), the system may run explicit verification.")
+        lines.append("   - If verification reports errors, insufficient evidence, incomplete parameters, or unreliable results, you must repair the issue, gather more evidence, call tools again, or clearly state what cannot be completed.")
+        lines.append("   - The final answer is shown to the user only after verification passes. If the system returns Verification feedback, treat it as a real observation and continue revising.")
+        lines.append("")
         lines.append("After thinking, when you believe you can answer the user's question, you can generate a final answer directly to the user without generating code and stop the loop.")
         lines.append("")
         lines.append("When generating the final answer, you need to follow these specifications:")
@@ -1112,7 +1122,6 @@ def build_context_components(
     few_shots: Optional[str] = None,
     app_name: Optional[str] = None,
     app_description: Optional[str] = None,
-    time_str: Optional[str] = None,
     user_id: Optional[str] = None,
     language: str = "zh",
     is_manager: bool = True,
@@ -1167,7 +1176,6 @@ def build_context_components(
         few_shots: Example templates text
         app_name: Application name
         app_description: Application description
-        time_str: Current time string
         user_id: Current user ID
         language: Language code ('zh' or 'en')
         is_manager: Whether this is a manager agent
@@ -1188,12 +1196,11 @@ def build_context_components(
     components: List = []
 
     # 1. Header
-    if app_name and app_description and time_str and user_id:
+    if app_name and app_description and user_id:
         components.append(
             build_skeleton_header_component(
                 app_name=app_name,
                 app_description=app_description,
-                time_str=time_str,
                 user_id=user_id,
                 language=language,
             )
@@ -1328,5 +1335,4 @@ def build_app_context_string(
     Returns:
         Formatted app context string
     """
-    time_str = datetime.now().strftime("%Y-%m-%d %H:%M:%S")
-    return _format_app_context(app_name, app_description, user_id, time_str)
\ No newline at end of file
+    return _format_app_context(app_name, app_description, user_id)
diff --git a/backend/utils/http_client_utils.py b/backend/utils/http_client_utils.py
index 1c1d14af6..262c0a593 100644
--- a/backend/utils/http_client_utils.py
+++ b/backend/utils/http_client_utils.py
@@ -8,6 +8,7 @@ def create_httpx_client(
     headers: dict[str, str] | None = None,
     timeout: httpx.Timeout | None = None,
     auth: httpx.Auth | None = None,
+    **kwargs,
 ) -> AsyncClient:
     return AsyncClient(
         headers=headers,
@@ -15,4 +16,5 @@ def create_httpx_client(
         auth=auth,
         trust_env=False,
         verify=False,
+        **kwargs,
     )
diff --git a/backend/utils/memory_utils.py b/backend/utils/memory_utils.py
index ada7019a1..e3ba01d6d 100644
--- a/backend/utils/memory_utils.py
+++ b/backend/utils/memory_utils.py
@@ -1,4 +1,5 @@
 import logging
+import re
 from typing import Dict, Any
 from urllib.parse import urlparse
 
@@ -9,6 +10,11 @@
 logger = logging.getLogger("memory_utils")
 
 
+def _sanitize_index_component(value: str) -> str:
+    """Convert arbitrary text into an Elasticsearch-safe index component."""
+    return re.sub(r"[^a-z0-9_.-]", "_", value.lower())
+
+
 def build_memory_config(tenant_id: str) -> Dict[str, Any]:
     """Return a fully-validated configuration dictionary for *mem0* ``Memory``.
     """
@@ -30,9 +36,8 @@ def build_memory_config(tenant_id: str) -> Dict[str, Any]:
     es_host = f"{parsed.scheme}://{parsed.hostname}"
     es_port = parsed.port
     # Normalize repo/name to avoid problematic characters in index names
-    safe_repo = embed_raw["model_repo"].lower().replace(
-        "/", "_") if embed_raw["model_repo"] else ""
-    safe_name = embed_raw["model_name"].lower().replace("/", "_")
+    safe_repo = _sanitize_index_component(embed_raw["model_repo"]) if embed_raw["model_repo"] else ""
+    safe_name = _sanitize_index_component(embed_raw["model_name"])
     index_name = (
         f"mem0_{safe_repo}_{safe_name}_{embed_raw['max_tokens']}"
         if embed_raw["model_repo"]
@@ -73,4 +78,4 @@ def build_memory_config(tenant_id: str) -> Dict[str, Any]:
         },
         "telemetry": {"enabled": False},
     }
-    return memory_config 
\ No newline at end of file
+    return memory_config
diff --git a/backend/utils/prompt_template_utils.py b/backend/utils/prompt_template_utils.py
index 8822e5fd4..299d3bf94 100644
--- a/backend/utils/prompt_template_utils.py
+++ b/backend/utils/prompt_template_utils.py
@@ -99,6 +99,10 @@ def get_prompt_template(template_type: str, language: str = LANGUAGE["ZH"], **kw
             LANGUAGE["ZH"]: 'backend/prompts/utils/generate_title_zh.yaml',
             LANGUAGE["EN"]: 'backend/prompts/utils/generate_title_en.yaml'
         },
+        'greeting_generate': {
+            LANGUAGE["ZH"]: 'backend/prompts/utils/greeting_generate_zh.yaml',
+            LANGUAGE["EN"]: 'backend/prompts/utils/greeting_generate_en.yaml'
+        },
         'document_summary': {
             LANGUAGE["ZH"]: 'backend/prompts/document_summary_agent_zh.yaml',
             LANGUAGE["EN"]: 'backend/prompts/document_summary_agent_en.yaml'
diff --git a/doc/docs/en/quick-start/installation.md b/doc/docs/en/quick-start/installation.md
index 0b1544819..7b6a9cb76 100644
--- a/doc/docs/en/quick-start/installation.md
+++ b/doc/docs/en/quick-start/installation.md
@@ -273,6 +273,114 @@ Provider enablement rules:
 
 For local Docker, a GitHub callback example is `http://localhost:3000/api/user/oauth/callback?provider=github`. In production, use a public HTTPS domain such as `https://nexent.example.com/api/user/oauth/callback?provider=github` and register the exact same URL in the OAuth provider console.
 
+### CAS Login Configuration
+
+CAS SSO does not require the `supabase` component. Set `CAS_CALLBACK_BASE_URL` to the browser-accessible Nexent Web URL without a trailing `/`. `CAS_SERVER_URL` is the CAS Server root URL and should also not include a trailing `/`.
+
+For Docker, configure CAS in `docker/.env`:
+
+```bash
+CAS_ENABLED=true
+CAS_SERVER_URL=http://localhost:8080/cas
+CAS_VALIDATE_PATH=/p3/serviceValidate
+CAS_CALLBACK_BASE_URL=http://localhost:3000
+
+# disabled: disable the CAS login entry and automatic redirects
+# button: show CAS as an optional login button
+# force: redirect unauthenticated Nexent users to CAS automatically
+CAS_LOGIN_MODE=force
+
+# Empty means use <cas:user>; set userName to read <cas:attributes><cas:userName>
+CAS_USER_ATTRIBUTE=
+CAS_EMAIL_ATTRIBUTE=email
+CAS_ROLE_ATTRIBUTE=role
+CAS_TENANT_ATTRIBUTE=tenant_id
+CAS_ROLE_MAP_JSON={"cas-admin":"ADMIN","cas-user":"USER"}
+CAS_SESSION_MAX_AGE_SECONDS=3600
+LOCAL_SESSION_MAX_AGE_SECONDS=3600
+CAS_RENEW_BEFORE_SECONDS=300
+CAS_RENEW_TIMEOUT_SECONDS=10
+CAS_SYNTHETIC_EMAIL_DOMAIN=cas.local
+
+# Empty means Nexent logout will not call the CAS Server logout endpoint.
+# /logout is resolved against CAS_SERVER_URL.
+CAS_LOGOUT_URL=/logout
+CAS_SSL_VERIFY=true
+CAS_CA_BUNDLE=
+```
+
+Common CAS URLs:
+
+| Purpose | URL |
+|---------|-----|
+| Nexent login entry | `{CAS_CALLBACK_BASE_URL}/api/user/cas/login?redirect=/` |
+| CAS service callback | `{CAS_CALLBACK_BASE_URL}/api/user/cas/callback` |
+| CAS silent renewal callback | `{CAS_CALLBACK_BASE_URL}/api/user/cas/renew_callback` |
+| CAS single logout callback | `POST {CAS_CALLBACK_BASE_URL}/api/user/cas/logout_callback` |
+
+For Apereo CAS JSON Service Registry, create a service registration file such as `Nexent-10001.json` in the service registry directory configured by your CAS deployment. The `id` must be globally unique. This is a local Docker example:
+
+```json
+{
+  "@class": "org.apereo.cas.services.RegexRegisteredService",
+  "serviceId": "http://localhost:3000.*",
+  "name": "Nexent CAS Client",
+  "id": 10001,
+  "description": "Nexent CAS SSO client",
+  "evaluationOrder": 1,
+  "logoutType": "BACK_CHANNEL",
+  "logoutUrl": "http://localhost:3000/api/user/cas/logout_callback"
+}
+```
+
+In production, keep `CAS_SSL_VERIFY=true`; for self-signed certificates, prefer `CAS_CA_BUNDLE` and only use `CAS_SSL_VERIFY=false` for local testing.
+
+#### CAS Integration with ModelEngine
+
+When integrating with ModelEngine through the CAS protocol, deploy Nexent with the following configuration:
+
+```bash
+CAS_ENABLED=true
+CAS_SERVER_URL=https://<ModelEngine IP>:5443/SSOSvr
+CAS_VALIDATE_PATH=/p3/serviceValidate
+CAS_CALLBACK_BASE_URL=http://<Nexent IP>:3000
+CAS_LOGIN_MODE=force
+CAS_USER_ATTRIBUTE=userName
+CAS_EMAIL_ATTRIBUTE=email
+CAS_ROLE_ATTRIBUTE=userType
+CAS_TENANT_ATTRIBUTE=tenant_id
+CAS_ROLE_MAP_JSON={"1":"ADMIN","3":"DEV"}
+CAS_SESSION_MAX_AGE_SECONDS=3600
+LOCAL_SESSION_MAX_AGE_SECONDS=3600
+CAS_RENEW_BEFORE_SECONDS=300
+CAS_RENEW_TIMEOUT_SECONDS=10
+CAS_SYNTHETIC_EMAIL_DOMAIN=cas.local
+CAS_LOGOUT_URL=/logout?service=http://<Nexent IP>:3000
+CAS_SSL_VERIFY=false
+CAS_CA_BUNDLE=
+```
+
+You also need to add a CAS client service registration file in the OMS container. Use the following steps as a reference:
+
+```bash
+# Create the registration file, paste the JSON content into it, and save it.
+vim Nexent-10000001.json
+{
+  "@class": "org.apereo.cas.services.CasRegisteredService",
+  "serviceId": "http://<Nexent IP>:3000.*",
+  "name": "Nexent CAS Client",
+  "id": 1000001,
+  "description": "Nexent CAS SSO client",
+  "evaluationOrder": 1,
+  "logoutType": "BACK_CHANNEL",
+  "logoutUrl": "http://<Nexent IP>:3000/api/user/cas/logout_callback"
+}
+
+# Run the following command to copy the registration file into the container.
+kubectl cp Nexent-10000001.json model-engine/$(kubectl get pods -n model-engine -l app=oms --no-headers | awk '{print $1}'):/opt/huawei/fce/apps/platform/webapps/SSOSvr/WEB-INF/classes/services/Nexent-10000001.json
+kubectl exec -i -n model-engine $(kubectl get pods -n model-engine -l app=oms --no-headers | awk '{print $1}') -- chown tomcat:fusioncube /opt/huawei/fce/apps/platform/webapps/SSOSvr/WEB-INF/classes/services/Nexent-10000001.json
+```
+
 ### Northbound Interface Configuration (NORTHBOUND_EXTERNAL_URL)
 
 If you need to use any of the following features, configure the `NORTHBOUND_EXTERNAL_URL` environment variable:
diff --git a/doc/docs/en/quick-start/kubernetes-installation.md b/doc/docs/en/quick-start/kubernetes-installation.md
index 8253c411f..a10873c7c 100644
--- a/doc/docs/en/quick-start/kubernetes-installation.md
+++ b/doc/docs/en/quick-start/kubernetes-installation.md
@@ -291,6 +291,122 @@ Provider callback URLs:
 
 For local NodePort, a GitHub callback example is `http://localhost:30000/api/user/oauth/callback?provider=github`. In production, use a public HTTPS domain and register the exact same URL in the OAuth provider console.
 
+### CAS Login Configuration
+
+CAS SSO does not require the `supabase` component. Set `nexent-common.config.cas.callbackBaseUrl` to the browser-accessible Nexent Web URL without a trailing `/`. `nexent-common.config.cas.serverUrl` is the CAS Server root URL and should also not include a trailing `/`.
+
+Kubernetes writes CAS settings into backend environment variables through `nexent-common` `config.cas.*` values:
+
+```bash
+helm upgrade --install nexent nexent \
+  --namespace nexent --create-namespace \
+  --set nexent-common.config.cas.enabled=true \
+  --set nexent-common.config.cas.serverUrl=https://cas.example.com/cas \
+  --set nexent-common.config.cas.callbackBaseUrl=https://nexent.example.com \
+  --set nexent-common.config.cas.loginMode=force \
+  --set nexent-common.config.cas.logoutUrl=/logout
+```
+
+Configurable CAS values:
+
+| Value | Environment variable | Description |
+|-------|----------------------|-------------|
+| `nexent-common.config.cas.enabled` | `CAS_ENABLED` | Enables CAS |
+| `nexent-common.config.cas.serverUrl` | `CAS_SERVER_URL` | CAS Server root URL |
+| `nexent-common.config.cas.validatePath` | `CAS_VALIDATE_PATH` | serviceValidate path, default `/p3/serviceValidate` |
+| `nexent-common.config.cas.callbackBaseUrl` | `CAS_CALLBACK_BASE_URL` | Web entry URL; CAS callback paths are appended automatically |
+| `nexent-common.config.cas.loginMode` | `CAS_LOGIN_MODE` | `disabled`, `button`, or `force` |
+| `nexent-common.config.cas.userAttribute` | `CAS_USER_ATTRIBUTE` | User identifier attribute. Empty means use `<cas:user>` |
+| `nexent-common.config.cas.emailAttribute` | `CAS_EMAIL_ATTRIBUTE` | Email attribute |
+| `nexent-common.config.cas.roleAttribute` | `CAS_ROLE_ATTRIBUTE` | Role attribute |
+| `nexent-common.config.cas.tenantAttribute` | `CAS_TENANT_ATTRIBUTE` | Tenant attribute |
+| `nexent-common.config.cas.roleMapJson` | `CAS_ROLE_MAP_JSON` | JSON mapping from CAS roles to Nexent roles |
+| `nexent-common.config.cas.sessionMaxAgeSeconds` | `CAS_SESSION_MAX_AGE_SECONDS` | Maximum local CAS session lifetime |
+| `nexent-common.config.cas.localSessionMaxAgeSeconds` | `LOCAL_SESSION_MAX_AGE_SECONDS` | Nexent local session lifetime |
+| `nexent-common.config.cas.renewBeforeSeconds` | `CAS_RENEW_BEFORE_SECONDS` | Trigger silent renewal within this many seconds before expiry |
+| `nexent-common.config.cas.renewTimeoutSeconds` | `CAS_RENEW_TIMEOUT_SECONDS` | Silent renewal timeout |
+| `nexent-common.config.cas.syntheticEmailDomain` | `CAS_SYNTHETIC_EMAIL_DOMAIN` | Domain used when CAS does not return an email |
+| `nexent-common.config.cas.logoutUrl` | `CAS_LOGOUT_URL` | CAS logout URL. Empty means Nexent logout will not call the CAS Server logout endpoint |
+| `nexent-common.config.cas.sslVerify` | `CAS_SSL_VERIFY` | Whether to verify CAS Server TLS certificates |
+| `nexent-common.config.cas.caBundle` | `CAS_CA_BUNDLE` | Custom CA bundle path |
+
+Common CAS URLs:
+
+| Purpose | URL |
+|---------|-----|
+| Nexent login entry | `{CAS_CALLBACK_BASE_URL}/api/user/cas/login?redirect=/` |
+| CAS service callback | `{CAS_CALLBACK_BASE_URL}/api/user/cas/callback` |
+| CAS silent renewal callback | `{CAS_CALLBACK_BASE_URL}/api/user/cas/renew_callback` |
+| CAS single logout callback | `POST {CAS_CALLBACK_BASE_URL}/api/user/cas/logout_callback` |
+
+For Apereo CAS JSON Service Registry, create a service registration file such as `Nexent-10001.json` in the service registry directory configured by your CAS deployment. The `id` must be globally unique. This is a local NodePort example:
+
+```json
+{
+  "@class": "org.apereo.cas.services.RegexRegisteredService",
+  "serviceId": "http://localhost:30000.*",
+  "name": "Nexent CAS Client",
+  "id": 10001,
+  "description": "Nexent CAS SSO client",
+  "evaluationOrder": 1,
+  "logoutType": "BACK_CHANNEL",
+  "logoutUrl": "http://localhost:30000/api/user/cas/logout_callback"
+}
+```
+
+In production, keep `CAS_SSL_VERIFY=true`; for self-signed certificates, prefer `CAS_CA_BUNDLE` and only use `CAS_SSL_VERIFY=false` for local testing.
+
+#### CAS Integration with ModelEngine
+
+When integrating with ModelEngine through the CAS protocol, use a values file to configure Nexent. This avoids complex command-line escaping for `CAS_ROLE_MAP_JSON`.
+
+Create `cas-modelengine-values.yaml`:
+
+```yaml
+nexent-common:
+  config:
+    cas:
+      enabled: true
+      serverUrl: "https://<ModelEngine IP>:5443/SSOSvr"
+      validatePath: "/p3/serviceValidate"
+      callbackBaseUrl: "http://<Nexent IP>:30000"
+      loginMode: "force"
+      userAttribute: "userName"
+      emailAttribute: "email"
+      roleAttribute: "userType"
+      tenantAttribute: "tenant_id"
+      roleMapJson: '{"1":"ADMIN","3":"DEV"}'
+      sessionMaxAgeSeconds: 3600
+      localSessionMaxAgeSeconds: 3600
+      renewBeforeSeconds: 300
+      renewTimeoutSeconds: 10
+      syntheticEmailDomain: "cas.local"
+      logoutUrl: "/logout?service=http://<Nexent IP>:30000"
+      sslVerify: false
+      caBundle: ""
+```
+
+You also need to add a CAS client service registration file in the OMS container. Use the following steps as a reference:
+
+```bash
+# Create the registration file, paste the JSON content into it, and save it.
+vim Nexent-10000001.json
+{
+  "@class": "org.apereo.cas.services.CasRegisteredService",
+  "serviceId": "http://<Nexent IP>:30000.*",
+  "name": "Nexent CAS Client",
+  "id": 1000001,
+  "description": "Nexent CAS SSO client",
+  "evaluationOrder": 1,
+  "logoutType": "BACK_CHANNEL",
+  "logoutUrl": "http://<Nexent IP>:30000/api/user/cas/logout_callback"
+}
+
+# Run the following command to copy the registration file into the container.
+kubectl cp Nexent-10000001.json model-engine/$(kubectl get pods -n model-engine -l app=oms --no-headers | awk '{print $1}'):/opt/huawei/fce/apps/platform/webapps/SSOSvr/WEB-INF/classes/services/Nexent-10000001.json
+kubectl exec -i -n model-engine $(kubectl get pods -n model-engine -l app=oms --no-headers | awk '{print $1}') -- chown tomcat:fusioncube /opt/huawei/fce/apps/platform/webapps/SSOSvr/WEB-INF/classes/services/Nexent-10000001.json
+```
+
 ## 🔍 Troubleshooting
 
 ### Check Pod Status
diff --git a/doc/docs/en/user-guide/agent-development.md b/doc/docs/en/user-guide/agent-development.md
index 7637cd620..8e6b47d4f 100644
--- a/doc/docs/en/user-guide/agent-development.md
+++ b/doc/docs/en/user-guide/agent-development.md
@@ -111,6 +111,18 @@ In the External A2A Agent list, you can view and manage all discovered external
 > - Batch integrate all agents from the same service registry through Nacos discovery
 > - Configure protocols to meet the requirements of different agent service providers
 
+###### Integrate [DataAgent](https://gitcode.com/datagallery/dataagent) A2A Agent via URL
+
+1. Refer to the [DataAgent documentation](https://gitcode.com/datagallery/dataagent#%F0%9F%8C%90-a2a-10-%E6%9C%8D%E5%8A%A1%E6%A8%A1%E5%BC%8F) and start DataAgent in A2A service mode.
+   > Nexent does not currently support agents that require authentication. Do not set `auth-token` when starting DataAgent.
+
+<div style="display: flex; justify-content: left;">
+  <img src="./assets/agent-development/dataagent_deploy.png" style="width: 80%; height: auto;" />
+</div>
+
+2. Refer to [Discover Agent via URL](#discover-agent-via-url) to integrate the agent. The URL is `http://<IP>:9999/.well-known/agent-card.json`.
+3. Refer to [Manage Discovered External Agents](#manage-discovered-external-agents) to configure the invocation protocol, and select HTTP + JSON for integration.
+
 ### 🛠️ Select Agent Tools
 
 Agents can use various tools to complete tasks, such as knowledge base search, file parsing, image parsing, email sending/receiving, file management, and other local tools. They can also integrate third-party MCP tools or custom tools.
diff --git a/doc/docs/en/user-guide/assets/agent-development/dataagent_deploy.png b/doc/docs/en/user-guide/assets/agent-development/dataagent_deploy.png
new file mode 100644
index 000000000..46fa9fde3
Binary files /dev/null and b/doc/docs/en/user-guide/assets/agent-development/dataagent_deploy.png differ
diff --git a/doc/docs/zh/quick-start/installation.md b/doc/docs/zh/quick-start/installation.md
index 871cae0cc..6d3538b90 100644
--- a/doc/docs/zh/quick-start/installation.md
+++ b/doc/docs/zh/quick-start/installation.md
@@ -269,6 +269,111 @@ Provider 启用规则：
 
 本地默认回调示例为 `http://localhost:3000/api/user/oauth/callback?provider=github`。生产环境应改为公网 HTTPS 域名，例如 `https://nexent.example.com/api/user/oauth/callback?provider=github`，并在 OAuth provider 控制台中登记相同地址。
 
+### CAS 登录配置
+
+CAS SSO 不依赖 `supabase`。启用 CAS 时，请将 `CAS_CALLBACK_BASE_URL` 设置为浏览器可访问的 Nexent Web 地址，且不要带结尾 `/`。`CAS_SERVER_URL` 是 CAS Server 根地址，也不要带结尾 `/`。
+
+Docker 部署在 `docker/.env` 中配置 CAS：
+
+```bash
+CAS_ENABLED=true
+CAS_SERVER_URL=http://localhost:8080/cas
+CAS_VALIDATE_PATH=/p3/serviceValidate
+CAS_CALLBACK_BASE_URL=http://localhost:3000
+
+# disabled: 禁用 CAS 登录入口和自动跳转
+# button: 在登录页显示 CAS 登录按钮
+# force: 未登录访问 Nexent 时自动跳转到 CAS
+CAS_LOGIN_MODE=force
+
+# 为空时使用 <cas:user>；填写 userName 时从 <cas:attributes><cas:userName> 取用户标识
+CAS_USER_ATTRIBUTE=
+CAS_EMAIL_ATTRIBUTE=email
+CAS_ROLE_ATTRIBUTE=role
+CAS_TENANT_ATTRIBUTE=tenant_id
+CAS_ROLE_MAP_JSON={"cas-admin":"ADMIN","cas-user":"USER"}
+CAS_SESSION_MAX_AGE_SECONDS=3600
+LOCAL_SESSION_MAX_AGE_SECONDS=3600
+CAS_RENEW_BEFORE_SECONDS=300
+CAS_RENEW_TIMEOUT_SECONDS=10
+CAS_SYNTHETIC_EMAIL_DOMAIN=cas.local
+
+# 为空时 Nexent 主动退出不会调用 CAS Server 登出接口。
+# 可配置为 /logout，系统会基于 CAS_SERVER_URL 拼接。
+CAS_LOGOUT_URL=/logout
+CAS_SSL_VERIFY=true
+CAS_CA_BUNDLE=
+```
+
+常用 CAS 地址：
+
+| 用途 | 地址 |
+|------|------|
+| Nexent 登录入口 | `{CAS_CALLBACK_BASE_URL}/api/user/cas/login?redirect=/` |
+| CAS service 回调 | `{CAS_CALLBACK_BASE_URL}/api/user/cas/callback` |
+| CAS 无感续期回调 | `{CAS_CALLBACK_BASE_URL}/api/user/cas/renew_callback` |
+| CAS 单点登出回调 | `POST {CAS_CALLBACK_BASE_URL}/api/user/cas/logout_callback` |
+
+Apereo CAS 使用 JSON Service Registry 时，可以新增一个服务注册文件，例如 `Nexent-10001.json`。文件需要放到 CAS 部署配置的 service registry 目录中，`id` 必须全局唯一。下面是本地 Docker 示例：
+
+```json
+{
+  "@class": "org.apereo.cas.services.RegexRegisteredService",
+  "serviceId": "http://localhost:3000.*",
+  "name": "Nexent CAS Client",
+  "id": 10001,
+  "description": "Nexent CAS SSO client",
+  "evaluationOrder": 1,
+  "logoutType": "BACK_CHANNEL",
+  "logoutUrl": "http://localhost:3000/api/user/cas/logout_callback"
+}
+```
+
+生产环境建议保持 `CAS_SSL_VERIFY=true`；自签名证书优先配置 `CAS_CA_BUNDLE`，仅本地验证时再临时设置 `CAS_SSL_VERIFY=false`。
+
+#### CAS对接ModelEngine
+当使用CAS协议对接ModelEngine时，可以使用如下配置部署Nexent：
+```bash
+CAS_ENABLED=true
+CAS_SERVER_URL=https://<ModelEngine IP>:5443/SSOSvr
+CAS_VALIDATE_PATH=/p3/serviceValidate
+CAS_CALLBACK_BASE_URL=http://<Nexent IP>:3000
+CAS_LOGIN_MODE=force
+CAS_USER_ATTRIBUTE=userName
+CAS_EMAIL_ATTRIBUTE=email
+CAS_ROLE_ATTRIBUTE=userType
+CAS_TENANT_ATTRIBUTE=tenant_id
+CAS_ROLE_MAP_JSON={"1":"ADMIN","3":"DEV"}
+CAS_SESSION_MAX_AGE_SECONDS=3600
+LOCAL_SESSION_MAX_AGE_SECONDS=3600
+CAS_RENEW_BEFORE_SECONDS=300
+CAS_RENEW_TIMEOUT_SECONDS=10
+CAS_SYNTHETIC_EMAIL_DOMAIN=cas.local
+CAS_LOGOUT_URL=/logout?service=http://<Nexent IP>:3000
+CAS_SSL_VERIFY=false
+CAS_CA_BUNDLE=
+```
+
+同时，需要进入oms容器添加cas client的注册配置文件，参考如下步骤：
+```bash
+# 创建注册配置文件，将json部分输入文件并保存
+vim Nexent-10000001.json
+{
+  "@class": "org.apereo.cas.services.CasRegisteredService",
+  "serviceId": "http://<Nexent IP>:3000.*",
+  "name": "Nexent CAS Client",
+  "id": 1000001,
+  "description": "Nexent CAS SSO client",
+  "evaluationOrder": 1,
+  "logoutType": "BACK_CHANNEL",
+  "logoutUrl": "http://<Nexent IP>:3000/api/user/cas/logout_callback"
+}
+
+# 执行如下命令，将配置文件拷贝到容器中
+kubectl cp Nexent-10000001.json model-engine/$(kubectl get pods -n model-engine -l app=oms --no-headers | awk '{print $1}'):/opt/huawei/fce/apps/platform/webapps/SSOSvr/WEB-INF/classes/services/Nexent-10000001.json
+kubectl exec -i -n model-engine $(kubectl get pods -n model-engine -l app=oms --no-headers | awk '{print $1}') -- chown tomcat:fusioncube /opt/huawei/fce/apps/platform/webapps/SSOSvr/WEB-INF/classes/services/Nexent-10000001.json
+```
+
 ### 北向接口配置 (NORTHBOUND_EXTERNAL_URL)
 
 如果您需要使用以下功能，需要配置 `NORTHBOUND_EXTERNAL_URL` 环境变量：
diff --git a/doc/docs/zh/quick-start/kubernetes-installation.md b/doc/docs/zh/quick-start/kubernetes-installation.md
index 47d2af816..7229f1ea8 100644
--- a/doc/docs/zh/quick-start/kubernetes-installation.md
+++ b/doc/docs/zh/quick-start/kubernetes-installation.md
@@ -291,6 +291,122 @@ Provider 回调地址：
 
 本地 NodePort 默认回调示例为 `http://localhost:30000/api/user/oauth/callback?provider=github`。生产环境应改为公网 HTTPS 域名，并在 OAuth provider 控制台中登记相同地址。
 
+### CAS 登录配置
+
+CAS SSO 不依赖 `supabase`。启用 CAS 时，请将 `nexent-common.config.cas.callbackBaseUrl` 设置为浏览器可访问的 Nexent Web 地址，且不要带结尾 `/`。`nexent-common.config.cas.serverUrl` 是 CAS Server 根地址，也不要带结尾 `/`。
+
+Kubernetes 部署通过 `nexent-common` 的 `config.cas.*` values 写入后端环境变量：
+
+```bash
+helm upgrade --install nexent nexent \
+  --namespace nexent --create-namespace \
+  --set nexent-common.config.cas.enabled=true \
+  --set nexent-common.config.cas.serverUrl=https://cas.example.com/cas \
+  --set nexent-common.config.cas.callbackBaseUrl=https://nexent.example.com \
+  --set nexent-common.config.cas.loginMode=force \
+  --set nexent-common.config.cas.logoutUrl=/logout
+```
+
+可配置的 CAS values：
+
+| Values | 对应环境变量 | 说明 |
+|--------|--------------|------|
+| `nexent-common.config.cas.enabled` | `CAS_ENABLED` | 是否启用 CAS |
+| `nexent-common.config.cas.serverUrl` | `CAS_SERVER_URL` | CAS Server 根地址 |
+| `nexent-common.config.cas.validatePath` | `CAS_VALIDATE_PATH` | serviceValidate 路径，默认 `/p3/serviceValidate` |
+| `nexent-common.config.cas.callbackBaseUrl` | `CAS_CALLBACK_BASE_URL` | Web 入口地址，CAS 回调路径会自动拼接 |
+| `nexent-common.config.cas.loginMode` | `CAS_LOGIN_MODE` | `disabled`、`button` 或 `force` |
+| `nexent-common.config.cas.userAttribute` | `CAS_USER_ATTRIBUTE` | 用户标识属性。为空时使用 `<cas:user>` |
+| `nexent-common.config.cas.emailAttribute` | `CAS_EMAIL_ATTRIBUTE` | 邮箱属性 |
+| `nexent-common.config.cas.roleAttribute` | `CAS_ROLE_ATTRIBUTE` | 角色属性 |
+| `nexent-common.config.cas.tenantAttribute` | `CAS_TENANT_ATTRIBUTE` | 租户属性 |
+| `nexent-common.config.cas.roleMapJson` | `CAS_ROLE_MAP_JSON` | CAS 角色到 Nexent 角色的 JSON 映射 |
+| `nexent-common.config.cas.sessionMaxAgeSeconds` | `CAS_SESSION_MAX_AGE_SECONDS` | CAS 本地会话最长有效期 |
+| `nexent-common.config.cas.localSessionMaxAgeSeconds` | `LOCAL_SESSION_MAX_AGE_SECONDS` | Nexent 本地会话有效期 |
+| `nexent-common.config.cas.renewBeforeSeconds` | `CAS_RENEW_BEFORE_SECONDS` | 距离过期多少秒内触发无感续期 |
+| `nexent-common.config.cas.renewTimeoutSeconds` | `CAS_RENEW_TIMEOUT_SECONDS` | 无感续期等待超时时间 |
+| `nexent-common.config.cas.syntheticEmailDomain` | `CAS_SYNTHETIC_EMAIL_DOMAIN` | CAS 未返回邮箱时生成邮箱使用的域名 |
+| `nexent-common.config.cas.logoutUrl` | `CAS_LOGOUT_URL` | CAS 登出地址。为空时 Nexent 主动退出不调用 CAS Server 登出接口 |
+| `nexent-common.config.cas.sslVerify` | `CAS_SSL_VERIFY` | 访问 CAS Server 时是否校验证书 |
+| `nexent-common.config.cas.caBundle` | `CAS_CA_BUNDLE` | 自定义 CA bundle 路径 |
+
+常用 CAS 地址：
+
+| 用途 | 地址 |
+|------|------|
+| Nexent 登录入口 | `{CAS_CALLBACK_BASE_URL}/api/user/cas/login?redirect=/` |
+| CAS service 回调 | `{CAS_CALLBACK_BASE_URL}/api/user/cas/callback` |
+| CAS 无感续期回调 | `{CAS_CALLBACK_BASE_URL}/api/user/cas/renew_callback` |
+| CAS 单点登出回调 | `POST {CAS_CALLBACK_BASE_URL}/api/user/cas/logout_callback` |
+
+Apereo CAS 使用 JSON Service Registry 时，可以新增一个服务注册文件，例如 `Nexent-10001.json`。文件需要放到 CAS 部署配置的 service registry 目录中，`id` 必须全局唯一。本地 NodePort 示例：
+
+```json
+{
+  "@class": "org.apereo.cas.services.RegexRegisteredService",
+  "serviceId": "http://localhost:30000.*",
+  "name": "Nexent CAS Client",
+  "id": 10001,
+  "description": "Nexent CAS SSO client",
+  "evaluationOrder": 1,
+  "logoutType": "BACK_CHANNEL",
+  "logoutUrl": "http://localhost:30000/api/user/cas/logout_callback"
+}
+```
+
+生产环境建议保持 `CAS_SSL_VERIFY=true`；自签名证书优先配置 `CAS_CA_BUNDLE`，仅本地验证时再临时设置 `CAS_SSL_VERIFY=false`。
+
+#### CAS 对接 ModelEngine
+
+当使用 CAS 协议对接 ModelEngine 时，建议通过 values 文件配置 Nexent，避免 `CAS_ROLE_MAP_JSON` 在命令行中转义复杂。
+
+创建 `cas-modelengine-values.yaml`：
+
+```yaml
+nexent-common:
+  config:
+    cas:
+      enabled: true
+      serverUrl: "https://<ModelEngine IP>:5443/SSOSvr"
+      validatePath: "/p3/serviceValidate"
+      callbackBaseUrl: "http://<Nexent IP>:30000"
+      loginMode: "force"
+      userAttribute: "userName"
+      emailAttribute: "email"
+      roleAttribute: "userType"
+      tenantAttribute: "tenant_id"
+      roleMapJson: '{"1":"ADMIN","3":"DEV"}'
+      sessionMaxAgeSeconds: 3600
+      localSessionMaxAgeSeconds: 3600
+      renewBeforeSeconds: 300
+      renewTimeoutSeconds: 10
+      syntheticEmailDomain: "cas.local"
+      logoutUrl: "/logout?service=http://<Nexent IP>:30000"
+      sslVerify: false
+      caBundle: ""
+```
+
+同时，需要进入 OMS 容器添加 CAS client 的注册配置文件，参考如下步骤：
+
+```bash
+# 创建注册配置文件，将 JSON 部分输入文件并保存
+vim Nexent-10000001.json
+{
+  "@class": "org.apereo.cas.services.CasRegisteredService",
+  "serviceId": "http://<Nexent IP>:30000.*",
+  "name": "Nexent CAS Client",
+  "id": 1000001,
+  "description": "Nexent CAS SSO client",
+  "evaluationOrder": 1,
+  "logoutType": "BACK_CHANNEL",
+  "logoutUrl": "http://<Nexent IP>:30000/api/user/cas/logout_callback"
+}
+
+# 执行如下命令，将配置文件拷贝到容器中
+kubectl cp Nexent-10000001.json model-engine/$(kubectl get pods -n model-engine -l app=oms --no-headers | awk '{print $1}'):/opt/huawei/fce/apps/platform/webapps/SSOSvr/WEB-INF/classes/services/Nexent-10000001.json
+kubectl exec -i -n model-engine $(kubectl get pods -n model-engine -l app=oms --no-headers | awk '{print $1}') -- chown tomcat:fusioncube /opt/huawei/fce/apps/platform/webapps/SSOSvr/WEB-INF/classes/services/Nexent-10000001.json
+```
+
 ## 🔍 故障排查
 
 ### 查看 Pod 状态
diff --git a/doc/docs/zh/sdk/vector-database.md b/doc/docs/zh/sdk/vector-database.md
index 940af9c33..b940400fd 100644
--- a/doc/docs/zh/sdk/vector-database.md
+++ b/doc/docs/zh/sdk/vector-database.md
@@ -579,7 +579,11 @@ python -m nexent.service.vectordatabase_service
   - 参数:
     - `index_name`: 索引名称 (路径参数)
     - `path_or_url`: 文档路径或URL (查询参数)
-  - 返回示例: `{"status": "success", "deleted_count": 1}`
+    - `scope`: 删除范围 (查询参数，默认 `full`)
+      - `source_only`: 仅删除 MinIO 源文件，保留 ES 中的切片与向量（检索仍可用，预览不可用）
+      - `full`: 删除 ES 文档、MinIO 源文件，并清理相关 Redis 任务记录
+  - 返回示例 (`source_only`): `{"status": "success", "scope": "source_only", "deleted_es_count": 0, "deleted_minio": true, "source_available": false}`
+  - 返回示例 (`full`): `{"status": "success", "scope": "full", "deleted_es_count": 5, "deleted_minio": true}`
 
 #### 搜索操作
 
@@ -728,8 +732,11 @@ curl -X POST "http://localhost:8000/indices/search/hybrid" \
     "weight_accurate": 0.3
   }'
 
-# 删除文档
-curl -X DELETE "http://localhost:8000/indices/my_documents/documents?path_or_url=https://example.com/doc1"
+# 删除源文件（保留索引）
+curl -X DELETE "http://localhost:8000/indices/my_documents/documents?path_or_url=knowledge_base/doc1.pdf&scope=source_only"
+
+# 从知识库彻底移除文档
+curl -X DELETE "http://localhost:8000/indices/my_documents/documents?path_or_url=knowledge_base/doc1.pdf&scope=full"
 
 # 创建索引
 curl -X POST "http://localhost:8000/indices/my_documents"
diff --git a/doc/docs/zh/user-guide/agent-development.md b/doc/docs/zh/user-guide/agent-development.md
index 3edf31de7..40805aeea 100644
--- a/doc/docs/zh/user-guide/agent-development.md
+++ b/doc/docs/zh/user-guide/agent-development.md
@@ -113,6 +113,17 @@ Nexent 支持通过 A2A 协议与第三方 Agent 进行通信。您可以通过
 > - 通过 Nacos 发现批量接入同一服务注册中心的所有 Agent
 > - 配置协议以兼容不同 Agent 服务提供商的要求
 
+
+###### 通过URL对接[DataAgent](https://gitcode.com/datagallery/dataagent) A2A Agent
+1. 参考[DataAgent文档](https://gitcode.com/datagallery/dataagent#%F0%9F%8C%90-a2a-10-%E6%9C%8D%E5%8A%A1%E6%A8%A1%E5%BC%8F)以A2A服务模式启动DataAgent
+   >当前Nexent不支持带认证的agent，启动DataAgent时请勿设置auth-token
+<div style="display: flex; justify-content: left;">
+  <img src="./assets/agent-development/dataagent_deploy.png" style="width: 80%; height: auto;" />
+</div>
+
+2. 参考[通过 URL 发现 Agent](#通过-url-发现-agent)接入agent，url为http://\<IP\>:9999/.well-known/agent-card.json
+3. 参考[管理已发现的外部 Agent](#管理已发现的外部-agent)配置调用协议，选择HTTP+JSON方式接入
+
 ### 🛠️ 选择智能体的工具
 
 智能体可以使用各种工具来完成任务，如知识库检索、文件解析、图片解析、收发邮件、文件管理等本地工具，也可接入第三方 MCP 工具，或自定义工具。
diff --git a/doc/docs/zh/user-guide/assets/agent-development/dataagent_deploy.png b/doc/docs/zh/user-guide/assets/agent-development/dataagent_deploy.png
new file mode 100644
index 000000000..46fa9fde3
Binary files /dev/null and b/doc/docs/zh/user-guide/assets/agent-development/dataagent_deploy.png differ
diff --git a/doc/procedural-memory-verification.md b/doc/procedural-memory-verification.md
new file mode 100644
index 000000000..ea9f53290
--- /dev/null
+++ b/doc/procedural-memory-verification.md
@@ -0,0 +1,315 @@
+# Procedural Memory Verification Report
+
+## Summary
+**Status: ⚠️ FULLY SUPPORTED but REQUIRES OPTIONAL DEPENDENCY**
+
+Procedural memory is a fully implemented feature in mem0ai version 0.1.117, **BUT it requires `langchain-core` to be installed separately**. Without this dependency, the feature will fail at runtime.
+
+---
+
+## ⚠️ CRITICAL FINDING: Optional Dependency Required
+
+**Your colleague is partially correct.** The procedural memory code is NOT empty (it's 50 lines of real implementation), but it has a critical dependency issue:
+
+### The Problem
+
+The `_create_procedural_memory()` method contains:
+
+```python
+try:
+    from langchain_core.messages.utils import convert_to_messages
+except Exception:
+    logger.error(
+        "Import error while loading langchain-core. "
+        "Please install 'langchain-core' to use procedural memory."
+    )
+    raise  # ← Fails here if langchain-core not installed
+```
+
+### Reality Check
+
+| Aspect | Status |
+|--------|--------|
+| Code exists? | ✅ Yes, 50 lines of real implementation |
+| Code is empty/stub? | ❌ No, it's fully implemented |
+| Works out of the box? | ❌ **NO** - requires `langchain-core` package |
+| Documented requirement? | ⚠️ Only in error message, not in main docs |
+
+### Why Your Colleague Thought It Was Empty
+
+1. They called `memory.add(..., memory_type="procedural_memory")`
+2. Got `ImportError: No module named 'langchain_core'`
+3. Saw the error and concluded "it doesn't work" or "it's empty"
+4. This is understandable - the feature exists but is **disabled by default**
+
+---
+
+## Verification Results
+
+### 1. API Support ✅
+The `memory_type` parameter is available in both `AsyncMemory.add()` and `Memory.add()`:
+
+```python
+async def add(
+    self,
+    messages,
+    *,
+    user_id: Optional[str] = None,
+    agent_id: Optional[str] = None,
+    run_id: Optional[str] = None,
+    metadata: Optional[Dict[str, Any]] = None,
+    infer: bool = True,
+    memory_type: Optional[str] = None,  # ✅ SUPPORTED
+    prompt: Optional[str] = None,
+    llm=None
+)
+```
+
+### 2. MemoryType Enum ✅
+Located in `mem0.configs.enums.MemoryType`:
+
+```python
+class MemoryType(Enum):
+    SEMANTIC = "semantic_memory"
+    EPISODIC = "episodic_memory"
+    PROCEDURAL = "procedural_memory"  # ✅ AVAILABLE
+```
+
+### 3. Implementation ✅
+The `_create_procedural_memory()` method exists in both `AsyncMemory` and `Memory` classes:
+
+**AsyncMemory signature:**
+```python
+async def _create_procedural_memory(
+    self,
+    messages,
+    metadata=None,
+    llm=None,
+    prompt=None
+)
+```
+
+**Memory (sync) signature:**
+```python
+def _create_procedural_memory(
+    self,
+    messages,
+    metadata=None,
+    prompt=None
+)
+```
+
+### 4. Validation Logic ✅
+The `add()` method validates `memory_type` and enforces constraints:
+
+```python
+# Only "procedural_memory" is accepted
+if memory_type is not None and memory_type != MemoryType.PROCEDURAL.value:
+    raise ValueError(
+        f"Invalid 'memory_type'. Please pass {MemoryType.PROCEDURAL.value} "
+        "to create procedural memories."
+    )
+
+# agent_id is REQUIRED for procedural memory
+if agent_id is not None and memory_type == MemoryType.PROCEDURAL.value:
+    results = await self._create_procedural_memory(
+        messages, metadata=processed_metadata, prompt=prompt, llm=llm
+    )
+    return results
+```
+
+### 5. System Prompt ✅
+A comprehensive 5,100-character system prompt exists in `mem0.configs.prompts.PROCEDURAL_MEMORY_SYSTEM_PROMPT`:
+
+**Purpose:** Records and preserves complete interaction history between human and AI agent
+
+**Structure:**
+- Overview (Global Metadata)
+  - Task Objective
+  - Progress Status
+- Sequential Agent Actions (Numbered Steps)
+  - Agent Action
+  - Action Result (Mandatory, Unmodified)
+  - Embedded Metadata (Key Findings, Navigation History, Errors, Current Context)
+
+**Key Guidelines:**
+1. Preserve every output verbatim
+2. Maintain chronological order
+3. Include exact data (URLs, element indexes, error messages, JSON responses)
+4. Output only the structured summary
+
+---
+
+## Usage Example
+
+```python
+from mem0 import AsyncMemory
+
+# Initialize memory
+memory = await AsyncMemory.from_config(config)
+
+# Create procedural memory
+messages = [
+    {"role": "user", "content": "Search for AI news"},
+    {"role": "assistant", "content": "I'll search for recent AI news..."},
+    # ... more conversation history
+]
+
+result = await memory.add(
+    messages=messages,
+    user_id="user_123",
+    agent_id="research_agent",  # ⚠️ REQUIRED for procedural memory
+    memory_type="procedural_memory",
+    metadata={
+        "task": "AI news research",
+        "session_id": "session_456"
+    }
+)
+
+# Result format:
+# {
+#     "results": [
+#         {
+#             "id": "memory_id_here",
+#             "memory": "## Summary of the agent's execution history...",
+#             "event": "ADD"
+#         }
+#     ]
+# }
+```
+
+---
+
+## Requirements & Constraints
+
+### Required Parameters
+- ✅ `agent_id`: **MUST** be provided when using `memory_type="procedural_memory"`
+- ✅ `metadata`: **MUST** be provided (cannot be None)
+- ✅ `messages`: List of conversation messages to summarize
+
+### Optional Parameters
+- `prompt`: Custom prompt to override default `PROCEDURAL_MEMORY_SYSTEM_PROMPT`
+- `llm`: Custom LangChain ChatModel (async version only)
+
+### Validation Rules
+1. `memory_type` must be exactly `"procedural_memory"` (or None)
+2. If `memory_type="procedural_memory"` is set, `agent_id` must be provided
+3. `metadata` cannot be None for procedural memories
+
+---
+
+## Implementation Details
+
+### How It Works
+1. **Validation**: Checks `memory_type` and required parameters
+2. **Prompt Construction**: Uses default or custom system prompt
+3. **LLM Summarization**: Calls LLM to generate comprehensive execution summary
+4. **Embedding**: Generates embedding for the summary
+5. **Storage**: Stores in vector database with `metadata["memory_type"] = "procedural_memory"`
+6. **Return**: Returns memory ID and summary text
+
+### Async vs Sync
+- **AsyncMemory**: Supports custom LangChain `llm` parameter
+- **Memory**: Uses internal LLM from config only
+
+---
+
+## Integration with Nexent
+
+### Current Status
+The Nexent codebase does **NOT** currently use procedural memory. The `memory_type` parameter is not passed in any `add_memory()` calls.
+
+### Recommended Integration Points
+
+1. **Agent Service** (`backend/services/agent_service.py`):
+   - Detect when agent completes a multi-step task
+   - Call `add_memory_in_levels()` with `memory_type="procedural_memory"`
+   - Pass the full conversation history as messages
+
+2. **Memory Service** (`sdk/nexent/memory/memory_service.py`):
+   - Add `memory_type` parameter to `add_memory()` and `add_memory_in_levels()`
+   - Pass through to mem0's `add()` method
+
+3. **Agent Run Info** (`sdk/nexent/core/agents/agent_model.py`):
+   - Add `memory_type` field to track if current run should create procedural memory
+
+### Example Integration
+
+```python
+# In agent_service.py, after agent completes a complex task
+if task_complexity >= threshold:  # Your logic here
+    await add_memory_in_levels(
+        messages=conversation_history,
+        memory_config=memory_ctx.memory_config,
+        tenant_id=memory_ctx.tenant_id,
+        user_id=memory_ctx.user_id,
+        agent_id=memory_ctx.agent_id,
+        memory_levels=["agent", "user_agent"],
+        memory_type="procedural_memory",  # ✅ NEW PARAMETER
+        metadata={
+            "task_type": "complex_research",
+            "duration_seconds": duration,
+            "steps_completed": step_count
+        }
+    )
+```
+
+---
+
+## Conclusion
+
+Procedural memory is a **fully functional feature** in mem0ai==0.1.117, **BUT it requires an optional dependency**. It provides:
+
+- ✅ Complete API support
+- ✅ Comprehensive system prompt (5,100 characters)
+- ✅ Proper validation and error handling
+- ✅ Both sync and async implementations
+- ✅ Integration with existing memory infrastructure
+- ⚠️ **REQUIRES `langchain-core` package to be installed**
+
+### The Truth About "Empty Function" Claims
+
+**The code is NOT empty.** It's a 50-line implementation that:
+1. Calls LLM to generate execution summary
+2. Creates embeddings
+3. Stores in vector database
+4. Returns proper results
+
+**However, it fails at runtime** if `langchain-core` is not installed, which is why your colleague might have thought it was a no-op.
+
+### How to Enable
+
+**Option 1: Install the dependency**
+```bash
+pip install langchain-core
+```
+
+**Option 2: Add to Nexent's dependencies**
+```toml
+# In sdk/pyproject.toml
+dependencies = [
+    # ... existing deps ...
+    "langchain-core>=0.1.0",  # Required for procedural memory
+]
+```
+
+**Option 3: Make it optional with fallback**
+```python
+try:
+    result = await memory.add(..., memory_type="procedural_memory")
+except ImportError as e:
+    if "langchain-core" in str(e):
+        logger.warning("Procedural memory requires langchain-core. Using regular memory.")
+        result = await memory.add(...)  # Fallback
+    else:
+        raise
+```
+
+### Final Recommendation
+
+This feature **can be integrated into Nexent**, but you must:
+1. Add `langchain-core` to dependencies, OR
+2. Implement graceful fallback when dependency is missing, OR
+3. Document it as an optional feature requiring extra installation
+
+Without addressing the dependency issue, procedural memory will fail at runtime despite having complete implementation code.
diff --git a/docker/.env.example b/docker/.env.example
index c34300523..3970efb95 100644
--- a/docker/.env.example
+++ b/docker/.env.example
@@ -226,3 +226,27 @@ OAUTH_CALLBACK_BASE_URL=http://localhost:3000
 
 # Asset owner role (opt-in; default false). Set true to enable ASSET_OWNER.
 ENABLE_ASSET_OWNER_ROLE=false
+
+# ===== CAS SSO Configuration =====
+CAS_ENABLED=false
+CAS_SERVER_URL=
+CAS_VALIDATE_PATH=/p3/serviceValidate
+CAS_CALLBACK_BASE_URL=http://localhost:3000
+# Supported values:
+# - disabled: disable CAS login entry and automatic CAS redirects.
+# - button: show CAS as an optional login entry.
+# - force: automatically redirect unauthenticated users to CAS login.
+CAS_LOGIN_MODE=disabled
+CAS_USER_ATTRIBUTE=
+CAS_EMAIL_ATTRIBUTE=email
+CAS_ROLE_ATTRIBUTE=role
+CAS_TENANT_ATTRIBUTE=tenant_id
+CAS_ROLE_MAP_JSON=
+CAS_SESSION_MAX_AGE_SECONDS=3600
+LOCAL_SESSION_MAX_AGE_SECONDS=3600
+CAS_RENEW_BEFORE_SECONDS=300
+CAS_RENEW_TIMEOUT_SECONDS=10
+CAS_SYNTHETIC_EMAIL_DOMAIN=cas.local
+CAS_LOGOUT_URL=/logout
+CAS_SSL_VERIFY=true
+CAS_CA_BUNDLE=
diff --git a/docker/deploy.sh b/docker/deploy.sh
index 2069330d1..fbf3664b5 100755
--- a/docker/deploy.sh
+++ b/docker/deploy.sh
@@ -1367,7 +1367,7 @@ main_deploy() {
   echo "--------------------------------"
   echo ""
 
-  APP_VERSION="latest"
+  APP_VERSION="$(get_app_version)"
   if [ -z "$APP_VERSION" ]; then
     echo "❌ Failed to get app version, please check the backend/consts/const.py file"
     exit 1
diff --git a/docker/init.sql b/docker/init.sql
index 0668def01..046bdecf1 100644
--- a/docker/init.sql
+++ b/docker/init.sql
@@ -230,6 +230,7 @@ CREATE TABLE IF NOT EXISTS "knowledge_record_t" (
   "summary_frequency" varchar(10) COLLATE "pg_catalog"."default",
   "last_summary_time" timestamp(0),
   "last_doc_update_time" timestamp(0),
+  "preserve_source_file" boolean NOT NULL DEFAULT true,
   CONSTRAINT "knowledge_record_t_pk" PRIMARY KEY ("knowledge_id")
 );
 ALTER TABLE "knowledge_record_t" OWNER TO "root";
@@ -251,6 +252,7 @@ COMMENT ON COLUMN "knowledge_record_t"."created_by" IS 'User who created the rec
 COMMENT ON COLUMN "knowledge_record_t"."summary_frequency" IS 'Auto-summary frequency: 1h, 3h, 6h, 1d, 1w, or NULL (disabled)';
 COMMENT ON COLUMN "knowledge_record_t"."last_summary_time" IS 'Timestamp of last summary generation';
 COMMENT ON COLUMN "knowledge_record_t"."last_doc_update_time" IS 'Timestamp of last document add/delete operation, used for auto-summary optimization to skip unnecessary summary regeneration';
+COMMENT ON COLUMN "knowledge_record_t"."preserve_source_file" IS 'Whether to preserve uploaded source documents after vectorization';
 COMMENT ON COLUMN "knowledge_record_t"."updated_by" IS 'Last updater ID, audit field';
 COMMENT ON COLUMN "knowledge_record_t"."created_by" IS 'Creator ID, audit field';
 COMMENT ON TABLE "knowledge_record_t" IS 'Records knowledge base description and status information';
@@ -337,9 +339,12 @@ CREATE TABLE IF NOT EXISTS nexent.ag_tenant_agent_t (
     is_new BOOLEAN DEFAULT FALSE,
     provide_run_summary BOOLEAN DEFAULT FALSE,
     enable_context_manager BOOLEAN DEFAULT FALSE,
+    verification_config JSONB,
     version_no INTEGER DEFAULT 0 NOT NULL,
     current_version_no INTEGER NULL,
     ingroup_permission VARCHAR(30),
+    greeting_message TEXT,
+    example_questions JSONB,
     create_time TIMESTAMP WITHOUT TIME ZONE DEFAULT CURRENT_TIMESTAMP,
     update_time TIMESTAMP WITHOUT TIME ZONE DEFAULT CURRENT_TIMESTAMP,
     created_by VARCHAR(100),
@@ -397,6 +402,9 @@ COMMENT ON COLUMN nexent.ag_tenant_agent_t.version_no IS 'Version number. 0 = dr
 COMMENT ON COLUMN nexent.ag_tenant_agent_t.current_version_no IS 'Current published version number. NULL means no version published yet';
 COMMENT ON COLUMN nexent.ag_tenant_agent_t.ingroup_permission IS 'In-group permission: EDIT, READ_ONLY, PRIVATE';
 COMMENT ON COLUMN nexent.ag_tenant_agent_t.enable_context_manager IS 'Whether to enable context management (compression) for this agent';
+COMMENT ON COLUMN nexent.ag_tenant_agent_t.verification_config IS 'Layered ReAct self-verification configuration';
+COMMENT ON COLUMN nexent.ag_tenant_agent_t.greeting_message IS 'Agent greeting message displayed on chat initial screen';
+COMMENT ON COLUMN nexent.ag_tenant_agent_t.example_questions IS 'List of example questions for starting a conversation with this agent';
 
 -- Create index for is_new queries
 CREATE INDEX IF NOT EXISTS idx_ag_tenant_agent_t_is_new
@@ -715,6 +723,7 @@ CREATE TABLE IF NOT EXISTS nexent.ag_agent_relation_t (
     parent_agent_id INTEGER,
     tenant_id VARCHAR(100),
     version_no INTEGER DEFAULT 0 NOT NULL,
+    selected_agent_version_no INTEGER,
     create_time TIMESTAMP WITHOUT TIME ZONE DEFAULT CURRENT_TIMESTAMP,
     update_time TIMESTAMP WITHOUT TIME ZONE DEFAULT CURRENT_TIMESTAMP,
     created_by VARCHAR(100),
@@ -747,6 +756,7 @@ COMMENT ON COLUMN nexent.ag_agent_relation_t.selected_agent_id IS 'Selected agen
 COMMENT ON COLUMN nexent.ag_agent_relation_t.parent_agent_id IS 'Parent agent ID';
 COMMENT ON COLUMN nexent.ag_agent_relation_t.tenant_id IS 'Tenant ID';
 COMMENT ON COLUMN nexent.ag_agent_relation_t.version_no IS 'Version number. 0 = draft/editing state, >=1 = published snapshot';
+COMMENT ON COLUMN nexent.ag_agent_relation_t.selected_agent_version_no IS 'Pinned version of selected_agent_id. NULL = use child current published version at runtime (legacy/draft).';
 COMMENT ON COLUMN nexent.ag_agent_relation_t.create_time IS 'Creation time, audit field';
 COMMENT ON COLUMN nexent.ag_agent_relation_t.update_time IS 'Update time, audit field';
 COMMENT ON COLUMN nexent.ag_agent_relation_t.created_by IS 'Creator ID, audit field';
@@ -1260,7 +1270,6 @@ CREATE TABLE IF NOT EXISTS nexent.ag_skill_info_t (
     config_schemas JSON,
     config_values JSON,
     source VARCHAR(30) DEFAULT 'official',
-    tenant_id VARCHAR(100),
     created_by VARCHAR(100),
     create_time TIMESTAMP WITHOUT TIME ZONE DEFAULT CURRENT_TIMESTAMP,
     updated_by VARCHAR(100),
@@ -1900,3 +1909,31 @@ FOR EACH ROW
 EXECUTE FUNCTION update_mcp_community_record_update_time();
 
 COMMENT ON TRIGGER update_mcp_community_record_update_time_trigger ON nexent.mcp_community_record_t IS 'Trigger to maintain update_time';
+
+CREATE TABLE IF NOT EXISTS nexent.user_cas_session_t (
+    cas_session_id SERIAL PRIMARY KEY,
+    session_id VARCHAR(100) NOT NULL UNIQUE,
+    user_id VARCHAR(100) NOT NULL,
+    cas_user_id VARCHAR(200) NOT NULL,
+    cas_session_index VARCHAR(500),
+    status VARCHAR(30) NOT NULL DEFAULT 'active',
+    expires_at TIMESTAMP NOT NULL,
+    revoked_at TIMESTAMP,
+    create_time TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
+    update_time TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
+    created_by VARCHAR(100),
+    updated_by VARCHAR(100),
+    delete_flag VARCHAR(1) DEFAULT 'N'
+);
+
+CREATE INDEX IF NOT EXISTS ix_user_cas_session_session_id
+    ON nexent.user_cas_session_t (session_id);
+CREATE INDEX IF NOT EXISTS ix_user_cas_session_user_id
+    ON nexent.user_cas_session_t (user_id);
+CREATE INDEX IF NOT EXISTS ix_user_cas_session_cas_user_id
+    ON nexent.user_cas_session_t (cas_user_id);
+
+COMMENT ON TABLE nexent.user_cas_session_t IS 'Server-side session records for CAS SSO login and logout synchronization';
+COMMENT ON COLUMN nexent.user_cas_session_t.session_id IS 'JWT sid claim for revocation checks';
+COMMENT ON COLUMN nexent.user_cas_session_t.cas_user_id IS 'User identifier returned by CAS';
+COMMENT ON COLUMN nexent.user_cas_session_t.cas_session_index IS 'CAS SessionIndex or service ticket';
diff --git a/docker/official-skills-zip/create-docx.zip b/docker/official-skills-zip/create-docx.zip
new file mode 100644
index 000000000..aa53e82b0
Binary files /dev/null and b/docker/official-skills-zip/create-docx.zip differ
diff --git a/docker/sql/v2.2.0_0526_add_cas_session_t.sql b/docker/sql/v2.2.0_0526_add_cas_session_t.sql
new file mode 100644
index 000000000..3f1aab4fa
--- /dev/null
+++ b/docker/sql/v2.2.0_0526_add_cas_session_t.sql
@@ -0,0 +1,27 @@
+CREATE TABLE IF NOT EXISTS nexent.user_cas_session_t (
+    cas_session_id SERIAL PRIMARY KEY,
+    session_id VARCHAR(100) NOT NULL UNIQUE,
+    user_id VARCHAR(100) NOT NULL,
+    cas_user_id VARCHAR(200) NOT NULL,
+    cas_session_index VARCHAR(500),
+    status VARCHAR(30) NOT NULL DEFAULT 'active',
+    expires_at TIMESTAMP NOT NULL,
+    revoked_at TIMESTAMP,
+    create_time TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
+    update_time TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
+    created_by VARCHAR(100),
+    updated_by VARCHAR(100),
+    delete_flag VARCHAR(1) DEFAULT 'N'
+);
+
+CREATE INDEX IF NOT EXISTS ix_user_cas_session_session_id
+    ON nexent.user_cas_session_t (session_id);
+CREATE INDEX IF NOT EXISTS ix_user_cas_session_user_id
+    ON nexent.user_cas_session_t (user_id);
+CREATE INDEX IF NOT EXISTS ix_user_cas_session_cas_user_id
+    ON nexent.user_cas_session_t (cas_user_id);
+
+COMMENT ON TABLE nexent.user_cas_session_t IS 'Server-side session records for CAS SSO login and logout synchronization';
+COMMENT ON COLUMN nexent.user_cas_session_t.session_id IS 'JWT sid claim for revocation checks';
+COMMENT ON COLUMN nexent.user_cas_session_t.cas_user_id IS 'User identifier returned by CAS';
+COMMENT ON COLUMN nexent.user_cas_session_t.cas_session_index IS 'CAS SessionIndex or service ticket';
diff --git a/docker/sql/v2.2.1_0601_add_agent_verification_config.sql b/docker/sql/v2.2.1_0601_add_agent_verification_config.sql
new file mode 100644
index 000000000..d3882e1e2
--- /dev/null
+++ b/docker/sql/v2.2.1_0601_add_agent_verification_config.sql
@@ -0,0 +1,7 @@
+-- Migration: Add layered ReAct self-verification config to agents
+-- Description: Stores per-agent verification controls for step-level and final-answer validation.
+
+ALTER TABLE nexent.ag_tenant_agent_t
+ADD COLUMN IF NOT EXISTS verification_config JSONB;
+
+COMMENT ON COLUMN nexent.ag_tenant_agent_t.verification_config IS 'Layered ReAct self-verification configuration';
diff --git a/docker/sql/v2.2.1_0601_add_preserve_source_file_to_knowledge_record_t.sql b/docker/sql/v2.2.1_0601_add_preserve_source_file_to_knowledge_record_t.sql
new file mode 100644
index 000000000..30b588a51
--- /dev/null
+++ b/docker/sql/v2.2.1_0601_add_preserve_source_file_to_knowledge_record_t.sql
@@ -0,0 +1,8 @@
+-- Migration: Add preserve_source_file to knowledge_record_t table
+-- Date: 2026-06-01
+-- Description: Whether to preserve uploaded source documents after vectorization (default: true)
+
+ALTER TABLE nexent.knowledge_record_t
+ADD COLUMN IF NOT EXISTS preserve_source_file BOOLEAN NOT NULL DEFAULT true;
+
+COMMENT ON COLUMN nexent.knowledge_record_t.preserve_source_file IS 'Whether to preserve uploaded source documents after vectorization';
diff --git a/docker/sql/v2.2.1_0603_add_greeting_fields_to_ag_tenant_agent_t.sql b/docker/sql/v2.2.1_0603_add_greeting_fields_to_ag_tenant_agent_t.sql
new file mode 100644
index 000000000..7786bb902
--- /dev/null
+++ b/docker/sql/v2.2.1_0603_add_greeting_fields_to_ag_tenant_agent_t.sql
@@ -0,0 +1,15 @@
+-- Migration: Add greeting_message and example_questions columns to ag_tenant_agent_t table
+-- Date: 2026-06-03
+-- Description: Add greeting message and example questions fields for agent chat initial screen
+
+-- Add greeting_message column to ag_tenant_agent_t table
+ALTER TABLE nexent.ag_tenant_agent_t
+ADD COLUMN IF NOT EXISTS greeting_message TEXT;
+
+-- Add example_questions column to ag_tenant_agent_t table
+ALTER TABLE nexent.ag_tenant_agent_t
+ADD COLUMN IF NOT EXISTS example_questions JSONB;
+
+-- Add comments to the columns
+COMMENT ON COLUMN nexent.ag_tenant_agent_t.greeting_message IS 'Agent greeting message displayed on chat initial screen';
+COMMENT ON COLUMN nexent.ag_tenant_agent_t.example_questions IS 'List of example questions for starting a conversation with this agent';
\ No newline at end of file
diff --git a/docker/sql/v2.2.1_0605_add_ag_agent_repository_t.sql b/docker/sql/v2.2.1_0605_add_ag_agent_repository_t.sql
new file mode 100644
index 000000000..d719fc5aa
--- /dev/null
+++ b/docker/sql/v2.2.1_0605_add_ag_agent_repository_t.sql
@@ -0,0 +1,96 @@
+-- Migration: Add ag_agent_repository_t table
+-- Date: 2026-06-05
+-- Description: Agent marketplace repository for frozen shareable agent snapshots.
+
+SET search_path TO nexent;
+
+BEGIN;
+
+CREATE SEQUENCE IF NOT EXISTS nexent.ag_agent_repository_t_agent_repository_id_seq;
+
+CREATE TABLE IF NOT EXISTS nexent.ag_agent_repository_t (
+    agent_repository_id BIGINT NOT NULL DEFAULT nextval('nexent.ag_agent_repository_t_agent_repository_id_seq'),
+    publisher_tenant_id VARCHAR(100) NOT NULL,
+    publisher_user_id VARCHAR(100) NOT NULL,
+    agent_id INTEGER NOT NULL,
+    source_version_no INTEGER NOT NULL,
+    name VARCHAR(100) NOT NULL,
+    display_name VARCHAR(100),
+    description TEXT,
+    author VARCHAR(100),
+    category_id INTEGER,
+    tags TEXT[],
+    tool_count INTEGER,
+    version_label VARCHAR(100),
+    agent_info_json JSONB NOT NULL,
+    status VARCHAR(30) DEFAULT 'NOT_SHARED',
+    create_time TIMESTAMP WITHOUT TIME ZONE DEFAULT CURRENT_TIMESTAMP,
+    update_time TIMESTAMP WITHOUT TIME ZONE DEFAULT CURRENT_TIMESTAMP,
+    created_by VARCHAR(100),
+    updated_by VARCHAR(100),
+    delete_flag VARCHAR(1) DEFAULT 'N',
+    CONSTRAINT ag_agent_repository_t_pkey PRIMARY KEY (agent_repository_id)
+);
+
+ALTER SEQUENCE nexent.ag_agent_repository_t_agent_repository_id_seq
+    OWNED BY nexent.ag_agent_repository_t.agent_repository_id;
+
+ALTER TABLE nexent.ag_agent_repository_t OWNER TO root;
+
+COMMENT ON TABLE nexent.ag_agent_repository_t IS 'Agent marketplace repository for frozen shareable agent snapshots';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.agent_repository_id IS 'Agent repository listing ID, unique primary key';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.publisher_tenant_id IS 'Publisher tenant ID';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.publisher_user_id IS 'Publisher user ID';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.agent_id IS 'Root agent ID from ag_tenant_agent_t; upsert key with publisher_tenant_id';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.source_version_no IS 'Published version number frozen at share time';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.name IS 'Root agent programmatic name for display and search';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.display_name IS 'Root agent display name';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.description IS 'Root agent description';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.author IS 'Agent author';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.category_id IS 'Optional marketplace category ID';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.tags IS 'Marketplace tags';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.tool_count IS 'Total tool count across all agents in the bundle (display only)';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.version_label IS 'Repository entry version label for display (e.g. v1.0)';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.agent_info_json IS 'Frozen ExportAndImportDataFormat snapshot with optional skills';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.status IS 'Listing status: NOT_SHARED (未共享) / PENDING_REVIEW (待审核) / REJECTED (审核驳回) / SHARED (已共享)';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.create_time IS 'Creation time';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.update_time IS 'Update time';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.created_by IS 'Creator ID';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.updated_by IS 'Updater ID';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.delete_flag IS 'Soft delete flag: Y/N';
+
+CREATE UNIQUE INDEX IF NOT EXISTS uq_agent_repository_tenant_agent_active
+    ON nexent.ag_agent_repository_t (publisher_tenant_id, agent_id)
+    WHERE delete_flag = 'N';
+
+CREATE INDEX IF NOT EXISTS idx_agent_repository_publisher_delete
+    ON nexent.ag_agent_repository_t (publisher_tenant_id, delete_flag);
+
+CREATE INDEX IF NOT EXISTS idx_agent_repository_status_delete
+    ON nexent.ag_agent_repository_t (status, delete_flag);
+
+CREATE INDEX IF NOT EXISTS idx_agent_repository_name_delete
+    ON nexent.ag_agent_repository_t (name, delete_flag);
+
+CREATE INDEX IF NOT EXISTS idx_agent_repository_tags_gin
+    ON nexent.ag_agent_repository_t USING GIN (tags);
+
+CREATE OR REPLACE FUNCTION update_ag_agent_repository_update_time()
+RETURNS TRIGGER AS $$
+BEGIN
+    NEW.update_time = CURRENT_TIMESTAMP;
+    RETURN NEW;
+END;
+$$ LANGUAGE plpgsql;
+
+COMMENT ON FUNCTION update_ag_agent_repository_update_time() IS 'Auto-update update_time for ag_agent_repository_t';
+
+DROP TRIGGER IF EXISTS update_ag_agent_repository_update_time_trigger ON nexent.ag_agent_repository_t;
+CREATE TRIGGER update_ag_agent_repository_update_time_trigger
+BEFORE UPDATE ON nexent.ag_agent_repository_t
+FOR EACH ROW
+EXECUTE FUNCTION update_ag_agent_repository_update_time();
+
+COMMENT ON TRIGGER update_ag_agent_repository_update_time_trigger ON nexent.ag_agent_repository_t IS 'Trigger to maintain update_time';
+
+COMMIT;
diff --git a/docker/sql/v2.2.1_0609_add_selected_agent_version_no_to_agent_relation_t.sql b/docker/sql/v2.2.1_0609_add_selected_agent_version_no_to_agent_relation_t.sql
new file mode 100644
index 000000000..9a67c1ab2
--- /dev/null
+++ b/docker/sql/v2.2.1_0609_add_selected_agent_version_no_to_agent_relation_t.sql
@@ -0,0 +1,15 @@
+-- Migration: Add selected_agent_version_no to ag_agent_relation_t
+-- Date: 2026-06-09
+-- Description: Pin child agent version on parent-child relations at publish time.
+
+SET search_path TO nexent;
+
+BEGIN;
+
+ALTER TABLE nexent.ag_agent_relation_t
+    ADD COLUMN IF NOT EXISTS selected_agent_version_no INTEGER;
+
+COMMENT ON COLUMN nexent.ag_agent_relation_t.selected_agent_version_no IS
+    'Pinned version of selected_agent_id. NULL = use child current published version at runtime (legacy/draft).';
+
+COMMIT;
diff --git a/frontend/app/[locale]/agents/components/AgentConfigComp.tsx b/frontend/app/[locale]/agents/components/AgentConfigComp.tsx
index 13484595f..1e750d5eb 100644
--- a/frontend/app/[locale]/agents/components/AgentConfigComp.tsx
+++ b/frontend/app/[locale]/agents/components/AgentConfigComp.tsx
@@ -29,6 +29,8 @@ export default function AgentConfigComp({}: AgentConfigCompProps) {
   const currentAgentId = useAgentConfigStore((state) => state.currentAgentId);
   const isCreatingMode = useAgentConfigStore((state) => state.isCreatingMode);
   const isReadOnly = useAgentConfigStore((state) => state.isReadOnly());
+  const selectedTools = useAgentConfigStore((state) => state.editedAgent.tools);
+  const selectedSkills = useAgentConfigStore((state) => state.editedAgent.skills);
 
   const [isMcpModalOpen, setIsMcpModalOpen] = useState(false);
   const [isSkillModalOpen, setIsSkillModalOpen] = useState(false);
@@ -125,7 +127,12 @@ export default function AgentConfigComp({}: AgentConfigCompProps) {
       <Tabs defaultValue="tools" className="w-full flex-1 min-h-0 flex flex-col overflow-hidden">
         <TabsList className="grid w-full grid-cols-2 flex-shrink-0">
           <TabsTrigger value="tools">
-            {t("toolPool.title")}
+            <span className="inline-flex items-center gap-1">
+              {t("toolPool.title")}
+              {selectedTools.length > 0 && (
+                <Badge count={selectedTools.length} size="small" color="blue" />
+              )}
+            </span>
             <Tooltip
               title={<div style={{ whiteSpace: "pre-line" }}>{t("toolPool.tooltip.functionGuide")}</div>}
               color="#ffffff"
@@ -144,7 +151,14 @@ export default function AgentConfigComp({}: AgentConfigCompProps) {
               <Lightbulb className="mx-2 text-yellow-500" size={16} />
             </Tooltip>
           </TabsTrigger>
-          <TabsTrigger value="skills">{t("skillPool.title")}</TabsTrigger>
+          <TabsTrigger value="skills">
+            <span className="inline-flex items-center gap-1">
+              {t("skillPool.title")}
+              {selectedSkills && selectedSkills.length > 0 && (
+                <Badge count={selectedSkills.length} size="small" color="blue" />
+              )}
+            </span>
+          </TabsTrigger>
         </TabsList>
 
         <TabsContent value="tools" className="mt-4 flex-1 min-h-0 flex flex-col overflow-hidden">
diff --git a/frontend/app/[locale]/agents/components/agentConfig/McpConfigModal.tsx b/frontend/app/[locale]/agents/components/agentConfig/McpConfigModal.tsx
index 277e85d3d..41c8baa45 100644
--- a/frontend/app/[locale]/agents/components/agentConfig/McpConfigModal.tsx
+++ b/frontend/app/[locale]/agents/components/agentConfig/McpConfigModal.tsx
@@ -80,6 +80,7 @@ export default function McpConfigModal({
   const [openApiJson, setOpenApiJson] = useState("");
   const [openApiServiceName, setOpenApiServiceName] = useState("");
   const [openApiServerUrl, setOpenApiServerUrl] = useState("");
+  const [openApiHeadersTemplate, setOpenApiHeadersTemplate] = useState("");
   const [importingOpenApi, setImportingOpenApi] = useState(false);
   const [openapiServices, setOpenapiServices] = useState<any[]>([]);
   const [loadingOpenapiServices, setLoadingOpenapiServices] = useState(false);
@@ -506,6 +507,7 @@ export default function McpConfigModal({
           service_name: openApiServiceName.trim(),
           server_url: openApiServerUrl.trim(),
           openapi_json: parsedJson,
+          headers_template: openApiHeadersTemplate.trim() ? JSON.parse(openApiHeadersTemplate.trim()) : null,
         }),
       });
 
@@ -514,6 +516,7 @@ export default function McpConfigModal({
         setOpenApiJson("");
         setOpenApiServiceName("");
         setOpenApiServerUrl("");
+        setOpenApiHeadersTemplate("");
         await loadOpenapiServices();
         await refreshToolsAndAgents();
       } else {
@@ -1220,15 +1223,20 @@ export default function McpConfigModal({
                           style={{ flex: 3 }}
                         />
                       </div>
-                      <div>
-                        <Input.TextArea
-                          placeholder={t("mcpConfig.openApiToMcp.jsonPlaceholder")}
-                          value={openApiJson}
-                          onChange={(e) => setOpenApiJson(e.target.value)}
-                          rows={6}
-                          disabled={actionsLocked || importingOpenApi}
-                        />
-                      </div>
+                      <Input.TextArea
+                        placeholder={t("mcpConfig.addServer.customHeadersPlaceholder")}
+                        value={openApiHeadersTemplate}
+                        onChange={(e) => setOpenApiHeadersTemplate(e.target.value)}
+                        rows={2}
+                        disabled={actionsLocked || importingOpenApi}
+                      />
+                      <Input.TextArea
+                        placeholder={t("mcpConfig.openApiToMcp.jsonPlaceholder")}
+                        value={openApiJson}
+                        onChange={(e) => setOpenApiJson(e.target.value)}
+                        rows={6}
+                        disabled={actionsLocked || importingOpenApi}
+                      />
                       <div
                         style={{
                           display: "flex",
diff --git a/frontend/app/[locale]/agents/components/agentConfig/SkillBuildModal.tsx b/frontend/app/[locale]/agents/components/agentConfig/SkillBuildModal.tsx
index 7f969edb9..8f040d4b3 100644
--- a/frontend/app/[locale]/agents/components/agentConfig/SkillBuildModal.tsx
+++ b/frontend/app/[locale]/agents/components/agentConfig/SkillBuildModal.tsx
@@ -56,7 +56,7 @@ import {
   SkillFilesAccessDeniedError,
   type SkillFileNode,
 } from "@/services/agentConfigService";
-import { MarkdownRenderer } from "@/components/ui/markdownRenderer";
+import { MarkdownRenderer } from "@/components/common/markdownRenderer";
 import log from "@/lib/logger";
 
 const { TextArea } = Input;
diff --git a/frontend/app/[locale]/agents/components/agentConfig/SkillDetailModal.tsx b/frontend/app/[locale]/agents/components/agentConfig/SkillDetailModal.tsx
index 4161a3b1a..05f11d6a3 100644
--- a/frontend/app/[locale]/agents/components/agentConfig/SkillDetailModal.tsx
+++ b/frontend/app/[locale]/agents/components/agentConfig/SkillDetailModal.tsx
@@ -10,7 +10,7 @@ import {
   fetchSkillFileContent,
   SkillFilesAccessDeniedError,
 } from "@/services/agentConfigService";
-import { MarkdownRenderer } from "@/components/ui/markdownRenderer";
+import { MarkdownRenderer } from "@/components/common/markdownRenderer";
 import {
   buildTreeData,
   collectDirKeys,
diff --git a/frontend/app/[locale]/agents/components/agentConfig/SkillManagement.tsx b/frontend/app/[locale]/agents/components/agentConfig/SkillManagement.tsx
index dc5e22d87..f8a733ae0 100644
--- a/frontend/app/[locale]/agents/components/agentConfig/SkillManagement.tsx
+++ b/frontend/app/[locale]/agents/components/agentConfig/SkillManagement.tsx
@@ -3,7 +3,7 @@
 import { useState, useEffect } from "react";
 import { useTranslation } from "react-i18next";
 import { SkillGroup, Skill, SkillParam } from "@/types/agentConfig";
-import { Tabs, message, Tooltip } from "antd";
+import { Tabs, message, Tooltip, Badge } from "antd";
 import { useAgentConfigStore } from "@/stores/agentConfigStore";
 import { useSkillList } from "@/hooks/agent/useSkillList";
 import { Info, Trash2, Settings } from "lucide-react";
@@ -207,21 +207,27 @@ export default function SkillManagement({
   };
 
   const tabItems = skillGroups.map((group) => {
+    const selectedCount = group.skills.filter(s => originalSelectedSkillIdsSet.has(s.skill_id)).length;
+
     return {
       key: group.key,
       label: (
         <Tooltip title={group.label} placement="right">
-          <span
-            style={{
-              display: "block",
-              maxWidth: "100px",
-              overflow: "hidden",
-              textOverflow: "ellipsis",
-              whiteSpace: "nowrap",
-              textAlign: "left",
-            }}
-          >
-            {group.label}
+          <span className="inline-flex items-center gap-1">
+            <span
+              style={{
+                maxWidth: "100px",
+                overflow: "hidden",
+                textOverflow: "ellipsis",
+                whiteSpace: "nowrap",
+                textAlign: "left",
+              }}
+            >
+              {group.label}
+            </span>
+            {selectedCount > 0 && (
+              <Badge count={selectedCount} size="small" color="blue" />
+            )}
           </span>
         </Tooltip>
       ),
diff --git a/frontend/app/[locale]/agents/components/agentConfig/ToolManagement.tsx b/frontend/app/[locale]/agents/components/agentConfig/ToolManagement.tsx
index 0cb73de62..62edc3ac8 100644
--- a/frontend/app/[locale]/agents/components/agentConfig/ToolManagement.tsx
+++ b/frontend/app/[locale]/agents/components/agentConfig/ToolManagement.tsx
@@ -4,7 +4,7 @@ import { useState, useEffect, useCallback } from "react";
 import { useTranslation } from "react-i18next";
 import ToolConfigModal from "./tool/ToolConfigModal";
 import { ToolGroup, Tool, ToolParam } from "@/types/agentConfig";
-import { Tabs, Collapse, message, Tooltip } from "antd";
+import { Tabs, Collapse, message, Tooltip, Badge } from "antd";
 import { useAgentConfigStore } from "@/stores/agentConfigStore";
 import { useToolList } from "@/hooks/agent/useToolList";
 import { usePrefetchKnowledgeBases } from "@/hooks/useKnowledgeBaseSelector";
@@ -307,21 +307,29 @@ export default function ToolManagement({
   // Generate Tabs configuration
   const tabItems = toolGroups.map((group) => {
     const label = t(group.label);
+    const selectedCount = group.subGroups
+      ? group.subGroups.reduce(
+          (sum, sg) => sum + sg.tools.filter(t => originalSelectedToolIdsSet.has(t.id)).length, 0)
+      : group.tools.filter(t => originalSelectedToolIdsSet.has(t.id)).length;
 
     return {
       key: group.key,
       label: (
         <Tooltip title={label} placement="right">
-          <span
-            style={{
-              display: "block",
-              maxWidth: "100px",
-              overflow: "hidden",
-              textOverflow: "ellipsis",
-              whiteSpace: "nowrap",
-            }}
-          >
-            {label}
+          <span className="inline-flex items-center gap-1">
+            <span
+              style={{
+                maxWidth: "100px",
+                overflow: "hidden",
+                textOverflow: "ellipsis",
+                whiteSpace: "nowrap",
+              }}
+            >
+              {label}
+            </span>
+            {selectedCount > 0 && (
+              <Badge count={selectedCount} size="small" color="blue" />
+            )}
           </span>
         </Tooltip>
       ),
@@ -351,17 +359,25 @@ export default function ToolManagement({
                   items={group.subGroups.map((subGroup, index) => ({
                     key: subGroup.key,
                     label: (
-                      <span
-                        className="text-gray-700 font-medium"
-                        style={{
-                          paddingTop: "8px",
-                          paddingBottom: "8px",
-                          display: "block",
-                          minHeight: "36px",
-                          lineHeight: "20px",
-                        }}
-                      >
-                        {subGroup.label}
+                      <span className="inline-flex items-center gap-1">
+                        <span
+                          className="text-gray-700 font-medium"
+                          style={{
+                            paddingTop: "8px",
+                            paddingBottom: "8px",
+                            minHeight: "36px",
+                            lineHeight: "20px",
+                          }}
+                        >
+                          {subGroup.label}
+                        </span>
+                        {subGroup.tools.filter(t => originalSelectedToolIdsSet.has(t.id)).length > 0 && (
+                          <Badge
+                            count={subGroup.tools.filter(t => originalSelectedToolIdsSet.has(t.id)).length}
+                            size="small"
+                            color="blue"
+                          />
+                        )}
                       </span>
                     ),
                     className: `tool-category-panel ${
diff --git a/frontend/app/[locale]/agents/components/agentConfig/skill/SkillConfigModal.tsx b/frontend/app/[locale]/agents/components/agentConfig/skill/SkillConfigModal.tsx
index 6f372e2b4..9729007e2 100644
--- a/frontend/app/[locale]/agents/components/agentConfig/skill/SkillConfigModal.tsx
+++ b/frontend/app/[locale]/agents/components/agentConfig/skill/SkillConfigModal.tsx
@@ -12,13 +12,13 @@ import {
   message,
   Tag,
   Skeleton,
+  Tooltip
 } from "antd";
 import { Settings } from "lucide-react";
 import { CloseOutlined } from "@ant-design/icons";
 
 import { Skill, SkillParam } from "@/types/agentConfig";
 import { KnowledgeBase } from "@/types/knowledgeBase";
-import { Tooltip } from "@/components/ui/tooltip";
 import { saveSkillInstance } from "@/services/agentConfigService";
 import KnowledgeBaseSelectorModal from "@/components/tool-config/KnowledgeBaseSelectorModal";
 import {
diff --git a/frontend/app/[locale]/agents/components/agentInfo/AgentGenerateDetail.tsx b/frontend/app/[locale]/agents/components/agentInfo/AgentGenerateDetail.tsx
index 8b6cd82d7..cd46d2aa3 100644
--- a/frontend/app/[locale]/agents/components/agentInfo/AgentGenerateDetail.tsx
+++ b/frontend/app/[locale]/agents/components/agentInfo/AgentGenerateDetail.tsx
@@ -1,6 +1,6 @@
 "use client";
 
-import { useState, useEffect, useMemo, useRef, useCallback } from "react";
+import { useState, useEffect, useMemo, useRef } from "react";
 import { useTranslation } from "react-i18next";
 import {
   Button,
@@ -17,9 +17,11 @@ import {
 } from "antd";
 import { Tabs, TabsList, TabsTrigger, TabsContent } from "@/components/ui/tabs";
 import { Zap, Maximize2, Settings2, Sparkles } from "lucide-react";
+import { Textarea } from "@/components/ui/textarea";
 
 import {
   AgentConfigUpdate,
+  DEFAULT_AGENT_VERIFICATION_CONFIG,
   PromptTemplate,
 } from "@/types/agentConfig";
 import {
@@ -169,6 +171,7 @@ export default function AgentGenerateDetail({}) {
       constraintPrompt: editedAgent.constraint_prompt || "",
       fewShotsPrompt: editedAgent.few_shots_prompt || "",
       provideRunSummary: editedAgent.provide_run_summary || false,
+      verificationEnabled: editedAgent.verification_config?.enabled ?? false,
       businessDescription: editedAgent.business_description || "",
       businessLogicModelName:editedAgent.business_logic_model_name,
       businessLogicModelId: editedAgent.business_logic_model_id,
@@ -233,6 +236,7 @@ export default function AgentGenerateDetail({}) {
     setOptimizeModalOpen(true);
   };
 
+
   const renderExpandButton = (type: "duty" | "constraint" | "few-shots") => {
     return (
       <Button
@@ -391,6 +395,7 @@ export default function AgentGenerateDetail({}) {
     setOptimizeModalType(null);
   };
 
+
   const handleSaveExpandModal = (content: string) => {
     switch (expandModalType) {
       case 'duty':
@@ -446,27 +451,35 @@ export default function AgentGenerateDetail({}) {
     }
   };
 
-  const getStoreFieldKey = (type: 'duty' | 'constraint' | 'few-shots') => {
-    switch (type) {
-      case "duty":
-        return "duty_prompt";
-      case "constraint":
-        return "constraint_prompt";
-      case "few-shots":
-        return "few_shots_prompt";
-    }
-  };
+  const handleReplaceOptimizedContent = (
+    content: string,
+    sectionType: "duty" | "constraint" | "few_shots"
+  ) => {
+    const value = content.trim();
 
-  const handleReplaceOptimizedContent = (content: string) => {
-    if (!optimizeModalType) {
+    if (!value) {
+      handleCloseOptimizeModal();
       return;
     }
 
-    const formFieldKey = getPromptFieldKey(optimizeModalType);
-    const storeFieldKey = getStoreFieldKey(optimizeModalType);
+    const fieldMap = {
+      duty: {
+        formField: "dutyPrompt" as const,
+        storeField: "duty_prompt" as const,
+      },
+      constraint: {
+        formField: "constraintPrompt" as const,
+        storeField: "constraint_prompt" as const,
+      },
+      few_shots: {
+        formField: "fewShotsPrompt" as const,
+        storeField: "few_shots_prompt" as const,
+      },
+    };
 
-    form.setFieldsValue({ [formFieldKey]: content });
-    updateAgentConfig({ [storeFieldKey]: content } as AgentConfigUpdate);
+    const { formField, storeField } = fieldMap[sectionType];
+    form.setFieldsValue({ [formField]: value });
+    updateAgentConfig({ [storeField]: value } as AgentConfigUpdate);
     handleCloseOptimizeModal();
   };
 
@@ -682,11 +695,12 @@ export default function AgentGenerateDetail({}) {
             }}
             className="agent-config-tabs flex flex-col h-full w-full"
           >
-            <TabsList className="grid w-full grid-cols-4 flex-shrink-0">
+            <TabsList className="grid w-full grid-cols-5 flex-shrink-0">
               <TabsTrigger value="agent-info">{t("agent.info.title")}</TabsTrigger>
               <TabsTrigger value="duty">{t("systemPrompt.card.duty.title")}</TabsTrigger>
               <TabsTrigger value="constraint">{t("systemPrompt.card.constraint.title")}</TabsTrigger>
               <TabsTrigger value="few-shots">{t("systemPrompt.card.fewShots.title")}</TabsTrigger>
+              <TabsTrigger value="greeting">{t("agent.greeting.tabTitle")}</TabsTrigger>
             </TabsList>
 
             <TabsContent value="agent-info" className="flex-1 min-h-0 overflow-y-auto">
@@ -861,7 +875,7 @@ export default function AgentGenerateDetail({}) {
                       </Row>
 
                       <Row gutter={16}>
-                        <Col span={12}>
+                        <Col span={8}>
                           <Form.Item
                             name="mainAgentMaxStep"
                             label={t("businessLogic.config.maxSteps")}
@@ -889,7 +903,7 @@ export default function AgentGenerateDetail({}) {
                             />
                           </Form.Item>
                         </Col>
-                        <Col span={12}>
+                        <Col span={8}>
                           <Form.Item
                             name="provideRunSummary"
                             label={t("agent.provideRunSummary")}
@@ -911,6 +925,33 @@ export default function AgentGenerateDetail({}) {
                             />
                           </Form.Item>
                         </Col>
+                        <Col span={8}>
+                          <Form.Item
+                            name="verificationEnabled"
+                            label={t("agent.verification")}
+                            rules={[
+                              {
+                                required: true,
+                                message: t("agent.verification.error"),
+                              },
+                            ]}
+                          >
+                            <Select
+                              options={[
+                                { value: true, label: t("common.yes") },
+                                { value: false, label: t("common.no") },
+                              ]}
+                              onChange={(value) => {
+                                updateAgentConfig({
+                                  verification_config: {
+                                    ...(editedAgent.verification_config || DEFAULT_AGENT_VERIFICATION_CONFIG),
+                                    enabled: value,
+                                  },
+                                });
+                              }}
+                            />
+                          </Form.Item>
+                        </Col>
                       </Row>
 
                       <Form.Item
@@ -959,6 +1000,70 @@ export default function AgentGenerateDetail({}) {
                 (value) => updateAgentConfig({ few_shots_prompt: value })
               )}
             </TabsContent>
+
+            <TabsContent value="greeting" className="flex-1 min-h-0 overflow-y-auto">
+              <div className="overflow-y-auto overflow-x-hidden h-full px-3 pb-3">
+                <div className="mb-4">
+                  <div className="flex items-center mb-2">
+                    <h4 className="text-md font-medium text-gray-700">{t("agent.greeting.messageTitle")}</h4>
+                  </div>
+                  <Textarea
+                    value={editedAgent.greeting_message || ""}
+                    onChange={(e) => updateAgentConfig({ greeting_message: e.target.value })}
+                    disabled={!editable || isGenerating}
+                    placeholder={t("agent.greeting.messagePlaceholder")}
+                    className="w-full min-h-[80px]"
+                  />
+                </div>
+
+                <div className="mb-4">
+                  <div className="flex items-center mb-2">
+                    <h4 className="text-md font-medium text-gray-700">{t("agent.greeting.questionsTitle")}</h4>
+                  </div>
+                  {(editedAgent.example_questions || []).length > 0 && (
+                    <div className="space-y-2">
+                      {(editedAgent.example_questions || []).map((q: string, idx: number) => (
+                        <div key={idx} className="flex items-center gap-2">
+                          <Input
+                            value={q}
+                            onChange={(e) => {
+                              const newQuestions = [...(editedAgent.example_questions || [])];
+                              newQuestions[idx] = e.target.value;
+                              updateAgentConfig({ example_questions: newQuestions });
+                            }}
+                            disabled={!editable || isGenerating}
+                            className="flex-1"
+                          />
+                          <Button
+                            size="small"
+                            disabled={!editable || isGenerating}
+                            onClick={() => {
+                              const newQuestions = (editedAgent.example_questions || []).filter((_: string, i: number) => i !== idx);
+                              updateAgentConfig({ example_questions: newQuestions });
+                            }}
+                          >
+                            {t("agent.greeting.removeQuestion")}
+                          </Button>
+                        </div>
+                      ))}
+                    </div>
+                  )}
+                  {(editedAgent.example_questions || []).length < 6 && editable && !isGenerating && (
+                    <Button
+                      size="small"
+                      type="dashed"
+                      onClick={() => {
+                        const newQuestions = [...(editedAgent.example_questions || []), ""];
+                        updateAgentConfig({ example_questions: newQuestions });
+                      }}
+                      className="mt-2"
+                    >
+                      {t("agent.greeting.addQuestion")}
+                    </Button>
+                  )}
+                </div>
+              </div>
+            </TabsContent>
           </Tabs>
         </Col>
       </Row>
diff --git a/frontend/app/[locale]/agents/components/agentInfo/DebugConfig.tsx b/frontend/app/[locale]/agents/components/agentInfo/DebugConfig.tsx
index 4e284f879..511c74218 100644
--- a/frontend/app/[locale]/agents/components/agentInfo/DebugConfig.tsx
+++ b/frontend/app/[locale]/agents/components/agentInfo/DebugConfig.tsx
@@ -18,6 +18,7 @@ import {
 import { useModelList } from "@/hooks/model/useModelList";
 import { useAgentConfigStore } from "@/stores/agentConfigStore";
 import DebugMessageList from "./DebugMessageList";
+import DebugOptimizeModal from "./DebugOptimizeModal";
 import { useCompareStream } from "./useCompareStream";
 
 // Agent debugging component Props interface
@@ -30,6 +31,11 @@ interface AgentDebuggingProps {
   isStreaming: boolean;
   isCompareStreaming?: boolean;
   messages: ChatMessageType[];
+  onOptimizeReply?: (params: {
+    userQuestion: string;
+    assistantAnswer: string;
+    history: Array<{ role: string; content: string }>;
+  }) => void;
   comparePanel?: React.ReactNode;
   showCompare?: boolean;
   onOpenCompare?: () => void;
@@ -55,6 +61,7 @@ function AgentDebugging({
   isStreaming,
   isCompareStreaming = false,
   messages,
+  onOptimizeReply,
   comparePanel,
   showCompare,
   onOpenCompare,
@@ -74,7 +81,11 @@ function AgentDebugging({
         ) : (
           <div className="flex flex-col gap-4 flex-1 min-h-0 overflow-hidden">
             {/* Message display area */}
-            <DebugMessageList messages={messages} isStreaming={isStreaming} />
+            <DebugMessageList
+              messages={messages}
+              isStreaming={isStreaming}
+              onOptimizeReply={onOptimizeReply}
+            />
           </div>
         )}
 
@@ -152,6 +163,16 @@ export default function DebugConfig({ agentId }: DebugConfigProps) {
   const prevAgentIdRef = useRef<number | null | undefined>(undefined);
   // Maintain an independent step ID counter per Agent
   const stepIdCounter = useRef<{ current: number }>({ current: 0 });
+
+  const [debugOptimizeOpen, setDebugOptimizeOpen] = useState(false);
+  const [debugOptimizeSelected, setDebugOptimizeSelected] = useState<null | {
+    userQuestion: string;
+    assistantAnswer: string;
+    history: Array<{ role: string; content: string }>;
+  }>(null);
+  const [compareOriginalPrompt, setCompareOriginalPrompt] = useState("");
+  const [compareOptimizedPrompt, setCompareOptimizedPrompt] = useState("");
+
   const [isComparePanelOpen, setIsComparePanelOpen] = useState(false);
   const [compareLeftModelId, setCompareLeftModelId] = useState<number | null>(null);
   const [compareRightModelId, setCompareRightModelId] = useState<number | null>(null);
@@ -602,8 +623,113 @@ export default function DebugConfig({ agentId }: DebugConfigProps) {
     }
   };
 
+  const handleOpenOptimize = (params: {
+    userQuestion: string;
+    assistantAnswer: string;
+    history: Array<{ role: string; content: string }>;
+  }) => {
+    if (!parsedAgentId) return;
+    if (!editedAgent?.model_id) return;
+
+    const duty = (editedAgent?.duty_prompt || "").trim();
+    const constraint = (editedAgent?.constraint_prompt || "").trim();
+    const fewShots = (editedAgent?.few_shots_prompt || "").trim();
+
+    const originalFullPrompt = [
+      "# 智能体角色",
+      duty,
+      "",
+      "# 使用要求",
+      constraint,
+      "",
+      "# 示例",
+      fewShots,
+    ]
+      .filter((part) => part !== undefined)
+      .join("\n")
+      .trim();
+
+    setCompareOriginalPrompt(originalFullPrompt);
+    setCompareOptimizedPrompt("");
+
+    setDebugOptimizeSelected(params);
+    setDebugOptimizeOpen(true);
+  };
+
+  const handleOptimized = (params: {
+    originalFullPrompt: string;
+    optimizedFullPrompt: string;
+  }) => {
+    setCompareOriginalPrompt(params.originalFullPrompt || "");
+    setCompareOptimizedPrompt(params.optimizedFullPrompt || "");
+  };
+
+  const handleApplyOptimizedPrompt = (optimizedFullPrompt?: string) => {
+    const optimized = (optimizedFullPrompt || compareOptimizedPrompt || "").trim();
+    if (!optimized) {
+      return;
+    }
+
+    const normalized = optimized
+      .replace(/\r\n/g, "\n")
+      .replace(/^#\s*智能体角色\s*$/gm, "# Duty")
+      .replace(/^#\s*使用要求\s*$/gm, "# Constraint")
+      .replace(/^#\s*示例\s*$/gm, "# FewShots");
+
+    const pickSection = (header: "Duty" | "Constraint" | "FewShots"): string => {
+      const headerRegex = new RegExp(`^#\\s*${header}\\s*$`, "gm");
+      const matches = [...normalized.matchAll(headerRegex)];
+      const current = matches[0];
+      if (!current) return "";
+
+      const start = current.index + current[0].length;
+      const rest = normalized.slice(start);
+      const nextHeaderMatch = rest.match(/^#\s*(Duty|Constraint|FewShots)\s*$/m);
+      const end = nextHeaderMatch?.index ?? rest.length;
+      return rest.slice(0, end).trim();
+    };
+
+    const duty = pickSection("Duty");
+    const constraint = pickSection("Constraint");
+    const fewShots = pickSection("FewShots");
+
+    const updateAgentConfig = useAgentConfigStore.getState().updateAgentConfig;
+
+    updateAgentConfig({
+      ...(duty ? { duty_prompt: duty } : {}),
+      ...(constraint ? { constraint_prompt: constraint } : {}),
+      ...(fewShots ? { few_shots_prompt: fewShots } : {}),
+    });
+    // Close optimize modal after applying.
+    setDebugOptimizeOpen(false);
+    setDebugOptimizeSelected(null);
+    setCompareOriginalPrompt("");
+    setCompareOptimizedPrompt("");
+  };
+
   return (
     <div className="w-full h-full bg-white">
+      <DebugOptimizeModal
+        open={debugOptimizeOpen}
+        agentId={parsedAgentId ?? 0}
+        modelId={editedAgent?.model_id ?? 0}
+        userQuestion={debugOptimizeSelected?.userQuestion || ""}
+        assistantAnswer={debugOptimizeSelected?.assistantAnswer || ""}
+        history={debugOptimizeSelected?.history || []}
+        initialOriginalFullPrompt={compareOriginalPrompt || ""}
+        onCancel={() => {
+          setDebugOptimizeOpen(false);
+          setDebugOptimizeSelected(null);
+          setCompareOriginalPrompt("");
+          setCompareOptimizedPrompt("");
+        }}
+        onOptimized={handleOptimized}
+        onApply={(optimizedFullPrompt) => {
+          setCompareOptimizedPrompt(optimizedFullPrompt || "");
+          handleApplyOptimizedPrompt(optimizedFullPrompt);
+        }}
+      />
+
       <AgentDebugging
         key={agentId} // Re-render when agentId changes to ensure state resets
         onStop={handleStop}
@@ -614,6 +740,7 @@ export default function DebugConfig({ agentId }: DebugConfigProps) {
         isStreaming={isStreaming}
         isCompareStreaming={isCompareStreaming}
         messages={messages}
+        onOptimizeReply={handleOpenOptimize}
         comparePanel={comparePanel}
         showCompare={hasMultipleLlmModels}
         onOpenCompare={toggleComparePanel}
diff --git a/frontend/app/[locale]/agents/components/agentInfo/DebugMessageList.tsx b/frontend/app/[locale]/agents/components/agentInfo/DebugMessageList.tsx
index 7eb25c220..4b299d52b 100644
--- a/frontend/app/[locale]/agents/components/agentInfo/DebugMessageList.tsx
+++ b/frontend/app/[locale]/agents/components/agentInfo/DebugMessageList.tsx
@@ -5,17 +5,25 @@ import { TaskWindow } from "@/app/chat/streaming/taskWindow";
 import { transformMessagesToTaskMessages } from "@/app/chat/streaming/messageTransformer";
 import { MESSAGE_ROLES } from "@/const/chatConfig";
 import { ChatMessageType, TaskMessageType } from "@/types/chat";
+import { Button, Tooltip } from "antd";
+import { Sparkles } from "lucide-react";
 
 interface DebugMessageListProps {
   messages: ChatMessageType[];
   isStreaming: boolean;
   emptyPlaceholder?: string;
+  onOptimizeReply?: (params: {
+    userQuestion: string;
+    assistantAnswer: string;
+    history: Array<{ role: string; content: string }>;
+  }) => void;
 }
 
 export default function DebugMessageList({
   messages,
   isStreaming,
   emptyPlaceholder,
+  onOptimizeReply,
 }: DebugMessageListProps) {
   const processMessageSteps = (message: ChatMessageType): TaskMessageType[] => {
     if (!message.steps || message.steps.length === 0) return [];
@@ -35,6 +43,40 @@ export default function DebugMessageList({
     );
   }
 
+  const buildHistory = () =>
+    messages
+      .filter((msg) => msg.isComplete !== false && msg.content?.trim())
+      .map((msg) => ({
+        role: msg.role,
+        content:
+          msg.role === MESSAGE_ROLES.ASSISTANT
+            ? msg.finalAnswer?.trim() || msg.content || ""
+            : msg.content || "",
+      }));
+
+  const onOptimizeClick = (assistantIndex: number) => {
+    if (!onOptimizeReply) return;
+
+    const assistantMsg = messages[assistantIndex];
+    if (!assistantMsg) return;
+
+    const assistantAnswer = assistantMsg.finalAnswer?.trim() || assistantMsg.content || "";
+    if (!assistantAnswer.trim()) return;
+
+    const userMsg = [...messages]
+      .slice(0, assistantIndex)
+      .reverse()
+      .find((m) => m.role === MESSAGE_ROLES.USER);
+
+    const userQuestion = userMsg?.content || "";
+
+    onOptimizeReply({
+      userQuestion,
+      assistantAnswer,
+      history: buildHistory(),
+    });
+  };
+
   return (
     <div className="flex flex-col gap-3 h-full overflow-y-auto custom-scrollbar">
       {messages.map((message, index) => {
@@ -43,6 +85,18 @@ export default function DebugMessageList({
             ? processMessageSteps(message)
             : [];
 
+        const isLastStreamingAssistant =
+          isStreaming &&
+          index === messages.length - 1 &&
+          message.role === MESSAGE_ROLES.ASSISTANT;
+
+        const canOptimize =
+          Boolean(onOptimizeReply) &&
+          message.role === MESSAGE_ROLES.ASSISTANT &&
+          message.isComplete !== false &&
+          !isLastStreamingAssistant &&
+          Boolean((message.finalAnswer || message.content || "").trim());
+
         return (
           <div key={message.id || index} className="flex flex-col gap-2">
             {message.role === MESSAGE_ROLES.USER && (
@@ -69,16 +123,39 @@ export default function DebugMessageList({
               )}
 
             {message.role === MESSAGE_ROLES.ASSISTANT && (
-              <ChatStreamFinalMessage
-                message={message}
-                onSelectMessage={() => {}}
-                isSelected={false}
-                searchResultsCount={message.searchResults?.length || 0}
-                imagesCount={message.images?.length || 0}
-                onImageClick={() => {}}
-                onOpinionChange={() => {}}
-                hideButtons={true}
-              />
+              <div className="relative">
+                <ChatStreamFinalMessage
+                  message={message}
+                  onSelectMessage={() => {}}
+                  isSelected={false}
+                  searchResultsCount={message.searchResults?.length || 0}
+                  imagesCount={message.images?.length || 0}
+                  onImageClick={() => {}}
+                  onOpinionChange={() => {}}
+                  hideButtons={true}
+                />
+
+                {canOptimize && (
+                  <div className="mt-1 flex justify-start">
+                    <Tooltip title="优化" placement="top">
+                      <Button
+                        type="text"
+                        size="small"
+                        onClick={() => onOptimizeClick(index)}
+                        icon={<Sparkles size={14} />}
+                        className="prompt-toolbar-button"
+                        style={{
+                          color: "#475569",
+                          width: 24,
+                          minWidth: 24,
+                          height: 24,
+                          borderRadius: 9999,
+                        }}
+                      />
+                    </Tooltip>
+                  </div>
+                )}
+              </div>
             )}
           </div>
         );
diff --git a/frontend/app/[locale]/agents/components/agentInfo/DebugOptimizeModal.tsx b/frontend/app/[locale]/agents/components/agentInfo/DebugOptimizeModal.tsx
new file mode 100644
index 000000000..f9b1f4eca
--- /dev/null
+++ b/frontend/app/[locale]/agents/components/agentInfo/DebugOptimizeModal.tsx
@@ -0,0 +1,230 @@
+"use client";
+
+import { useEffect, useState } from "react";
+import { useTranslation } from "react-i18next";
+import { App, Button, Input, Modal, Space, Spin, Typography } from "antd";
+
+const { TextArea } = Input;
+const { Paragraph, Text } = Typography;
+
+export interface DebugOptimizeModalProps {
+  open: boolean;
+  agentId: number;
+  modelId: number;
+  userQuestion: string;
+  assistantAnswer: string;
+  history: Array<{ role: string; content: string }>;
+  initialOriginalFullPrompt?: string;
+  onCancel: () => void;
+  onOptimized: (params: { originalFullPrompt: string; optimizedFullPrompt: string }) => void;
+  onApply: (optimizedFullPrompt: string) => void;
+  applying?: boolean;
+}
+
+export default function DebugOptimizeModal({
+  open,
+  agentId,
+  modelId,
+  userQuestion,
+  assistantAnswer,
+  history,
+  initialOriginalFullPrompt,
+  onCancel,
+  onOptimized,
+  onApply,
+  applying,
+}: DebugOptimizeModalProps) {
+  const { t } = useTranslation("common");
+  const { message } = App.useApp();
+
+  const [feedback, setFeedback] = useState("");
+  const [isOptimizing, setIsOptimizing] = useState(false);
+
+  const [originalFullPrompt, setOriginalFullPrompt] = useState("");
+  const [optimizedFullPrompt, setOptimizedFullPrompt] = useState("");
+  const [displayedContent, setDisplayedContent] = useState("");
+
+  // Section header mapping: English -> Chinese
+  const headerMap: Record<string, string> = {
+    "# Duty": "#智能体角色",
+    "# Constraint": "#使用要求",
+    "# FewShots": "#示例",
+  };
+
+  const mapHeadersToChinese = (text: string) => {
+    let result = text;
+    for (const [en, zh] of Object.entries(headerMap)) {
+      result = result.split(en).join(zh);
+    }
+    return result;
+  };
+
+  useEffect(() => {
+    if (!open) {
+      setFeedback("");
+      setIsOptimizing(false);
+      setOriginalFullPrompt("");
+      setOptimizedFullPrompt("");
+      setDisplayedContent("");
+      return;
+    }
+
+    setFeedback("");
+    setIsOptimizing(false);
+    setDisplayedContent("");
+    // Show original prompt immediately when opening the modal.
+    setOriginalFullPrompt((prev) => prev || initialOriginalFullPrompt || "");
+    // Keep original prompt visible while waiting for new optimized result.
+    setOptimizedFullPrompt("");
+  }, [open, agentId, modelId]);
+
+  const handleOk = async () => {
+    if (!feedback.trim()) {
+      message.error(t("systemPrompt.optimize.feedbackRequired"));
+      return;
+    }
+
+    setIsOptimizing(true);
+    try {
+      const resp = await fetch("/api/prompt/optimize/from_debug", {
+        method: "POST",
+        headers: { "Content-Type": "application/json" },
+        body: JSON.stringify({
+          agent_id: agentId,
+          model_id: modelId,
+          feedback: feedback.trim(),
+          selected: {
+            user_question: userQuestion,
+            assistant_answer: assistantAnswer,
+          },
+          history,
+        }),
+      });
+
+      const result = await resp.json();
+      if (!resp.ok) {
+        throw new Error(result?.message || t("systemPrompt.optimize.error"));
+      }
+
+      const data = result?.data;
+      const original = data?.original_full_prompt || "";
+      const fullText = mapHeadersToChinese(data?.optimized_full_prompt || "");
+
+      setOriginalFullPrompt(original);
+      setOptimizedFullPrompt(fullText);
+      setDisplayedContent(fullText);
+
+      // Ensure modal stays open and does not reset prompts.
+      setIsOptimizing(false);
+
+      onOptimized({
+        originalFullPrompt: original,
+        optimizedFullPrompt: fullText,
+      });
+    } catch (e: any) {
+      message.error(e?.message || t("systemPrompt.optimize.error"));
+    } finally {
+      setIsOptimizing(false);
+    }
+  };
+
+  return (
+    <Modal
+      title={t("agent.debug.optimizeTitle", "Optimize prompt")}
+      open={open}
+      onCancel={onCancel}
+      width={1200}
+      footer={
+        <Space>
+          <Button onClick={onCancel}>{t("common.cancel")}</Button>
+          <Button
+            type="primary"
+            onClick={() => onApply(optimizedFullPrompt)}
+            disabled={!optimizedFullPrompt.trim()}
+            loading={applying}
+          >
+            {t("agent.debug.promptCompare.apply", "Apply")}
+          </Button>
+          <Button type="primary" onClick={handleOk}>
+            {t("systemPrompt.optimize.submit")}
+          </Button>
+        </Space>
+      }
+      destroyOnHidden
+    >
+      <div className="flex flex-col gap-3">
+        <Text type="secondary">
+          {t(
+            "agent.debug.optimizeHint",
+            "Select a reply, provide feedback, and we will optimize the full system prompt."
+          )}
+        </Text>
+
+        <div>
+          <Text strong>{t("systemPrompt.optimize.feedbackLabel")}</Text>
+          <TextArea
+            value={feedback}
+            onChange={(e) => setFeedback(e.target.value)}
+            placeholder={t("systemPrompt.optimize.feedbackPlaceholder")}
+            rows={4}
+            className="mt-2"
+            disabled={isOptimizing}
+          />
+        </div>
+
+        <div className="grid grid-cols-1 gap-3 md:grid-cols-2">
+          <div>
+            <Text strong>{t("agent.debug.selectedQuestion", "Selected question")}</Text>
+            <div className="mt-2 border border-gray-200 rounded-md p-3 bg-gray-50">
+              <Paragraph style={{ whiteSpace: "pre-wrap", marginBottom: 0 }} className="text-sm">
+                {userQuestion || t("common.none")}
+              </Paragraph>
+            </div>
+          </div>
+          <div>
+            <Text strong>{t("agent.debug.selectedAnswer", "Selected answer")}</Text>
+            <div className="mt-2 border border-gray-200 rounded-md p-3 bg-gray-50">
+              <Paragraph style={{ whiteSpace: "pre-wrap", marginBottom: 0 }} className="text-sm">
+                {assistantAnswer || t("common.none")}
+              </Paragraph>
+            </div>
+          </div>
+        </div>
+
+        <div className="grid grid-cols-1 gap-4 lg:grid-cols-2">
+          <div>
+            <Text strong>{t("agent.debug.promptCompare.original", "Original")}</Text>
+            <div className="mt-2 border border-gray-200 rounded-md p-3 bg-gray-50">
+              <Paragraph
+                style={{ whiteSpace: "pre-wrap", minHeight: 520, marginBottom: 0 }}
+                className="font-mono text-sm"
+              >
+                {mapHeadersToChinese(originalFullPrompt) || "-"}
+              </Paragraph>
+            </div>
+          </div>
+          <div>
+            <Text strong>{t("agent.debug.promptCompare.optimized", "Optimized")}</Text>
+            <div className="mt-2 border border-gray-200 rounded-md p-3">
+              {isOptimizing ? (
+                <div className="flex flex-col items-center justify-center gap-3" style={{ minHeight: 520 }}>
+                  <Spin size="medium" />
+                  <span className="text-gray-500 text-sm">
+                    {t("systemPrompt.optimize.generating")}
+                  </span>
+                </div>
+              ) : (
+                <Paragraph
+                  style={{ whiteSpace: "pre-wrap", minHeight: 520, marginBottom: 0 }}
+                  className="font-mono text-sm"
+                >
+                  {displayedContent || t("systemPrompt.optimize.empty")}
+                </Paragraph>
+              )}
+            </div>
+          </div>
+        </div>
+      </div>
+    </Modal>
+  );
+}
diff --git a/frontend/app/[locale]/agents/components/agentInfo/DebugPromptCompareModal.tsx b/frontend/app/[locale]/agents/components/agentInfo/DebugPromptCompareModal.tsx
new file mode 100644
index 000000000..eec0ed132
--- /dev/null
+++ b/frontend/app/[locale]/agents/components/agentInfo/DebugPromptCompareModal.tsx
@@ -0,0 +1,76 @@
+"use client";
+
+import { useTranslation } from "react-i18next";
+import { Button, Modal, Space, Typography } from "antd";
+
+const { Paragraph, Text } = Typography;
+
+export interface DebugPromptCompareModalProps {
+  open: boolean;
+  originalFullPrompt: string;
+  optimizedFullPrompt: string;
+  onClose: () => void;
+  onApply: () => void;
+  applying?: boolean;
+}
+
+export default function DebugPromptCompareModal({
+  open,
+  originalFullPrompt,
+  optimizedFullPrompt,
+  onClose,
+  onApply,
+  applying,
+}: DebugPromptCompareModalProps) {
+  const { t } = useTranslation("common");
+
+  return (
+    <Modal
+      title={t("agent.debug.promptCompare.title", "Prompt compare")}
+      open={open}
+      onCancel={onClose}
+      width={1200}
+      footer={
+        <Space>
+          <Button onClick={onClose}>
+            {t("agent.debug.promptCompare.close", "Close")}
+          </Button>
+          <Button
+            type="primary"
+            onClick={onApply}
+            disabled={!optimizedFullPrompt.trim()}
+            loading={applying}
+          >
+            {t("agent.debug.promptCompare.apply", "Apply")}
+          </Button>
+        </Space>
+      }
+      destroyOnHidden
+    >
+      <div className="grid grid-cols-1 gap-4 lg:grid-cols-2">
+        <div className="border border-gray-200 rounded-md p-3 bg-gray-50">
+          <Text type="secondary" className="text-xs">
+            {t("agent.debug.promptCompare.original", "Original")}
+          </Text>
+          <Paragraph
+            style={{ whiteSpace: "pre-wrap", minHeight: 520, marginBottom: 0 }}
+            className="font-mono text-sm"
+          >
+            {originalFullPrompt || "-"}
+          </Paragraph>
+        </div>
+        <div className="border border-gray-200 rounded-md p-3">
+          <Text type="secondary" className="text-xs">
+            {t("agent.debug.promptCompare.optimized", "Optimized")}
+          </Text>
+          <Paragraph
+            style={{ whiteSpace: "pre-wrap", minHeight: 520, marginBottom: 0 }}
+            className="font-mono text-sm"
+          >
+            {optimizedFullPrompt || "-"}
+          </Paragraph>
+        </div>
+      </div>
+    </Modal>
+  );
+}
diff --git a/frontend/app/[locale]/agents/components/agentInfo/PromptOptimizeModal.tsx b/frontend/app/[locale]/agents/components/agentInfo/PromptOptimizeModal.tsx
index 1d7629951..897c523c3 100644
--- a/frontend/app/[locale]/agents/components/agentInfo/PromptOptimizeModal.tsx
+++ b/frontend/app/[locale]/agents/components/agentInfo/PromptOptimizeModal.tsx
@@ -1,6 +1,22 @@
-import { useEffect, useState } from "react";
+"use client";
+
+import { useEffect, useState, useRef, useCallback } from "react";
 import { useTranslation } from "react-i18next";
-import { App, Button, Card, Input, Modal, Space, Typography } from "antd";
+import {
+  App,
+  Button,
+  Card,
+  Input,
+  Modal,
+  Radio,
+  Space,
+  Spin,
+  Typography,
+  Divider,
+  Tooltip,
+  Alert,
+} from "antd";
+import { MousePointer2 } from "lucide-react";
 
 import log from "@/lib/logger";
 import { optimizePromptSection } from "@/services/promptService";
@@ -9,6 +25,8 @@ import type { OptimizePromptSectionResponse } from "@/types/agentConfig";
 const { TextArea } = Input;
 const { Paragraph, Text } = Typography;
 
+export type OptimizeMode = "general" | "insert" | "select";
+
 export interface PromptOptimizeModalProps {
   open: boolean;
   title: string;
@@ -21,7 +39,7 @@ export interface PromptOptimizeModalProps {
   subAgentIds: number[];
   knowledgeBaseDisplayNames?: string[];
   onClose: () => void;
-  onReplace: (content: string) => void;
+  onReplace: (content: string, sectionType: "duty" | "constraint" | "few_shots") => void;
 }
 
 export default function PromptOptimizeModal({
@@ -40,43 +58,115 @@ export default function PromptOptimizeModal({
 }: PromptOptimizeModalProps) {
   const { t } = useTranslation("common");
   const { message } = App.useApp();
+  const [mode, setMode] = useState<OptimizeMode>("general");
   const [feedback, setFeedback] = useState("");
+  const [startPos, setStartPos] = useState<string>("");
+  const [endPos, setEndPos] = useState<string>("");
   const [optimizedContent, setOptimizedContent] = useState("");
   const [isOptimizing, setIsOptimizing] = useState(false);
+  const [isContentSelected, setIsContentSelected] = useState(false);
+  const contentTextAreaRef = useRef<any>(null);
+
+  // Section header mapping: English -> Chinese
+  const headerMap: Record<string, string> = {
+    "# Duty": "#智能体角色",
+    "# Constraint": "#使用要求",
+    "# FewShots": "#示例",
+  };
+
+  const mapHeadersToChinese = (text: string) => {
+    let result = text;
+    for (const [en, zh] of Object.entries(headerMap)) {
+      result = result.split(en).join(zh);
+    }
+    return result;
+  };
 
   useEffect(() => {
     if (!open) {
       setFeedback("");
       setOptimizedContent("");
       setIsOptimizing(false);
+      setMode("general");
+      setStartPos("");
+      setEndPos("");
+      setIsContentSelected(false);
       return;
     }
-
     setFeedback("");
     setOptimizedContent("");
+    setIsOptimizing(false);
+    setMode("general");
+    setStartPos("");
+    setEndPos("");
+    setIsContentSelected(false);
   }, [open, sectionType, currentContent]);
 
+  const handleContentSelect = useCallback(() => {
+    if (!contentTextAreaRef.current) return;
+    const textarea = contentTextAreaRef.current.resizableTextArea?.textArea;
+    if (!textarea) return;
+
+    const { selectionStart, selectionEnd } = textarea;
+
+    // Insert mode: allow caret position even when no range is selected
+    if (selectionStart === selectionEnd) {
+      setStartPos(String(selectionStart));
+      setEndPos("");
+      setIsContentSelected(false);
+      setMode("insert");
+      return;
+    }
+
+    // Select mode: range selected
+    setStartPos(String(selectionStart));
+    setEndPos(String(selectionEnd));
+    setIsContentSelected(true);
+    setMode("select");
+  }, []);
+
   const handleOptimize = async () => {
     if (!feedback.trim()) {
       message.error(t("systemPrompt.optimize.feedbackRequired"));
       return;
     }
 
+    if (mode === "insert") {
+      const pos = parseInt(startPos, 10);
+      if (isNaN(pos) || pos < 0) {
+        message.error(t("systemPrompt.finetune.positionError"));
+        return;
+      }
+    }
+
+    if (mode === "select") {
+      const start = parseInt(startPos, 10);
+      const end = parseInt(endPos, 10);
+      if (isNaN(start) || isNaN(end) || start < 0 || end < 0 || start >= end) {
+        message.error(t("systemPrompt.finetune.positionError"));
+        return;
+      }
+    }
+
     setIsOptimizing(true);
     try {
       const result: OptimizePromptSectionResponse = await optimizePromptSection({
         agent_id: agentId,
         task_description: taskDescription,
-        model_id: String(modelId),
+        model_id: modelId,
         section_type: sectionType,
         section_title: title,
         current_content: currentContent,
         feedback,
+        mode,
+        start_pos: mode !== "general" ? parseInt(startPos, 10) : undefined,
+        end_pos: mode === "select" ? parseInt(endPos, 10) : undefined,
         tool_ids: toolIds,
         sub_agent_ids: subAgentIds,
         knowledge_base_display_names: knowledgeBaseDisplayNames,
       });
-      setOptimizedContent(result.optimized_content || "");
+      const fullText = mapHeadersToChinese(result.optimized_content || "");
+      setOptimizedContent(fullText);
     } catch (error: any) {
       log.error("Optimize prompt section failed:", error);
       message.error(error?.message || t("systemPrompt.optimize.error"));
@@ -86,12 +176,28 @@ export default function PromptOptimizeModal({
   };
 
   const handleReplace = () => {
-    if (!optimizedContent.trim()) {
-      return;
-    }
-    onReplace(optimizedContent);
+    if (!optimizedContent.trim() || isOptimizing) return;
+    onReplace(optimizedContent.trim(), sectionType);
   };
 
+  const modeOptions: Array<{ value: OptimizeMode; label: string; desc: string }> = [
+    {
+      value: "general",
+      label: t("systemPrompt.finetune.modeGeneral"),
+      desc: t("systemPrompt.finetune.modeGeneralDesc"),
+    },
+    {
+      value: "insert",
+      label: t("systemPrompt.finetune.modeInsert"),
+      desc: t("systemPrompt.finetune.modeInsertDesc"),
+    },
+    {
+      value: "select",
+      label: t("systemPrompt.finetune.modeSelect"),
+      desc: t("systemPrompt.finetune.modeSelectDesc"),
+    },
+  ];
+
   return (
     <Modal
       title={title}
@@ -100,9 +206,7 @@ export default function PromptOptimizeModal({
       width={1200}
       footer={
         <Space>
-          <Button onClick={onClose}>
-            {t("common.cancel")}
-          </Button>
+          <Button onClick={onClose}>{t("common.cancel")}</Button>
           <Button
             type="primary"
             onClick={handleReplace}
@@ -115,11 +219,97 @@ export default function PromptOptimizeModal({
       destroyOnHidden
     >
       <div className="flex flex-col gap-4">
+        {/* Mode Selection */}
+        <div>
+          <Text strong className="mb-2 block">
+            {t("systemPrompt.finetune.modeLabel")}
+          </Text>
+          <Radio.Group
+            value={mode}
+            onChange={(e) => setMode(e.target.value)}
+            className="flex flex-col gap-2"
+          >
+            {modeOptions.map((opt) => (
+              <Radio key={opt.value} value={opt.value} className="!ml-0">
+                <span className="font-medium">{opt.label}</span>
+                <span className="text-gray-500 text-sm ml-2">{opt.desc}</span>
+              </Radio>
+            ))}
+          </Radio.Group>
+        </div>
+
+        {/* Position inputs for insert/select modes */}
+        {mode !== "general" && (
+          <div className="bg-gray-50 rounded-md p-4">
+            {mode === "insert" && (
+              <div className="flex items-center gap-4">
+                <div className="flex-1">
+                  <Text type="secondary" className="text-xs">
+                    {t("systemPrompt.finetune.insertPositionLabel")}
+                  </Text>
+                  <Input
+                    type="number"
+                    min={0}
+                    value={startPos}
+                    onChange={(e) => setStartPos(e.target.value)}
+                    placeholder={t("systemPrompt.finetune.insertPositionPlaceholder")}
+                  />
+                </div>
+              </div>
+            )}
+            {mode === "select" && (
+              <div className="flex items-center gap-4 flex-wrap">
+                <div>
+                  <Text type="secondary" className="text-xs">
+                    {t("systemPrompt.finetune.selectStartLabel")}
+                  </Text>
+                  <Input
+                    type="number"
+                    min={0}
+                    value={startPos}
+                    onChange={(e) => setStartPos(e.target.value)}
+                    placeholder={t("systemPrompt.finetune.selectStartPlaceholder")}
+                    style={{ width: 140 }}
+                  />
+                </div>
+                <div>
+                  <Text type="secondary" className="text-xs">
+                    {t("systemPrompt.finetune.selectEndLabel")}
+                  </Text>
+                  <Input
+                    type="number"
+                    min={0}
+                    value={endPos}
+                    onChange={(e) => setEndPos(e.target.value)}
+                    placeholder={t("systemPrompt.finetune.selectEndPlaceholder")}
+                    style={{ width: 140 }}
+                  />
+                </div>
+              </div>
+            )}
+            {isContentSelected && (
+              <Alert
+                title={
+                  <span className="text-xs">
+                    {t("systemPrompt.finetune.selectTip")}: {startPos} - {endPos}
+                  </span>
+                }
+                type="success"
+                showIcon
+                className="mt-2"
+              />
+            )}
+          </div>
+        )}
+
+        <Divider className="my-2" />
+
+        {/* Feedback Input */}
         <div>
           <Text strong>{t("systemPrompt.optimize.feedbackLabel")}</Text>
           <TextArea
             value={feedback}
-            onChange={(event) => setFeedback(event.target.value)}
+            onChange={(e) => setFeedback(e.target.value)}
             placeholder={t("systemPrompt.optimize.feedbackPlaceholder")}
             rows={4}
             className="mt-2"
@@ -127,30 +317,64 @@ export default function PromptOptimizeModal({
           />
         </div>
 
+        {/* Submit Button */}
         <div className="flex justify-end">
-          <Button
-            type="primary"
-            onClick={handleOptimize}
-            loading={isOptimizing}
-          >
+          <Button type="primary" onClick={handleOptimize}>
             {t("systemPrompt.optimize.submit")}
           </Button>
         </div>
 
+        {/* Before/After Comparison */}
         <div className="grid grid-cols-1 gap-4 lg:grid-cols-2">
-          <Card title={t("systemPrompt.optimize.original")}>
-            <Paragraph
-              style={{ whiteSpace: "pre-wrap", minHeight: 320, marginBottom: 0 }}
-            >
-              {currentContent || t("common.none")}
-            </Paragraph>
+          <Card
+            title={
+              <div className="flex items-center justify-between">
+                <span>{t("systemPrompt.optimize.original")}</span>
+                <Tooltip title={t("systemPrompt.finetune.selectTip")}>
+                  <Button
+                    size="small"
+                    type="text"
+                    icon={<MousePointer2 size={12} />}
+                    onClick={handleContentSelect}
+                    disabled={isOptimizing}
+                  />
+                </Tooltip>
+              </div>
+            }
+            styles={{ body: { padding: 0 } }}
+          >
+            <TextArea
+              ref={contentTextAreaRef}
+              value={mapHeadersToChinese(currentContent)}
+              readOnly
+              rows={10}
+              className="border-0 rounded-none font-mono text-sm"
+              style={{
+                resize: "none",
+                background: "#fafafa",
+                minHeight: 200,
+              }}
+              onSelect={handleContentSelect}
+              onClick={handleContentSelect}
+              onKeyUp={handleContentSelect}
+            />
           </Card>
           <Card title={t("systemPrompt.optimize.optimized")}>
-            <Paragraph
-              style={{ whiteSpace: "pre-wrap", minHeight: 320, marginBottom: 0 }}
-            >
-              {optimizedContent || t("systemPrompt.optimize.empty")}
-            </Paragraph>
+            {isOptimizing ? (
+              <div className="flex flex-col items-center justify-center py-8 gap-3 min-h-[200px]">
+                <Spin size="medium" />
+                <span className="text-gray-500 text-sm">
+                  {t("systemPrompt.optimize.generating")}
+                </span>
+              </div>
+            ) : (
+              <Paragraph
+                style={{ whiteSpace: "pre-wrap", minHeight: 200, marginBottom: 0 }}
+                className="font-mono text-sm"
+              >
+                {optimizedContent || t("systemPrompt.optimize.empty")}
+              </Paragraph>
+            )}
           </Card>
         </div>
       </div>
diff --git a/frontend/app/[locale]/agents/components/agentInfo/PromptTemplateManagerModal.tsx b/frontend/app/[locale]/agents/components/agentInfo/PromptTemplateManagerModal.tsx
index 24434c0aa..a3c6ebded 100644
--- a/frontend/app/[locale]/agents/components/agentInfo/PromptTemplateManagerModal.tsx
+++ b/frontend/app/[locale]/agents/components/agentInfo/PromptTemplateManagerModal.tsx
@@ -119,16 +119,20 @@ export default function PromptTemplateManagerModal({
   };
 
   const openTemplateEditor = (template: PromptTemplate, readOnly = false) => {
-    editorForm.setFieldsValue({
-      template_name: template.template_name,
-      description: template.description || "",
-      template_content_zh: template.template_content_zh || createEmptyPromptTemplateContent(),
-      template_content_en: template.template_content_en || createEmptyPromptTemplateContent(),
-    });
     setEditingTemplate(template);
     setEditorSeedTemplate(template);
     setEditorReadOnly(readOnly);
     setEditorOpen(true);
+
+    // Defer form operations until Form is mounted inside the editor modal.
+    queueMicrotask(() => {
+      editorForm.setFieldsValue({
+        template_name: template.template_name,
+        description: template.description || "",
+        template_content_zh: template.template_content_zh || createEmptyPromptTemplateContent(),
+        template_content_en: template.template_content_en || createEmptyPromptTemplateContent(),
+      });
+    });
   };
 
   const closeEditor = () => {
@@ -136,7 +140,6 @@ export default function PromptTemplateManagerModal({
     setEditingTemplate(null);
     setEditorSeedTemplate(null);
     setEditorReadOnly(false);
-    editorForm.resetFields();
   };
 
   const buildPayload = (values: PromptTemplateFormValues): PromptTemplatePayload => {
@@ -446,7 +449,7 @@ export default function PromptTemplateManagerModal({
           : t("businessLogic.config.template.createTitle")}
         width={980}
         centered
-        destroyOnClose
+        destroyOnHidden
         okText={editorReadOnly ? t("common.close") : t("common.save")}
         cancelText={t("common.cancel")}
         cancelButtonProps={editorReadOnly ? { style: { display: "none" } } : undefined}
diff --git a/frontend/app/[locale]/agents/page.tsx b/frontend/app/[locale]/agents/page.tsx
index 52d66fe8a..2ef7692d4 100644
--- a/frontend/app/[locale]/agents/page.tsx
+++ b/frontend/app/[locale]/agents/page.tsx
@@ -12,6 +12,8 @@ import AgentInfoComp from "./components/AgentInfoComp";
 import { useAgentConfigStore } from "@/stores/agentConfigStore";
 import AgentVersionManage from "./AgentVersionManage";
 import AgentSelectorHeader from "./components/AgentSelectorHeader";
+import { searchAgentInfo } from "@/services/agentConfigService";
+import log from "@/lib/logger";
 
 const { Header, Content } = Layout;
 
@@ -21,6 +23,8 @@ export default function AgentSetupOrchestrator() {
   const enterCreateMode = useAgentConfigStore((state) => state.enterCreateMode);
   const reset = useAgentConfigStore((state) => state.reset);
   const setDefaultLlmConfig = useAgentConfigStore((state) => state.setDefaultLlmConfig);
+  const currentAgentId = useAgentConfigStore((state) => state.currentAgentId);
+  const setCurrentAgent = useAgentConfigStore((state) => state.setCurrentAgent);
   const { config } = useConfig();
 
   // Sync default LLM config from load_config
@@ -47,6 +51,26 @@ export default function AgentSetupOrchestrator() {
     }
   }, [searchParams, enterCreateMode]);
 
+  // Handle auto-select agent from URL params (agent_id)
+  useEffect(() => {
+    const agentId = searchParams.get('agent_id');
+    if (agentId && (!currentAgentId || String(currentAgentId) !== agentId)) {
+      const loadAgent = async () => {
+        try {
+          const result = await searchAgentInfo(parseInt(agentId));
+          if (result.success && result.data) {
+            setCurrentAgent(result.data);
+          } else {
+            log.warn("Failed to load agent from URL agent_id:", result.message);
+          }
+        } catch (error) {
+          log.error("Failed to load agent from URL agent_id:", error);
+        }
+      };
+      loadAgent();
+    }
+  }, [searchParams, currentAgentId, setCurrentAgent]);
+
   // Reset agent selection state when leaving the page
   useEffect(() => {
     return () => {
diff --git a/frontend/app/[locale]/chat/components/chatAgentSelector.tsx b/frontend/app/[locale]/chat/components/chatAgentSelector.tsx
index f7a540172..47449fd08 100644
--- a/frontend/app/[locale]/chat/components/chatAgentSelector.tsx
+++ b/frontend/app/[locale]/chat/components/chatAgentSelector.tsx
@@ -209,7 +209,8 @@ export function ChatAgentSelector({
       }
     }
 
-    onAgentSelect(agentId);
+    const agent = agentId !== null ? agents.find((a: Agent) => a.id === agentId) : null;
+    onAgentSelect(agentId, agent?.greeting_message, agent?.example_questions);
     setIsOpen(false);
 
     // If it's an iframe embedded page, send postMessage to the parent page
diff --git a/frontend/app/[locale]/chat/components/chatAttachment.tsx b/frontend/app/[locale]/chat/components/chatAttachment.tsx
index d12e939cd..69dfbc71a 100644
--- a/frontend/app/[locale]/chat/components/chatAttachment.tsx
+++ b/frontend/app/[locale]/chat/components/chatAttachment.tsx
@@ -19,7 +19,7 @@ import {
 } from "@/services/storageService";
 import { cn } from "@/lib/utils";
 import { AttachmentItem, ChatAttachmentProps } from "@/types/chat";
-import { FilePreviewDrawer } from "@/components/ui/filePreviewDrawer";
+import { FilePreviewDrawer } from "@/components/common/filePreviewDrawer";
 import { App } from "antd";
 
 // Selected file state for preview drawer
diff --git a/frontend/app/[locale]/chat/components/chatInput.tsx b/frontend/app/[locale]/chat/components/chatInput.tsx
index bcfc86f6b..512f940e9 100644
--- a/frontend/app/[locale]/chat/components/chatInput.tsx
+++ b/frontend/app/[locale]/chat/components/chatInput.tsx
@@ -15,10 +15,9 @@ import {
 } from "@ant-design/icons";
 
 import { Input } from "@/components/ui/input";
-import { Button } from "antd";
-import { Tooltip } from "@/components/ui/tooltip";
+import { Button, Tooltip } from "antd";
 import { Textarea } from "@/components/ui/textarea";
-import { FilePreviewDrawer } from "@/components/ui/filePreviewDrawer";
+import { FilePreviewDrawer } from "@/components/common/filePreviewDrawer";
 import { conversationService } from "@/services/conversationService";
 import { useConfig } from "@/hooks/useConfig";
 import { extractColorsFromUri } from "@/lib/avatar";
@@ -27,7 +26,7 @@ import { chatConfig } from "@/const/chatConfig";
 import { FilePreview } from "@/types/chat";
 
 import { ChatAgentSelector } from "./chatAgentSelector";
-import { TokenUsageIndicator } from "@/components/ui/tokenUsageIndicator";
+import { TokenUsageIndicator } from "@/components/common/tokenUsageIndicator";
 import { TokenMetrics } from "@/types/chat";
 
 // Get file extension
@@ -135,8 +134,10 @@ interface ChatInputProps {
   attachments?: FilePreview[];
   onAttachmentsChange?: (attachments: FilePreview[]) => void;
   selectedAgentId?: string | null;
-  onAgentSelect?: (agentId: string | null) => void;
+  onAgentSelect?: (agentId: string | null, greetingMessage?: string, exampleQuestions?: string[]) => void;
   latestMetrics?: TokenMetrics | null;
+  agentGreeting?: string | null;
+  agentExampleQuestions?: string[];
 }
 
 export function ChatInput({
@@ -156,6 +157,8 @@ export function ChatInput({
   selectedAgentId = null,
   onAgentSelect,
   latestMetrics = null,
+  agentGreeting = null,
+  agentExampleQuestions = [],
 }: ChatInputProps) {
   const [isRecording, setIsRecording] = useState(false);
   const [recordingStatus, setRecordingStatus] = useState<
@@ -1065,17 +1068,23 @@ export function ChatInput({
       {/* Chat input part */}
       {isInitialMode ? (
         <div className="flex flex-col items-center justify-center h-full w-full max-w-5xl mx-auto mt-[-80px]">
-          <div className="flex flex-col items-center mb-4">
-            <div className="flex items-center mb-6">
-              <div className="h-16 w-16 rounded-full overflow-hidden mr-4">
-                <img
-                  src={avatarUrl}
-                  alt={appConfig.appName}
-                  className="h-full w-full object-cover"
-                />
+          <div className="flex flex-col items-center mb-6">
+            <div className="h-16 w-16 rounded-full overflow-hidden mb-4 ring-2 ring-offset-2 ring-slate-100">
+              <img
+                src={avatarUrl}
+                alt={appConfig.appName}
+                className="h-full w-full object-cover"
+              />
+            </div>
+            {agentGreeting ? (
+              <div className="bg-gradient-to-br from-slate-50 to-white rounded-2xl px-6 py-5 max-w-2xl shadow-sm border border-slate-100 mb-4">
+                <p className="text-lg text-gray-800 leading-relaxed text-center">
+                  {agentGreeting}
+                </p>
               </div>
+            ) : (
               <h1
-                className="text-4xl font-bold bg-clip-text text-transparent"
+                className="text-4xl font-bold bg-clip-text text-transparent mb-2"
                 style={{
                   backgroundImage: (() => {
                     const colors = extractColorsFromUri(
@@ -1089,11 +1098,27 @@ export function ChatInput({
               >
                 {t("chatInput.helloIm", { appName: appConfig.appName })}
               </h1>
-            </div>
-            <p className="text-left text-muted-foreground max-w-2xl mx-auto leading-relaxed">
-              {appConfig.appDescription || t("chatInput.introMessage")}
-            </p>
+            )}
+            {!agentGreeting && (
+              <p className="text-left text-muted-foreground max-w-2xl mx-auto leading-relaxed">
+                {appConfig.appDescription || t("chatInput.introMessage")}
+              </p>
+            )}
           </div>
+          {agentExampleQuestions.length > 0 && (
+            <div className="flex flex-col gap-2 max-w-3xl mb-4 w-full">
+              {agentExampleQuestions.map((question, idx) => (
+                <button
+                  key={idx}
+                  onClick={() => onInputChange(question)}
+                  className="w-full px-4 py-3 rounded-xl border border-slate-200 bg-white hover:bg-slate-50 hover:border-slate-300 text-sm text-gray-700 shadow-sm transition-all text-left flex items-center gap-2"
+                >
+                  <span className="text-muted-foreground font-medium">{idx + 1}.</span>
+                  <span>{question}</span>
+                </button>
+              ))}
+            </div>
+          )}
           <div
             ref={dropAreaRef}
             className="relative w-full max-w-4xl rounded-3xl shadow-sm border border-slate-200 bg-slate-100 overflow-hidden"
diff --git a/frontend/app/[locale]/chat/internal/chatInterface.tsx b/frontend/app/[locale]/chat/internal/chatInterface.tsx
index 0f3c99715..9dd9bb847 100644
--- a/frontend/app/[locale]/chat/internal/chatInterface.tsx
+++ b/frontend/app/[locale]/chat/internal/chatInterface.tsx
@@ -113,6 +113,14 @@ export function ChatInterface() {
 
   // Add agent selection state
   const [selectedAgentId, setSelectedAgentId] = useState<string | null>(null);
+  const [agentGreeting, setAgentGreeting] = useState<string | null>(null);
+  const [agentExampleQuestions, setAgentExampleQuestions] = useState<string[]>([]);
+
+  const handleAgentSelectWithGreeting = (agentId: string | null, greeting?: string, exampleQuestions?: string[]) => {
+    setSelectedAgentId(agentId);
+    setAgentGreeting(greeting || null);
+    setAgentExampleQuestions(exampleQuestions || []);
+  };
 
   useEffect(() => {
     const agentId = sessionStorage.getItem("selectedAgentId");
@@ -1297,9 +1305,11 @@ export function ChatInterface() {
                 currentConversationId={conversationManagement.selectedConversationId ?? undefined}
                 shouldScrollToBottom={shouldScrollToBottom}
                 selectedAgentId={selectedAgentId}
-                onAgentSelect={setSelectedAgentId}
+                onAgentSelect={handleAgentSelectWithGreeting}
                 onCitationHover={clearCompletedIndicator}
                 onScroll={clearCompletedIndicator}
+                agentGreeting={agentGreeting}
+                agentExampleQuestions={agentExampleQuestions}
               />
             </div>
 
diff --git a/frontend/app/[locale]/chat/streaming/chatStreamFinalMessage.tsx b/frontend/app/[locale]/chat/streaming/chatStreamFinalMessage.tsx
index e5809c435..285225f23 100644
--- a/frontend/app/[locale]/chat/streaming/chatStreamFinalMessage.tsx
+++ b/frontend/app/[locale]/chat/streaming/chatStreamFinalMessage.tsx
@@ -10,7 +10,7 @@ import {
   ThumbsUp,
 } from "lucide-react";
 
-import { MarkdownRenderer } from "@/components/ui/markdownRenderer";
+import { MarkdownRenderer } from "@/components/common/markdownRenderer";
 
 /**
  * Convert custom code tags to standard markdown code fences
@@ -30,8 +30,7 @@ const convertToMarkdownCodeFences = (content: string): string => {
   });
   return content;
 };
-import { Button } from "antd";
-import { Tooltip, TooltipProvider } from "@/components/ui/tooltip";
+import { Button, Tooltip } from "antd";
 import { ChatMessageType, MaxStepsInfo } from "@/types/chat";
 import { chatConfig, Opinion } from "@/const/chatConfig";
 import { conversationService } from "@/services/conversationService";
@@ -354,6 +353,16 @@ function ChatStreamFinalMessageInner({
                 resolveS3Media={Boolean(message.finalAnswer || message.content)}
               />
 
+              {/* Skill-generated file attachments - render below the main content */}
+              {message.attachments && message.attachments.length > 0 && (
+                <div className="mt-3">
+                  <ChatAttachment
+                    attachments={message.attachments as AttachmentItem[]}
+                    onImageClick={onImageClick}
+                  />
+                </div>
+              )}
+
               {/* Button group - only show when hideButtons is false and message is complete */}
               {!hideButtons && message.isComplete && (
                 <div className="flex items-center justify-between mt-3">
@@ -393,7 +402,7 @@ function ChatStreamFinalMessageInner({
 
                   {/* Tool button */}
                   <div className="flex items-center space-x-2 mt-1 justify-end">
-                    <TooltipProvider>
+                    <div>
                       {/* Copy button */}
                       <Tooltip
                         title={
@@ -477,7 +486,7 @@ function ChatStreamFinalMessageInner({
                           {ttsButtonContent.icon}
                         </Button>
                       </Tooltip>
-                    </TooltipProvider>
+                    </div>
                   </div>
                 </div>
               )}
diff --git a/frontend/app/[locale]/chat/streaming/chatStreamHandler.tsx b/frontend/app/[locale]/chat/streaming/chatStreamHandler.tsx
index 366d0f035..8d19cd69f 100644
--- a/frontend/app/[locale]/chat/streaming/chatStreamHandler.tsx
+++ b/frontend/app/[locale]/chat/streaming/chatStreamHandler.tsx
@@ -148,6 +148,7 @@ export const handleStreamResponse = async (
     | typeof chatConfig.contentTypes.SEARCH_CONTENT
     | typeof chatConfig.contentTypes.CARD
     | typeof chatConfig.contentTypes.MEMORY_SEARCH
+    | typeof chatConfig.contentTypes.VERIFICATION
     | typeof chatConfig.contentTypes.PREPROCESS
     | null = null;
   let lastModelOutputIndex = -1; // Track the index of the last model output in currentStep.contents
@@ -795,6 +796,36 @@ export const handleStreamResponse = async (
                   });
                   break;
 
+                case chatConfig.messageTypes.VERIFICATION:
+                  if (!currentStep) {
+                    currentStep = {
+                      id: `step-verification-${Date.now()}-${Math.random()
+                        .toString(36)
+                        .substring(2, 9)}`,
+                      title: "Verification",
+                      content: "",
+                      expanded: true,
+                      contents: [],
+                      metrics: null,
+                      thinking: { content: "", expanded: true },
+                      code: { content: "", expanded: true },
+                      output: { content: "", expanded: true },
+                    };
+                  }
+
+                  currentStep.contents.push({
+                    id: `verification-${Date.now()}-${Math.random()
+                      .toString(36)
+                      .substring(2, 7)}`,
+                    type: chatConfig.messageTypes.VERIFICATION,
+                    subType: "verification",
+                    content: messageContent,
+                    expanded: true,
+                    timestamp: Date.now(),
+                  });
+                  lastContentType = chatConfig.contentTypes.VERIFICATION;
+                  break;
+
                 case chatConfig.messageTypes.MEMORY_SEARCH:
                   // If there's no currentStep, create one
                   if (!currentStep) {
@@ -943,6 +974,43 @@ export const handleStreamResponse = async (
                   }
                   break;
 
+                case chatConfig.messageTypes.SKILL_FILES:
+                  // Process skill-generated file uploads (e.g., documents created by skills)
+                  try {
+                    const skillFilesData = JSON.parse(messageContent);
+                    const skillUploads = skillFilesData.skill_file_uploads || [];
+
+                    // Convert uploads to AttachmentItem format
+                    const newAttachments = skillUploads
+                      .filter((upload: any) => upload.status === "success")
+                      .map((upload: any) => ({
+                        type: "file",
+                        name: upload.file_name || "document",
+                        size: upload.file_size || 0,
+                        object_name: upload.object_name,
+                        url: upload.preview_url || upload.presigned_url || upload.object_name,
+                        contentType: upload.mime_type,
+                      }));
+
+                    if (newAttachments.length > 0) {
+                      setMessages((prev) => {
+                        const newMessages = [...prev];
+                        const lastMsg = newMessages[newMessages.length - 1];
+                        if (lastMsg && lastMsg.role === MESSAGE_ROLES.ASSISTANT) {
+                          const existingAttachments = lastMsg.attachments || [];
+                          newMessages[newMessages.length - 1] = {
+                            ...lastMsg,
+                            attachments: [...existingAttachments, ...newAttachments],
+                          };
+                        }
+                        return newMessages;
+                      });
+                    }
+                  } catch (e) {
+                    log.error(t("chatStreamHandler.streamResponseError"), e);
+                  }
+                  break;
+
                 default:
                   // Process other types of messages
                   break;
diff --git a/frontend/app/[locale]/chat/streaming/chatStreamMain.tsx b/frontend/app/[locale]/chat/streaming/chatStreamMain.tsx
index 4d0dd8d88..27f2649d7 100644
--- a/frontend/app/[locale]/chat/streaming/chatStreamMain.tsx
+++ b/frontend/app/[locale]/chat/streaming/chatStreamMain.tsx
@@ -39,6 +39,8 @@ export function ChatStreamMain({
   onAgentSelect,
   onCitationHover,
   onScroll,
+  agentGreeting,
+  agentExampleQuestions,
 }: ChatStreamMainProps) {
   const { t } = useTranslation();
   // Animation variants for ChatInput
@@ -357,6 +359,8 @@ export function ChatStreamMain({
                         selectedAgentId={selectedAgentId}
                         onAgentSelect={onAgentSelect}
                         latestMetrics={latestMetrics}
+                        agentGreeting={agentGreeting}
+                        agentExampleQuestions={agentExampleQuestions}
                       />
                     </motion.div>
                   </AnimatePresence>
@@ -455,6 +459,8 @@ export function ChatStreamMain({
               selectedAgentId={selectedAgentId}
               onAgentSelect={onAgentSelect}
               latestMetrics={latestMetrics}
+              agentGreeting={agentGreeting}
+              agentExampleQuestions={agentExampleQuestions}
             />
           </motion.div>
         </AnimatePresence>
diff --git a/frontend/app/[locale]/chat/streaming/taskWindow.tsx b/frontend/app/[locale]/chat/streaming/taskWindow.tsx
index 665ed8467..5211c6ab8 100644
--- a/frontend/app/[locale]/chat/streaming/taskWindow.tsx
+++ b/frontend/app/[locale]/chat/streaming/taskWindow.tsx
@@ -9,11 +9,15 @@ import {
   FileText,
   ChevronRight,
   Wrench,
+  CheckCircle2,
+  AlertTriangle,
+  RotateCcw,
+  ShieldCheck,
 } from "lucide-react";
 
 import { ScrollArea } from "@/components/ui/scrollArea";
 import { Button, message as antdMessage } from "antd";
-import { MarkdownRenderer, CodeBlock } from "@/components/ui/markdownRenderer";
+import { MarkdownRenderer, CodeBlock } from "@/components/common/markdownRenderer";
 import { chatConfig } from "@/const/chatConfig";
 import {
   ChatMessageType,
@@ -1150,6 +1154,114 @@ const messageHandlers: MessageHandler[] = [
     render: (_message, _t) => null, // Return null, do not render this type of message
   },
 
+  // verification type processor - layered ReAct self-check status
+  {
+    canHandle: (message) =>
+      message.type === chatConfig.messageTypes.VERIFICATION,
+    render: (message, t) => {
+      let data: any = {};
+      try {
+        data =
+          typeof message.content === "string"
+            ? JSON.parse(message.content)
+            : message.content || {};
+      } catch (_) {
+        data = { message: message.content };
+      }
+
+      const phase = data.phase || "start";
+      const severity = data.severity || "info";
+      const labelMap: Record<string, string> = {
+        start: t("taskWindow.verification.start"),
+        pass: t("taskWindow.verification.pass"),
+        warning: t("taskWindow.verification.warning"),
+        blocked: t("taskWindow.verification.blocked"),
+        repair: t("taskWindow.verification.repair"),
+        final_pass: t("taskWindow.verification.finalPass"),
+        final_fail: t("taskWindow.verification.finalFail"),
+      };
+      const label =
+        labelMap[phase] || data.message || t("taskWindow.verification.start");
+      const rawMessage =
+        typeof data.message === "string" ? data.message.trim() : "";
+      const genericPassMessages = new Set([
+        "自检通过",
+        "最终自检通过",
+        "Self-check passed",
+        "Final self-check passed",
+      ]);
+      const fallbackReason = (() => {
+        if (data.event === "tool_precheck") {
+          return "动作非空、参数和语法已检查";
+        }
+        if (data.event === "retrieval") {
+          return "检索结果和错误信号已检查";
+        }
+        if (data.event === "handoff") {
+          return "子任务返回内容已检查";
+        }
+        if (data.event === "tool_result" || data.event === "code_execution") {
+          return "执行结果非空，未发现未处理错误";
+        }
+        if (data.event === "final_answer") {
+          return phase === "final_pass"
+            ? "答案完整、格式正常，未发现未处理错误"
+            : "答案非空、无内部标记、无占位符";
+        }
+        return "未发现阻断问题";
+      })();
+      const displayMessage =
+        (phase === "pass" || phase === "final_pass") &&
+        (!rawMessage || genericPassMessages.has(rawMessage))
+          ? `${rawMessage || label}：${fallbackReason}`
+          : rawMessage || label;
+      const tone =
+        phase === "final_pass" || phase === "pass"
+          ? "#047857"
+          : phase === "blocked" ||
+              phase === "final_fail" ||
+              severity === "blocking"
+            ? "#dc2626"
+            : phase === "repair" || phase === "warning"
+              ? "#d97706"
+              : "#2563eb";
+      const Icon =
+        phase === "final_pass" || phase === "pass"
+          ? CheckCircle2
+          : phase === "repair"
+            ? RotateCcw
+            : phase === "blocked" || phase === "final_fail"
+              ? AlertTriangle
+              : ShieldCheck;
+
+      return (
+        <div
+          style={{
+            display: "flex",
+            alignItems: "center",
+            gap: "0.5rem",
+            fontFamily:
+              "-apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, Helvetica, Arial, sans-serif",
+            fontSize: "0.875rem",
+            lineHeight: 1.5,
+            color: tone,
+            fontWeight: 500,
+            borderRadius: "0.25rem",
+            paddingTop: "0.5rem",
+          }}
+        >
+          <Icon size={16} />
+          <span>{displayMessage}</span>
+          {typeof data.score === "number" && (
+            <span style={{ opacity: 0.72 }}>
+              {Math.round(data.score * 100)}%
+            </span>
+          )}
+        </div>
+      );
+    },
+  },
+
   // error type processor - error information
   {
     canHandle: (message) => message.type === "error",
diff --git a/frontend/app/[locale]/knowledges/KnowledgeBaseConfiguration.tsx b/frontend/app/[locale]/knowledges/KnowledgeBaseConfiguration.tsx
index 09fe5c962..26cd438a5 100644
--- a/frontend/app/[locale]/knowledges/KnowledgeBaseConfiguration.tsx
+++ b/frontend/app/[locale]/knowledges/KnowledgeBaseConfiguration.tsx
@@ -157,7 +157,14 @@ function DataConfig({ isActive }: DataConfigProps) {
   const { t } = useTranslation();
   const { message } = App.useApp();
   const { confirm } = useConfirmModal();
-  const { modelConfig, data: configData, invalidateConfig, config, updateConfig, saveConfig } = useConfig();
+  const {
+    modelConfig,
+    data: configData,
+    invalidateConfig,
+    config,
+    updateConfig,
+    saveConfig,
+  } = useConfig();
   const { token } = theme.useToken();
 
   // Get available embedding models for knowledge base creation
@@ -177,7 +184,10 @@ function DataConfig({ isActive }: DataConfigProps) {
       setDataMateUrl("");
     }
 
-    if (configData?.app && typeof configData.app.modelEngineEnabled === "boolean") {
+    if (
+      configData?.app &&
+      typeof configData.app.modelEngineEnabled === "boolean"
+    ) {
       setModelEngineEnabled(configData.app.modelEngineEnabled);
     }
 
@@ -214,8 +224,11 @@ function DataConfig({ isActive }: DataConfigProps) {
   // Create mode state
   const [isCreatingMode, setIsCreatingMode] = useState(false);
   const [newKbName, setNewKbName] = useState("");
-  const [newKbIngroupPermission, setNewKbIngroupPermission] = useState<string>("READ_ONLY");
+  const [newKbIngroupPermission, setNewKbIngroupPermission] =
+    useState<string>("READ_ONLY");
   const [newKbGroupIds, setNewKbGroupIds] = useState<number[]>([]);
+  const [newKbPreserveSourceFile, setNewKbPreserveSourceFile] =
+    useState<boolean>(true);
   const [newKbEmbeddingModel, setNewKbEmbeddingModel] = useState<string>(""); // Selected embedding model for new KB
   const [uploadFiles, setUploadFiles] = useState<File[]>([]);
   const [hasClickedUpload, setHasClickedUpload] = useState(false);
@@ -269,7 +282,8 @@ function DataConfig({ isActive }: DataConfigProps) {
       const modelType = isMultimodal ? "multi_embedding" : "embedding";
       return availableEmbeddingModels.find(
         (model) =>
-          model.displayName === normalizedDisplayName && model.type === modelType
+          model.displayName === normalizedDisplayName &&
+          model.type === modelType
       )?.id;
     },
     [availableEmbeddingModels]
@@ -280,8 +294,13 @@ function DataConfig({ isActive }: DataConfigProps) {
     const singleEmbeddingModelName = modelConfig?.embedding?.modelName?.trim();
     const multiEmbeddingModelName =
       modelConfig?.multiEmbedding?.modelName?.trim();
-    setShowEmbeddingWarning(!singleEmbeddingModelName && !multiEmbeddingModelName);
-  }, [modelConfig?.embedding?.modelName, modelConfig?.multiEmbedding?.modelName]);
+    setShowEmbeddingWarning(
+      !singleEmbeddingModelName && !multiEmbeddingModelName
+    );
+  }, [
+    modelConfig?.embedding?.modelName,
+    modelConfig?.multiEmbedding?.modelName,
+  ]);
 
   // Add event listener for selecting new knowledge base
   useEffect(() => {
@@ -698,9 +717,11 @@ function DataConfig({ isActive }: DataConfigProps) {
     setNewKbName(defaultName);
     setNewKbIngroupPermission("READ_ONLY");
     setNewKbGroupIds([]);
+    setNewKbPreserveSourceFile(true);
     // Set default embedding model:
     // 1) configured embedding model, 2) configured multimodal model, 3) first available option.
-    const configEmbeddingModel = modelConfig?.embedding?.modelName?.trim() || "";
+    const configEmbeddingModel =
+      modelConfig?.embedding?.modelName?.trim() || "";
     const configMultiEmbeddingModel =
       modelConfig?.multiEmbedding?.modelName?.trim() || "";
     const preferredModel = [
@@ -715,7 +736,10 @@ function DataConfig({ isActive }: DataConfigProps) {
     );
     const defaultModel =
       (preferredModel &&
-        toEmbeddingModelOptionValue(preferredModel.modelName, preferredModel.type)) ||
+        toEmbeddingModelOptionValue(
+          preferredModel.modelName,
+          preferredModel.type
+        )) ||
       (availableEmbeddingModels[0]
         ? toEmbeddingModelOptionValue(
             availableEmbeddingModels[0].displayName,
@@ -795,7 +819,8 @@ function DataConfig({ isActive }: DataConfigProps) {
           newKbIngroupPermission,
           newKbGroupIds,
           parsedSelectedModel.displayName,
-          isMultimodal
+          isMultimodal,
+          newKbPreserveSourceFile
         );
 
         if (!newKB) {
@@ -1015,7 +1040,10 @@ function DataConfig({ isActive }: DataConfigProps) {
               onKnowledgeBaseUpdate={(updatedKnowledgeBase) => {
                 // Update knowledge base in list and active knowledge base
                 updateKnowledgeBase(updatedKnowledgeBase);
-                if (kbState.activeKnowledgeBase && kbState.activeKnowledgeBase.id === updatedKnowledgeBase.id) {
+                if (
+                  kbState.activeKnowledgeBase &&
+                  kbState.activeKnowledgeBase.id === updatedKnowledgeBase.id
+                ) {
                   setActiveKnowledgeBase(updatedKnowledgeBase);
                 }
               }}
@@ -1062,6 +1090,8 @@ function DataConfig({ isActive }: DataConfigProps) {
                 onIngroupPermissionChange={setNewKbIngroupPermission}
                 selectedGroupIds={newKbGroupIds}
                 onSelectedGroupIdsChange={setNewKbGroupIds}
+                preserveSourceFile={newKbPreserveSourceFile}
+                onPreserveSourceFileChange={setNewKbPreserveSourceFile}
                 // Embedding model for create mode
                 availableEmbeddingModels={availableEmbeddingModels}
                 selectedEmbeddingModel={newKbEmbeddingModel}
@@ -1102,25 +1132,30 @@ function DataConfig({ isActive }: DataConfigProps) {
                 isNewlyCreatedAndWaiting={isNewlyCreatedAndWaiting}
                 onChunkCountChange={() => {
                   // Trigger knowledge base list update to refresh chunk count
-                  knowledgeBasePollingService.triggerKnowledgeBaseListUpdate(true);
+                  knowledgeBasePollingService.triggerKnowledgeBaseListUpdate(
+                    true
+                  );
                 }}
-                  permission={kbState.activeKnowledgeBase?.permission}
+                permission={kbState.activeKnowledgeBase?.permission}
                 summaryFrequency={kbState.activeKnowledgeBase?.summaryFrequency}
                 onSummaryFrequencyChange={(frequency) => {
                   if (kbState.activeKnowledgeBase) {
-                    knowledgeBaseService.updateSummaryFrequency(
-                      kbState.activeKnowledgeBase.id,
-                      frequency
-                    ).then(() => {
-                      const updatedKB: KnowledgeBase = {
-                        ...kbState.activeKnowledgeBase!,
-                        summaryFrequency: frequency
-                      };
-                      updateKnowledgeBase(updatedKB);
-                      setActiveKnowledgeBase(updatedKB);
-                    }).catch((error) => {
-                      log.error("Failed to update summary frequency:", error);
-                    });
+                    knowledgeBaseService
+                      .updateSummaryFrequency(
+                        kbState.activeKnowledgeBase.id,
+                        frequency
+                      )
+                      .then(() => {
+                        const updatedKB: KnowledgeBase = {
+                          ...kbState.activeKnowledgeBase!,
+                          summaryFrequency: frequency,
+                        };
+                        updateKnowledgeBase(updatedKB);
+                        setActiveKnowledgeBase(updatedKB);
+                      })
+                      .catch((error) => {
+                        log.error("Failed to update summary frequency:", error);
+                      });
                   }
                 }}
                 // Upload related props
diff --git a/frontend/app/[locale]/knowledges/components/document/DocumentList.tsx b/frontend/app/[locale]/knowledges/components/document/DocumentList.tsx
index 3590db86b..4f75fd66e 100644
--- a/frontend/app/[locale]/knowledges/components/document/DocumentList.tsx
+++ b/frontend/app/[locale]/knowledges/components/document/DocumentList.tsx
@@ -10,9 +10,16 @@ import { useTranslation } from "react-i18next";
 import { Input, Button, App, Select } from "antd";
 const { TextArea } = Input;
 import { InfoCircleFilled } from "@ant-design/icons";
-import { BookText, Pilcrow, PencilRuler, Eye, Glasses, CircleOff } from "lucide-react";
-import { MarkdownRenderer } from "@/components/ui/markdownRenderer";
-import { FilePreviewDrawer } from "@/components/ui/filePreviewDrawer";
+import {
+  BookText,
+  Pilcrow,
+  PencilRuler,
+  Eye,
+  Glasses,
+  CircleOff,
+} from "lucide-react";
+import { MarkdownRenderer } from "@/components/common/markdownRenderer";
+import { FilePreviewDrawer } from "@/components/common/filePreviewDrawer";
 
 import {
   UI_CONFIG,
@@ -21,7 +28,10 @@ import {
   LAYOUT,
   DOCUMENT_STATUS,
 } from "@/const/knowledgeBase";
-import { SUMMARY_FREQUENCY_OPTIONS_API, FrequencyOption } from "@/const/scheduler";
+import {
+  SUMMARY_FREQUENCY_OPTIONS_API,
+  FrequencyOption,
+} from "@/const/scheduler";
 import knowledgeBaseService from "@/services/knowledgeBaseService";
 import { modelService } from "@/services/modelService";
 import { getTenantDefaultGroupId } from "@/services/groupService";
@@ -83,7 +93,9 @@ interface DocumentListProps {
   isMultimodal?: boolean;
   onMultimodalChange?: (value: boolean) => void;
   permission?: string; // User's permission for this knowledge base (READ_ONLY, EDIT, etc.)
-  
+  preserveSourceFile?: boolean;
+  onPreserveSourceFileChange?: (value: boolean) => void;
+
   // Auto-summary frequency
   summaryFrequency?: string | null;
   onSummaryFrequencyChange?: (frequency: string | null) => void;
@@ -132,7 +144,9 @@ const DocumentListContainer = forwardRef<DocumentListRef, DocumentListProps>(
       isMultimodal = false,
       onMultimodalChange,
       permission,
-      
+      preserveSourceFile = true,
+      onPreserveSourceFileChange,
+
       // Auto-summary frequency
       summaryFrequency,
       onSummaryFrequencyChange,
@@ -240,14 +254,16 @@ const DocumentListContainer = forwardRef<DocumentListRef, DocumentListProps>(
     const [showDetail, setShowDetail] = React.useState(false);
     const [showChunk, setShowChunk] = React.useState(false);
     const [summary, setSummary] = useState("");
-const [isSummarizing, setIsSummarizing] = useState(false);
-  const [isEditing, setIsEditing] = useState(false);
-  const [isSaving, setIsSaving] = useState(false);
-  const [selectedModel, setSelectedModel] = useState<number>(0);
-  const [availableModels, setAvailableModels] = useState<ModelOption[]>([]);
-  const [isLoadingModels, setIsLoadingModels] = useState(false);
-  const [frequencyOptions, setFrequencyOptions] = useState<FrequencyOption[]>([]);
-  const { t } = useTranslation();
+    const [isSummarizing, setIsSummarizing] = useState(false);
+    const [isEditing, setIsEditing] = useState(false);
+    const [isSaving, setIsSaving] = useState(false);
+    const [selectedModel, setSelectedModel] = useState<number>(0);
+    const [availableModels, setAvailableModels] = useState<ModelOption[]>([]);
+    const [isLoadingModels, setIsLoadingModels] = useState(false);
+    const [frequencyOptions, setFrequencyOptions] = useState<FrequencyOption[]>(
+      []
+    );
+    const { t } = useTranslation();
     const isDataMate = (knowledgeBaseSource || "").toLowerCase() === "datamate";
 
     // Determine if user has read-only permission
@@ -271,7 +287,9 @@ const [isSummarizing, setIsSummarizing] = useState(false);
         label: (
           <span className="flex items-center gap-2">
             {getPermissionIcon("READ_ONLY")}
-            <span>{t("tenantResources.knowledgeBase.permission.READ_ONLY")}</span>
+            <span>
+              {t("tenantResources.knowledgeBase.permission.READ_ONLY")}
+            </span>
           </span>
         ),
       },
@@ -341,33 +359,38 @@ const [isSummarizing, setIsSummarizing] = useState(false);
     };
 
     // Load frequency options from backend API
-  useEffect(() => {
-    const loadFrequencyOptions = async () => {
-      if (showDetail && frequencyOptions.length === 0) {
-        try {
-          const response = await fetch(SUMMARY_FREQUENCY_OPTIONS_API);
-          const data = await response.json();
-          setFrequencyOptions(data.options || []);
-        } catch (error) {
-          log.error("Failed to load frequency options:", error);
-          // Fallback to default options if API fails
-          setFrequencyOptions([
-            { value: "disabled", label: t("knowledgeBase.tag.autoSummary.off") },
-          ]);
+    useEffect(() => {
+      const loadFrequencyOptions = async () => {
+        if (showDetail && frequencyOptions.length === 0) {
+          try {
+            const response = await fetch(SUMMARY_FREQUENCY_OPTIONS_API);
+            const data = await response.json();
+            setFrequencyOptions(data.options || []);
+          } catch (error) {
+            log.error("Failed to load frequency options:", error);
+            // Fallback to default options if API fails
+            setFrequencyOptions([
+              {
+                value: "disabled",
+                label: t("knowledgeBase.tag.autoSummary.off"),
+              },
+            ]);
+          }
         }
-      }
-    };
-    loadFrequencyOptions();
-  }, [showDetail, frequencyOptions.length, t]);
+      };
+      loadFrequencyOptions();
+    }, [showDetail, frequencyOptions.length, t]);
 
-  // Load available models when showing detail
-  useEffect(() => {
-    const loadModels = async () => {
-      if (showDetail && availableModels.length === 0) {
+    // Load available models when showing detail
+    useEffect(() => {
+      const loadModels = async () => {
+        if (showDetail && availableModels.length === 0) {
           setIsLoadingModels(true);
           try {
             const models = await modelService.getLLMModels();
-            setAvailableModels(models.filter(m => m.connect_status === "available"));
+            setAvailableModels(
+              models.filter((m) => m.connect_status === "available")
+            );
 
             // Determine initial selection order:
             // 1) Knowledge base's own configured model (server-side config)
@@ -532,10 +555,16 @@ const [isSummarizing, setIsSummarizing] = useState(false);
         <div
           className={`${LAYOUT.KB_HEADER_PADDING} border-b border-gray-200 flex-shrink-0 flex items-center ${titleBarHeightClass}`}
         >
-          <div className="flex items-center justify-between w-full" style={{ width: "100%" }}>
-            <div className="flex items-center" style={{width: "100%"}}>
+          <div
+            className="flex items-center justify-between w-full"
+            style={{ width: "100%" }}
+          >
+            <div className="flex items-center" style={{ width: "100%" }}>
               {isCreatingMode ? (
-                <div className="flex items-center flex-1" style={{ width: "100%" }}>
+                <div
+                  className="flex items-center flex-1"
+                  style={{ width: "100%" }}
+                >
                   <Input
                     value={knowledgeBaseName}
                     onChange={(e) =>
@@ -551,14 +580,29 @@ const [isSummarizing, setIsSummarizing] = useState(false);
                     }
                   />
                   {/* Right-aligned container for dropdowns */}
-                  <div className="flex items-center ml-auto justify-end" style={{ gap: "12px", justifyContent: "flex-end", alignItems: "flex-end", width: "100%" }}>
+                  <div
+                    className="flex items-center ml-auto justify-end"
+                    style={{
+                      gap: "12px",
+                      justifyContent: "flex-end",
+                      alignItems: "flex-end",
+                      width: "100%",
+                    }}
+                  >
                     {/* Embedding model selection - first position in create mode */}
                     {isCreatingMode && onEmbeddingModelChange && (
                       <Select
                         value={selectedEmbeddingModel}
                         onChange={onEmbeddingModelChange}
-                        style={{ minWidth: 200, justifyContent: "center", alignItems: "flex-end" }}
-                        placeholder={t("knowledgeBase.create.embeddingModelPlaceholder") || "Select embedding model"}
+                        style={{
+                          minWidth: 200,
+                          justifyContent: "center",
+                          alignItems: "flex-end",
+                        }}
+                        placeholder={
+                          t("knowledgeBase.create.embeddingModelPlaceholder") ||
+                          "Select embedding model"
+                        }
                         allowClear={false}
                         options={[
                           {
@@ -574,7 +618,9 @@ const [isSummarizing, setIsSummarizing] = useState(false);
                           {
                             label: t("modelConfig.option.multiEmbeddingModel"),
                             options: embeddingModelsForOptions
-                              .filter((model) => model.type === "multi_embedding")
+                              .filter(
+                                (model) => model.type === "multi_embedding"
+                              )
                               .map((model) => ({
                                 value: `${model.displayName}::${model.type}`,
                                 label: model.displayName,
@@ -590,8 +636,14 @@ const [isSummarizing, setIsSummarizing] = useState(false);
                         mode="multiple"
                         value={isGroupSelectDisabled ? [] : selectedGroupIds}
                         onChange={onSelectedGroupIdsChange}
-                        style={{ minWidth: 200, justifyContent: "center", alignItems: "flex-end" }}
-                        placeholder={t("knowledgeBase.create.permission.groupPlaceholder")}
+                        style={{
+                          minWidth: 200,
+                          justifyContent: "center",
+                          alignItems: "flex-end",
+                        }}
+                        placeholder={t(
+                          "knowledgeBase.create.permission.groupPlaceholder"
+                        )}
                         options={groupOptions}
                         maxTagCount={2}
                         allowClear
@@ -603,11 +655,39 @@ const [isSummarizing, setIsSummarizing] = useState(false);
                       <Select
                         value={ingroupPermission}
                         onChange={onIngroupPermissionChange}
-                        style={{ width: 160, justifyContent: "center", alignItems: "flex-end" }}
-                        placeholder={t("knowledgeBase.ingroup.permission.DEFAULT")}
+                        style={{
+                          width: 160,
+                          justifyContent: "center",
+                          alignItems: "flex-end",
+                        }}
+                        placeholder={t(
+                          "knowledgeBase.ingroup.permission.DEFAULT"
+                        )}
                         options={permissionOptions}
                       />
                     </Can>
+                    {onPreserveSourceFileChange && (
+                      <Select
+                        value={preserveSourceFile}
+                        onChange={onPreserveSourceFileChange}
+                        style={{
+                          width: 200,
+                          justifyContent: "center",
+                          alignItems: "flex-end",
+                        }}
+                        allowClear={false}
+                        options={[
+                          {
+                            value: true,
+                            label: t("knowledgeBase.create.preserveSourceFile"),
+                          },
+                          {
+                            value: false,
+                            label: t("knowledgeBase.tag.noPreserveSourceFile"),
+                          },
+                        ]}
+                      />
+                    )}
                   </div>
                 </div>
               ) : (
@@ -699,7 +779,7 @@ const [isSummarizing, setIsSummarizing] = useState(false);
               />
             </div>
           ) : showDetail ? (
-<div className="px-8 py-4 h-full flex flex-col">
+            <div className="px-8 py-4 h-full flex flex-col">
               <div className="flex items-center justify-between mb-5">
                 <span className="font-bold text-lg">
                   {t("document.summary.title")}
@@ -737,13 +817,14 @@ const [isSummarizing, setIsSummarizing] = useState(false);
                       }}
                       disabled={isReadOnlyMode}
                       style={{ width: 85 }}
-placeholder={t("knowledgeBase.tag.autoSummary.off")}
-                      options={frequencyOptions.map(opt => ({
-                          value: opt.value,
-                          label: opt.value === "disabled" 
-                            ? t("knowledgeBase.tag.autoSummary.off") 
+                      placeholder={t("knowledgeBase.tag.autoSummary.off")}
+                      options={frequencyOptions.map((opt) => ({
+                        value: opt.value,
+                        label:
+                          opt.value === "disabled"
+                            ? t("knowledgeBase.tag.autoSummary.off")
                             : opt.label,
-                        }))}
+                      }))}
                     />
                   </div>
                   <Button
@@ -751,7 +832,10 @@ placeholder={t("knowledgeBase.tag.autoSummary.off")}
                     onClick={handleAutoSummary}
                     loading={isSummarizing}
                     disabled={
-                      !knowledgeBaseName || isSummarizing || !selectedModel || isReadOnlyMode
+                      !knowledgeBaseName ||
+                      isSummarizing ||
+                      !selectedModel ||
+                      isReadOnlyMode
                     }
                   >
                     {t("document.button.autoSummary")}
@@ -759,59 +843,59 @@ placeholder={t("knowledgeBase.tag.autoSummary.off")}
                 </div>
               </div>
               <div className="flex-1 min-h-0 mb-5 border border-gray-300 rounded-md overflow-auto">
-                  {isReadOnlyMode ? (
-                    <div className="p-5 text-lg leading-[1.7] whitespace-pre-wrap">
-                      <MarkdownRenderer content={summary} />
-                    </div>
-                  ) : isSummarizing ? (
-                    <div className="p-5 text-lg leading-[1.7] whitespace-pre-wrap">
-                      <MarkdownRenderer content={summary} />
-                    </div>
-                  ) : (
-                    <div
-                          className="w-full h-full cursor-text hover:bg-gray-50"
-                      onClick={() => {
-                        if (!isSummarizing) {
-                          setIsEditing(true);
-                        }
-                      }}
-                    >
-                      {isEditing ? (
-                        <TextArea
-                          value={summary}
-                          onChange={(e) => setSummary(e.target.value)}
-                          onBlur={() => setIsEditing(false)}
-                              className="w-full h-full border-0 resize-none focus:shadow-none"
-                          style={{
-                            height: '100%',
-                            padding: '20px',
-                            fontSize: '18px',
-                            lineHeight: '1.7',
-                            whiteSpace: 'pre-wrap',
-                          }}
-                          autoFocus
-                          placeholder={t("document.summary.placeholder")}
-                        />
-                      ) : (
-                              <div className="p-5 text-lg leading-[1.7] whitespace-pre-wrap">
-                                <MarkdownRenderer content={summary} />
-                              </div>
-                      )}
-                    </div>
-                  )}
+                {isReadOnlyMode ? (
+                  <div className="p-5 text-lg leading-[1.7] whitespace-pre-wrap">
+                    <MarkdownRenderer content={summary} />
+                  </div>
+                ) : isSummarizing ? (
+                  <div className="p-5 text-lg leading-[1.7] whitespace-pre-wrap">
+                    <MarkdownRenderer content={summary} />
+                  </div>
+                ) : (
+                  <div
+                    className="w-full h-full cursor-text hover:bg-gray-50"
+                    onClick={() => {
+                      if (!isSummarizing) {
+                        setIsEditing(true);
+                      }
+                    }}
+                  >
+                    {isEditing ? (
+                      <TextArea
+                        value={summary}
+                        onChange={(e) => setSummary(e.target.value)}
+                        onBlur={() => setIsEditing(false)}
+                        className="w-full h-full border-0 resize-none focus:shadow-none"
+                        style={{
+                          height: "100%",
+                          padding: "20px",
+                          fontSize: "18px",
+                          lineHeight: "1.7",
+                          whiteSpace: "pre-wrap",
+                        }}
+                        autoFocus
+                        placeholder={t("document.summary.placeholder")}
+                      />
+                    ) : (
+                      <div className="p-5 text-lg leading-[1.7] whitespace-pre-wrap">
+                        <MarkdownRenderer content={summary} />
+                      </div>
+                    )}
+                  </div>
+                )}
               </div>
               <div className="flex gap-3 justify-end">
-                  {!isReadOnlyMode && (
-                    <Button
-                      type="primary"
-                      size="large"
-                      onClick={handleSaveSummary}
-                      loading={isSaving}
-                      disabled={!summary || isSaving}
-                    >
-                      {t("common.save")}
-                    </Button>
-                  )}
+                {!isReadOnlyMode && (
+                  <Button
+                    type="primary"
+                    size="large"
+                    onClick={handleSaveSummary}
+                    loading={isSaving}
+                    disabled={!summary || isSaving}
+                  >
+                    {t("common.save")}
+                  </Button>
+                )}
                 <Button
                   size="large"
                   onClick={() => {
@@ -944,9 +1028,12 @@ placeholder={t("knowledgeBase.tag.autoSummary.off")}
                           <div className="flex gap-2">
                             <button
                               onClick={() => {
-                                const objectName =  extractObjectNameFromUrl(doc.id) || undefined;
+                                const objectName =
+                                  extractObjectNameFromUrl(doc.id) || undefined;
                                 if (!objectName) {
-                                  message.warning(t("filePreview.previewFailed"));
+                                  message.warning(
+                                    t("filePreview.previewFailed")
+                                  );
                                   return;
                                 }
 
@@ -1031,6 +1118,7 @@ placeholder={t("knowledgeBase.tag.autoSummary.off")}
             fileName={selectedFile.fileName}
             fileType={selectedFile.fileType}
             fileSize={selectedFile.fileSize}
+            previewContext="knowledgeBase"
             onClose={() => setSelectedFile(null)}
           />
         )}
diff --git a/frontend/app/[locale]/knowledges/components/knowledge/KnowledgeBaseList.tsx b/frontend/app/[locale]/knowledges/components/knowledge/KnowledgeBaseList.tsx
index 186b8e36c..53758147b 100644
--- a/frontend/app/[locale]/knowledges/components/knowledge/KnowledgeBaseList.tsx
+++ b/frontend/app/[locale]/knowledges/components/knowledge/KnowledgeBaseList.tsx
@@ -3,7 +3,7 @@ import { useTranslation } from "react-i18next";
 
 import log from "@/lib/logger";
 
-import { Button, Input, Select } from "antd";
+import { Button, Input, Select, Tooltip } from "antd";
 import {
   SyncOutlined,
   PlusOutlined,
@@ -19,7 +19,6 @@ import {
   SquarePen,
   CircleOff,
 } from "lucide-react";
-import { Tooltip } from "@/components/ui/tooltip";
 import { Can } from "@/components/permission/Can";
 import { useAuthorizationContext } from "@/components/providers/AuthorizationProvider";
 import { useGroupList } from "@/hooks/group/useGroupList";
@@ -639,6 +638,13 @@ const KnowledgeBaseList: React.FC<KnowledgeBaseListProps> = ({
                                   </span>
                                 ))}
                             </Can>
+                            {kb.preserve_source_file === false && (
+                              <span
+                                className={`inline-flex items-center ${KB_LAYOUT.TAG_PADDING} ${KB_LAYOUT.TAG_ROUNDED} ${KB_LAYOUT.TAG_TEXT} ${KB_LAYOUT.SECOND_ROW_TAG_MARGIN} bg-blue-100 text-blue-800 border border-blue-200 mr-1`}
+                              >
+                                {t("knowledgeBase.tag.noPreserveSourceFile")}
+                              </span>
+                            )}
                           </>
                         )}
                       </div>
diff --git a/frontend/app/[locale]/knowledges/contexts/DocumentContext.tsx b/frontend/app/[locale]/knowledges/contexts/DocumentContext.tsx
index 63d9ad1c2..668436765 100644
--- a/frontend/app/[locale]/knowledges/contexts/DocumentContext.tsx
+++ b/frontend/app/[locale]/knowledges/contexts/DocumentContext.tsx
@@ -1,7 +1,14 @@
-"use client"
+"use client";
 
-import { createContext, useReducer, useContext, ReactNode, useCallback, useEffect } from "react";
-import { useTranslation } from 'react-i18next';
+import {
+  createContext,
+  useReducer,
+  useContext,
+  ReactNode,
+  useCallback,
+  useEffect,
+} from "react";
+import { useTranslation } from "react-i18next";
 
 import { DOCUMENT_ACTION_TYPES } from "@/const/knowledgeBase";
 import knowledgeBaseService from "@/services/knowledgeBaseService";
@@ -9,17 +16,20 @@ import { DocumentState, DocumentAction } from "@/types/knowledgeBase";
 import log from "@/lib/logger";
 
 // Reducer function
-const documentReducer = (state: DocumentState, action: DocumentAction): DocumentState => {
+const documentReducer = (
+  state: DocumentState,
+  action: DocumentAction
+): DocumentState => {
   switch (action.type) {
     case DOCUMENT_ACTION_TYPES.FETCH_SUCCESS:
       return {
         ...state,
         documentsMap: {
           ...state.documentsMap,
-          [action.payload.kbId]: action.payload.documents
+          [action.payload.kbId]: action.payload.documents,
         },
         isLoadingDocuments: false,
-        error: null
+        error: null,
       };
     case DOCUMENT_ACTION_TYPES.SELECT_DOCUMENT:
       // Toggle document selection
@@ -28,41 +38,48 @@ const documentReducer = (state: DocumentState, action: DocumentAction): Document
       return {
         ...state,
         selectedIds: isSelected
-          ? state.selectedIds.filter(id => id !== docId)
-          : [...state.selectedIds, docId]
+          ? state.selectedIds.filter((id) => id !== docId)
+          : [...state.selectedIds, docId],
       };
     case DOCUMENT_ACTION_TYPES.SELECT_DOCUMENTS:
       return {
         ...state,
-        selectedIds: action.payload
+        selectedIds: action.payload,
       };
     case DOCUMENT_ACTION_TYPES.SELECT_ALL:
       const { kbId, selected } = action.payload;
       const documents = state.documentsMap[kbId] || [];
-      
+
       // If selected is true, add all document IDs, else remove all
       const newSelectedIds = selected
-        ? [...new Set([...state.selectedIds, ...documents.map(doc => doc.id)])]
-        : state.selectedIds.filter(id => !documents.some(doc => doc.id === id));
-      
+        ? [
+            ...new Set([
+              ...state.selectedIds,
+              ...documents.map((doc) => doc.id),
+            ]),
+          ]
+        : state.selectedIds.filter(
+            (id) => !documents.some((doc) => doc.id === id)
+          );
+
       return {
         ...state,
-        selectedIds: newSelectedIds
+        selectedIds: newSelectedIds,
       };
     case DOCUMENT_ACTION_TYPES.SET_UPLOAD_FILES:
       return {
         ...state,
-        uploadFiles: action.payload
+        uploadFiles: action.payload,
       };
     case DOCUMENT_ACTION_TYPES.SET_UPLOADING:
       return {
         ...state,
-        isUploading: action.payload
+        isUploading: action.payload,
       };
     case DOCUMENT_ACTION_TYPES.SET_LOADING_DOCUMENTS:
       return {
         ...state,
-        isLoadingDocuments: action.payload
+        isLoadingDocuments: action.payload,
       };
     case DOCUMENT_ACTION_TYPES.DELETE_DOCUMENT:
       const { kbId: deleteKbId, docId: deleteDocId } = action.payload;
@@ -71,36 +88,39 @@ const documentReducer = (state: DocumentState, action: DocumentAction): Document
         ...state,
         documentsMap: {
           ...state.documentsMap,
-          [deleteKbId]: state.documentsMap[deleteKbId]?.filter(doc => doc.id !== deleteDocId) || []
+          [deleteKbId]:
+            state.documentsMap[deleteKbId]?.filter(
+              (doc) => doc.id !== deleteDocId
+            ) || [],
         },
-        selectedIds: state.selectedIds.filter(id => id !== deleteDocId)
+        selectedIds: state.selectedIds.filter((id) => id !== deleteDocId),
       };
     case DOCUMENT_ACTION_TYPES.SET_LOADING_KB_ID:
       const { kbId: loadingKbId, isLoading } = action.payload;
       const newLoadingKbIds = new Set(state.loadingKbIds);
-      
+
       if (isLoading) {
         newLoadingKbIds.add(loadingKbId);
       } else {
         newLoadingKbIds.delete(loadingKbId);
       }
-      
+
       return {
         ...state,
-        loadingKbIds: newLoadingKbIds
+        loadingKbIds: newLoadingKbIds,
       };
     case DOCUMENT_ACTION_TYPES.CLEAR_DOCUMENTS:
       return {
         ...state,
         documentsMap: {},
         selectedIds: [],
-        error: null
+        error: null,
       };
     case DOCUMENT_ACTION_TYPES.ERROR:
       return {
         ...state,
         error: action.payload,
-        isLoadingDocuments: false
+        isLoadingDocuments: false,
       };
     default:
       return state;
@@ -111,8 +131,16 @@ const documentReducer = (state: DocumentState, action: DocumentAction): Document
 export const DocumentContext = createContext<{
   state: DocumentState;
   dispatch: React.Dispatch<DocumentAction>;
-  fetchDocuments: (kbId: string, forceRefresh?: boolean, kbSource?: string) => Promise<void>;
-  uploadDocuments: (kbId: string, files: File[], modelId?: number) => Promise<void>;
+  fetchDocuments: (
+    kbId: string,
+    forceRefresh?: boolean,
+    kbSource?: string
+  ) => Promise<void>;
+  uploadDocuments: (
+    kbId: string,
+    files: File[],
+    modelId?: number
+  ) => Promise<void>;
   deleteDocument: (kbId: string, docId: string) => Promise<void>;
 }>({
   state: {
@@ -122,12 +150,12 @@ export const DocumentContext = createContext<{
     isUploading: false,
     loadingKbIds: new Set<string>(),
     isLoadingDocuments: false,
-    error: null
+    error: null,
   },
   dispatch: () => {},
   fetchDocuments: async () => {},
   uploadDocuments: async () => {},
-  deleteDocument: async () => {}
+  deleteDocument: async () => {},
 });
 
 // Custom hook for using the context
@@ -138,7 +166,9 @@ interface DocumentProviderProps {
   children: ReactNode;
 }
 
-export const DocumentProvider: React.FC<DocumentProviderProps> = ({ children }) => {
+export const DocumentProvider: React.FC<DocumentProviderProps> = ({
+  children,
+}) => {
   const { t } = useTranslation();
   const [state, dispatch] = useReducer(documentReducer, {
     documentsMap: {},
@@ -147,115 +177,169 @@ export const DocumentProvider: React.FC<DocumentProviderProps> = ({ children })
     isUploading: false,
     loadingKbIds: new Set<string>(),
     isLoadingDocuments: false,
-    error: null
+    error: null,
   });
 
   // Listen for document update events
   useEffect(() => {
     const handleDocumentsUpdated = (event: Event) => {
       const customEvent = event as CustomEvent;
-      if (customEvent.detail && customEvent.detail.kbId && customEvent.detail.documents) {
+      if (
+        customEvent.detail &&
+        customEvent.detail.kbId &&
+        customEvent.detail.documents
+      ) {
         const { kbId, documents } = customEvent.detail;
-        
+
         // Update document information directly
-        dispatch({ 
-          type: DOCUMENT_ACTION_TYPES.FETCH_SUCCESS, 
-          payload: { kbId, documents } 
+        dispatch({
+          type: DOCUMENT_ACTION_TYPES.FETCH_SUCCESS,
+          payload: { kbId, documents },
         });
       }
     };
-    
+
     // Add event listener
-    window.addEventListener('documentsUpdated', handleDocumentsUpdated as EventListener);
-    
+    window.addEventListener(
+      "documentsUpdated",
+      handleDocumentsUpdated as EventListener
+    );
+
     // Cleanup function
     return () => {
-      window.removeEventListener('documentsUpdated', handleDocumentsUpdated as EventListener);
+      window.removeEventListener(
+        "documentsUpdated",
+        handleDocumentsUpdated as EventListener
+      );
     };
   }, []);
 
   // Fetch documents for a knowledge base
-  const fetchDocuments = useCallback(async (kbId: string, forceRefresh?: boolean, kbSource?: string) => {
-    // Skip if already loading this kb
-    if (state.loadingKbIds.has(kbId)) return;
-
-    // If forceRefresh is false and we have cached data, return directly
-    if (!forceRefresh && state.documentsMap[kbId] && state.documentsMap[kbId].length > 0) {
-      return; // If we have cached data and don't need force refresh, return directly without server request
-    }
+  const fetchDocuments = useCallback(
+    async (kbId: string, forceRefresh?: boolean, kbSource?: string) => {
+      // Skip if already loading this kb
+      if (state.loadingKbIds.has(kbId)) return;
 
-    dispatch({ type: DOCUMENT_ACTION_TYPES.SET_LOADING_KB_ID, payload: { kbId, isLoading: true } });
+      // If forceRefresh is false and we have cached data, return directly
+      if (
+        !forceRefresh &&
+        state.documentsMap[kbId] &&
+        state.documentsMap[kbId].length > 0
+      ) {
+        return; // If we have cached data and don't need force refresh, return directly without server request
+      }
 
-    try {
-      // Use getAllFiles() to get documents including those not yet in ES
-      const documents = await knowledgeBaseService.getAllFiles(kbId, kbSource);
       dispatch({
-        type: DOCUMENT_ACTION_TYPES.FETCH_SUCCESS,
-        payload: { kbId, documents }
+        type: DOCUMENT_ACTION_TYPES.SET_LOADING_KB_ID,
+        payload: { kbId, isLoading: true },
       });
-    } catch (error) {
-      log.error(t('document.error.fetch'), error);
-      dispatch({ type: DOCUMENT_ACTION_TYPES.ERROR, payload: t('document.error.load') });
-    } finally {
-      dispatch({ type: DOCUMENT_ACTION_TYPES.SET_LOADING_KB_ID, payload: { kbId, isLoading: false } });
-    }
-  }, [state.loadingKbIds, state.documentsMap, t]);
+
+      try {
+        // Use getAllFiles() to get documents including those not yet in ES
+        const documents = await knowledgeBaseService.getAllFiles(
+          kbId,
+          kbSource
+        );
+        dispatch({
+          type: DOCUMENT_ACTION_TYPES.FETCH_SUCCESS,
+          payload: { kbId, documents },
+        });
+      } catch (error) {
+        log.error(t("document.error.fetch"), error);
+        dispatch({
+          type: DOCUMENT_ACTION_TYPES.ERROR,
+          payload: t("document.error.load"),
+        });
+      } finally {
+        dispatch({
+          type: DOCUMENT_ACTION_TYPES.SET_LOADING_KB_ID,
+          payload: { kbId, isLoading: false },
+        });
+      }
+    },
+    [state.loadingKbIds, state.documentsMap, t]
+  );
 
   // Upload documents to a knowledge base
-  const uploadDocuments = useCallback(async (kbId: string, files: File[], modelId?: number) => {
-    dispatch({ type: DOCUMENT_ACTION_TYPES.SET_UPLOADING, payload: true });
-    
-    try {
-      await knowledgeBaseService.uploadDocuments(kbId, files, undefined, modelId);
-      
-      // Set loading state before fetching latest documents
-      dispatch({ type: DOCUMENT_ACTION_TYPES.SET_LOADING_DOCUMENTS, payload: true });
-      
-      // Get latest status immediately after upload
-      const latestDocuments = await knowledgeBaseService.getAllFiles(kbId);
-      // Update document status
-      dispatch({ 
-        type: DOCUMENT_ACTION_TYPES.FETCH_SUCCESS, 
-        payload: { kbId, documents: latestDocuments } 
-      });
-      
-      // Trigger document status update event to notify other components
-      window.dispatchEvent(new CustomEvent('documentsUpdated', {
-        detail: { 
+  const uploadDocuments = useCallback(
+    async (kbId: string, files: File[], modelId?: number) => {
+      dispatch({ type: DOCUMENT_ACTION_TYPES.SET_UPLOADING, payload: true });
+
+      try {
+        await knowledgeBaseService.uploadDocuments(
           kbId,
-          documents: latestDocuments 
-        }
-      }));
-      
-      // Clear upload files
-      dispatch({ type: DOCUMENT_ACTION_TYPES.SET_UPLOAD_FILES, payload: [] });
-    } catch (error) {
-      log.error(t('document.error.upload'), error);
-      dispatch({ type: DOCUMENT_ACTION_TYPES.ERROR, payload: `${t('document.error.upload')}. ${t('document.error.retry')}` });
-    } finally {
-      dispatch({ type: DOCUMENT_ACTION_TYPES.SET_UPLOADING, payload: false });
-      dispatch({ type: DOCUMENT_ACTION_TYPES.SET_LOADING_DOCUMENTS, payload: false });
-    }
-  }, [t]);
+          files,
+          undefined,
+          modelId
+        );
+
+        // Set loading state before fetching latest documents
+        dispatch({
+          type: DOCUMENT_ACTION_TYPES.SET_LOADING_DOCUMENTS,
+          payload: true,
+        });
+
+        // Get latest status immediately after upload
+        const latestDocuments = await knowledgeBaseService.getAllFiles(kbId);
+        // Update document status
+        dispatch({
+          type: DOCUMENT_ACTION_TYPES.FETCH_SUCCESS,
+          payload: { kbId, documents: latestDocuments },
+        });
+
+        // Trigger document status update event to notify other components
+        window.dispatchEvent(
+          new CustomEvent("documentsUpdated", {
+            detail: {
+              kbId,
+              documents: latestDocuments,
+            },
+          })
+        );
+
+        // Clear upload files
+        dispatch({ type: DOCUMENT_ACTION_TYPES.SET_UPLOAD_FILES, payload: [] });
+      } catch (error) {
+        log.error(t("document.error.upload"), error);
+        dispatch({
+          type: DOCUMENT_ACTION_TYPES.ERROR,
+          payload: `${t("document.error.upload")}. ${t("document.error.retry")}`,
+        });
+      } finally {
+        dispatch({ type: DOCUMENT_ACTION_TYPES.SET_UPLOADING, payload: false });
+        dispatch({
+          type: DOCUMENT_ACTION_TYPES.SET_LOADING_DOCUMENTS,
+          payload: false,
+        });
+      }
+    },
+    [t]
+  );
 
   // Delete a document
-  const deleteDocument = useCallback(async (kbId: string, docId: string) => {
-    try {
-      await knowledgeBaseService.deleteDocument(docId, kbId);
-      dispatch({ 
-        type: DOCUMENT_ACTION_TYPES.DELETE_DOCUMENT, 
-        payload: { kbId, docId } 
-      });
-    } catch (error) {
-      log.error(t('document.error.delete'), error);
-      dispatch({ type: DOCUMENT_ACTION_TYPES.ERROR, payload: `${t('document.error.delete')}. ${t('document.error.retry')}` });
-    }
-  }, [t]);
+  const deleteDocument = useCallback(
+    async (kbId: string, docId: string) => {
+      try {
+        await knowledgeBaseService.deleteDocument(docId, kbId);
+        dispatch({
+          type: DOCUMENT_ACTION_TYPES.DELETE_DOCUMENT,
+          payload: { kbId, docId },
+        });
+      } catch (error) {
+        log.error(t("document.error.delete"), error);
+        dispatch({
+          type: DOCUMENT_ACTION_TYPES.ERROR,
+          payload: `${t("document.error.delete")}. ${t("document.error.retry")}`,
+        });
+      }
+    },
+    [t]
+  );
 
   return (
-    <DocumentContext.Provider 
-      value={{ 
-        state, 
+    <DocumentContext.Provider
+      value={{
+        state,
         dispatch,
         fetchDocuments,
         uploadDocuments,
@@ -265,4 +349,4 @@ export const DocumentProvider: React.FC<DocumentProviderProps> = ({ children })
       {children}
     </DocumentContext.Provider>
   );
-}; 
+};
diff --git a/frontend/app/[locale]/knowledges/contexts/KnowledgeBaseContext.tsx b/frontend/app/[locale]/knowledges/contexts/KnowledgeBaseContext.tsx
index 9733d44c4..eb3a05fa0 100644
--- a/frontend/app/[locale]/knowledges/contexts/KnowledgeBaseContext.tsx
+++ b/frontend/app/[locale]/knowledges/contexts/KnowledgeBaseContext.tsx
@@ -118,7 +118,8 @@ export const KnowledgeBaseContext = createContext<{
     ingroup_permission?: string,
     group_ids?: number[],
     embeddingModel?: string,
-    is_multimodal?: boolean
+    is_multimodal?: boolean,
+    preserve_source_file?: boolean
   ) => Promise<KnowledgeBase | null>;
   deleteKnowledgeBase: (id: string) => Promise<boolean>;
   selectKnowledgeBase: (id: string) => void;
@@ -348,7 +349,8 @@ export const KnowledgeBaseProvider: React.FC<KnowledgeBaseProviderProps> = ({
       ingroup_permission?: string,
       group_ids?: number[],
       embeddingModel?: string,
-      is_multimodal?: boolean
+      is_multimodal?: boolean,
+      preserve_source_file?: boolean
     ) => {
       try {
         const selectedEmbeddingModel = embeddingModel?.trim() || "";
@@ -372,6 +374,7 @@ export const KnowledgeBaseProvider: React.FC<KnowledgeBaseProviderProps> = ({
           ingroup_permission,
           group_ids,
           is_multimodal: resolvedIsMultimodal,
+          preserve_source_file,
         });
         return newKB;
       } catch (error) {
diff --git a/frontend/app/[locale]/space/components/AgentCard.tsx b/frontend/app/[locale]/space/components/AgentCard.tsx
index 0e005d9be..cd4ecb57a 100644
--- a/frontend/app/[locale]/space/components/AgentCard.tsx
+++ b/frontend/app/[locale]/space/components/AgentCard.tsx
@@ -139,9 +139,9 @@ export default function AgentCard({ agent, onRefresh }: AgentCardProps) {
     }
   };
 
-  // Handle edit - navigate to agents view
+  // Handle edit - navigate to agents view with agent id
   const handleEdit = () => {
-    router.push("/agents");
+    router.push(`/agents?agent_id=${agent.id}`);
   };
 
   const queryClient = useQueryClient();
@@ -166,7 +166,10 @@ export default function AgentCard({ agent, onRefresh }: AgentCardProps) {
     setShowDetail(true);
     setIsLoadingDetails(true);
     try {
-      const result = await searchAgentInfo(parseInt(agent.id));
+      // Use current_version_no if available (the currently published version)
+      // Falls back to 0 only if not set (for unpublished/draft agents)
+      const versionNo = agent.current_version_no ?? 0;
+      const result = await searchAgentInfo(parseInt(agent.id), undefined, versionNo);
       if (result.success) {
         setAgentDetails(result.data);
       } else {
diff --git a/frontend/app/[locale]/tenant-resources/components/AssetOwnerResourcesComp.tsx b/frontend/app/[locale]/tenant-resources/components/AssetOwnerResourcesComp.tsx
index 38fb3ceb1..6cf23c0a9 100644
--- a/frontend/app/[locale]/tenant-resources/components/AssetOwnerResourcesComp.tsx
+++ b/frontend/app/[locale]/tenant-resources/components/AssetOwnerResourcesComp.tsx
@@ -54,7 +54,7 @@ export default function AssetOwnerResourcesComp() {
 
           <Tabs
             defaultActiveKey="users"
-            className="h-full flex flex-col"
+            className="h-full flex flex-col overflow-hidden [&_.ant-tabs-contentHolder]:flex-1 [&_.ant-tabs-contentHolder]:overflow-hidden asset-owner-tabs"
             items={[
               {
                 key: "users",
@@ -108,3 +108,17 @@ export default function AssetOwnerResourcesComp() {
     </div>
   );
 }
+
+<style jsx global>{`
+  .asset-owner-tabs .ant-tabs-content {
+    width: 100%;
+    height: 100%;
+  }
+  .asset-owner-tabs .ant-tabs-tabpane {
+    height: 100%;
+    overflow: hidden;
+  }
+  .asset-owner-tabs .ant-tabs-nav {
+    flex-shrink: 0;
+  }
+`}</style>
diff --git a/frontend/app/[locale]/tenant-resources/components/UserManageComp.tsx b/frontend/app/[locale]/tenant-resources/components/UserManageComp.tsx
index f4d20ae0b..cfff26fe9 100644
--- a/frontend/app/[locale]/tenant-resources/components/UserManageComp.tsx
+++ b/frontend/app/[locale]/tenant-resources/components/UserManageComp.tsx
@@ -18,6 +18,8 @@ import {
   Pagination,
   Alert,
   Space,
+  Divider,
+  Tooltip
 } from "antd";
 import {
   Users,
@@ -62,7 +64,6 @@ import { useDeployment } from "@/components/providers/deploymentProvider";
 import { useAuthorizationContext } from "@/components/providers/AuthorizationProvider";
 import { USER_ROLES } from "@/const/auth";
 import { Can } from "@/components/permission/Can";
-import { Tooltip } from "@/components/ui/tooltip";
 import {
   getPasswordChecks,
   getStrengthLevel,
@@ -1179,167 +1180,182 @@ export default function UserManageComp() {
   };
 
   return (
-    <div className="w-full h-full">
+    <div className="flex flex-col w-full h-full">
       {/* Page header: grouped header without dividing line */}
-      <div className="w-full px-10 pt-10">
-        <motion.div
-          initial={{ opacity: 0, y: -8 }}
-          animate={{ opacity: 1, y: 0 }}
-          transition={{ duration: 0.35 }}
-        >
-          <div className="flex items-center gap-3">
-            <div className="w-12 h-12 rounded-full bg-gradient-to-br from-purple-500 to-indigo-500 flex items-center justify-center shadow-sm">
-              <Building2 className="h-6 w-6 text-white" />
-            </div>
-            <div>
-              <h1 className="text-2xl font-bold text-purple-600 dark:text-purple-500">
-                {t("tenantResources.title") || "Tenant Resource Management"}
-              </h1>
-              <p className="text-slate-600 dark:text-slate-300 mt-1">
-                {t("tenantResources.subtitle") ||
-                  "Manage tenants, users, groups and resources"}
-              </p>
-            </div>
+      <div className="flex w-full px-6 pt-12">
+        <div className="flex items-center gap-3">
+          <div className="w-12 h-12 rounded-full bg-gradient-to-br from-purple-500 to-indigo-500 flex items-center justify-center shadow-sm">
+            <Building2 className="h-6 w-6 text-white" />
           </div>
-        </motion.div>
+          <div>
+            <h1 className="text-2xl font-bold text-purple-600 dark:text-purple-500">
+              {t("tenantResources.title") || "Tenant Resource Management"}
+            </h1>
+            <p className="text-slate-600 dark:text-slate-300 mt-1">
+              {t("tenantResources.subtitle") ||
+                "Manage tenants, users, groups and resources"}
+            </p>
+          </div>
+        </div>
       </div>
-      <Row className="flex-1 min-h-0 h-full" align="stretch">
-        <Can permission="tenant.list:read">
-          <Col className="flex flex-col h-full" style={{ width: 300 }}>
-            <div className="h-full pr-6">
-              <div className="sticky top-6">
-                <div className="bg-white dark:bg-gray-800 rounded-md shadow-sm p-3">
-                  <TenantList
-                    selected={tenantId}
-                    onSelect={(id) => setTenantId(id)}
-                    tenants={tenantData?.data || []}
-                    total={tenantData?.total}
-                    page={tenantData?.page}
-                    pageSize={tenantData?.page_size}
-                    totalPages={tenantData?.total_pages}
-                    onPageChange={handlePageChange}
-                    onTenantsRefetch={async () => {
-                      setCurrentPage(1);
-                      return refetchTenants();
-                    }}
-                    loading={tenantsLoading}
-                    t={t}
-                    onUserListRefresh={() =>
-                      setUserListRefreshKey((prev) => prev + 1)
-                    }
-                    onInvitationListRefresh={() =>
-                      setInvitationListRefreshKey((prev) => prev + 1)
-                    }
-                    locale={locale}
-                  />
+      <div className="flex-1 min-h-0 h-full">
+        <div className="flex h-full">
+          <Can permission="tenant.list:read">
+            <Col className="flex flex-col h-full" style={{ width: 300 }}>
+              <div className="h-full pr-6">
+                <div className="sticky top-6">
+                  <div className="bg-white dark:bg-gray-800 rounded-md shadow-sm p-3">
+                    <TenantList
+                      selected={tenantId}
+                      onSelect={(id) => setTenantId(id)}
+                      tenants={tenantData?.data || []}
+                      total={tenantData?.total}
+                      page={tenantData?.page}
+                      pageSize={tenantData?.page_size}
+                      totalPages={tenantData?.total_pages}
+                      onPageChange={handlePageChange}
+                      onTenantsRefetch={async () => {
+                        setCurrentPage(1);
+                        return refetchTenants();
+                      }}
+                      loading={tenantsLoading}
+                      t={t}
+                      onUserListRefresh={() =>
+                        setUserListRefreshKey((prev) => prev + 1)
+                      }
+                      onInvitationListRefresh={() =>
+                        setInvitationListRefreshKey((prev) => prev + 1)
+                      }
+                      locale={locale}
+                    />
+                  </div>
                 </div>
               </div>
-            </div>
-          </Col>
-        </Can>
-        <Col className="flex-1 flex flex-col p-6 overflow-hidden">
-          <div className="bg-white dark:bg-gray-800 rounded-md shadow-sm p-4 h-full flex flex-col overflow-hidden">
-            {/* Tenant name header */}
-            <div className="mb-4 pb-2 border-b border-gray-200 dark:border-gray-700 flex-shrink-0">
-              {isEditingTenantName ? (
-                <Input
-                  ref={tenantNameInputRef}
-                  value={editingTenantName}
-                  onChange={(e) => setEditingTenantName(e.target.value)}
-                  onBlur={saveTenantName}
-                  onKeyDown={handleTenantNameKeyDown}
-                  className="text-lg font-semibold text-gray-900 dark:text-gray-100"
-                  placeholder={t("tenantResources.tenants.name")}
-                />
-              ) : (
-                <div
-                  className="flex items-center gap-2 group cursor-pointer"
-                  onClick={startEditingTenantName}
-                >
-                  <h2 className="text-lg font-semibold text-gray-900 dark:text-gray-100">
-                    {currentTenantName}
-                  </h2>
-                  <Edit2 className="h-4 w-4 text-gray-400 opacity-0 group-hover:opacity-100 transition-opacity" />
+            </Col>
+          </Can>
+          <Col className="flex-1 flex flex-col p-6 overflow-hidden">
+            <div className="bg-white dark:bg-gray-800 rounded-md shadow-sm p-4 h-full flex flex-col overflow-hidden">
+              {/* Tenant name header */}
+              <div className="flex">
+                {isEditingTenantName ? (
+                  <Input
+                    ref={tenantNameInputRef}
+                    value={editingTenantName}
+                    onChange={(e) => setEditingTenantName(e.target.value)}
+                    onBlur={saveTenantName}
+                    onKeyDown={handleTenantNameKeyDown}
+                    className="text-lg font-semibold text-gray-900 dark:text-gray-100"
+                    placeholder={t("tenantResources.tenants.name")}
+                  />
+                ) : (
+                  <div
+                    className="flex items-center gap-2 group cursor-pointer"
+                    onClick={startEditingTenantName}
+                  >
+                    <h2 className="text-lg font-semibold text-gray-900 dark:text-gray-100">
+                      {currentTenantName}
+                    </h2>
+                    <Edit2 className="h-4 w-4 text-gray-400 opacity-0 group-hover:opacity-100 transition-opacity" />
+                  </div>
+                )}
+                
+              </div>
+              
+              <div className="flex-1 min-h-0 h-full">
+                <Divider size="small"/>
+                <div className="flex h-full w-full">
+                  {tenantId ? (
+                    <Tabs
+                      defaultActiveKey="users"
+                      className="h-full flex flex-col tenant-resource-tabs w-full overflow-hidden"
+                      items={[
+                        {
+                          key: "users",
+                          label: t("tenantResources.tabs.users") || "Users",
+                          children: (
+                            <UserList
+                              tenantId={tenantId}
+                              refreshKey={userListRefreshKey}
+                            />
+                          ),
+                        },
+                        {
+                          key: "groups",
+                          label: t("tenantResources.tabs.groups") || "Groups",
+                          children: <GroupList tenantId={tenantId} />,
+                        },
+                        {
+                          key: "models",
+                          label: t("tenantResources.tabs.models") || "Models",
+                          children: <ModelList tenantId={tenantId} />,
+                        },
+                        {
+                          key: "knowledge",
+                          label:
+                            t("tenantResources.tabs.knowledge") || "Knowledge Base",
+                          children: <KnowledgeList tenantId={tenantId} />,
+                        },
+                        {
+                          key: "agents",
+                          label: t("tenantResources.tabs.agents") || "Agents",
+                          children: <AgentList tenantId={tenantId} />,
+                        },
+                        {
+                          key: "mcp",
+                          label: t("tenantResources.tabs.mcp") || "MCP",
+                          children: <McpList tenantId={tenantId} />,
+                        },
+                        {
+                          key: "skills",
+                          label: "Skills",
+                          children: <SkillList tenantId={tenantId} />,
+                        },
+                        {
+                          key: "invitations",
+                          label: t("tenantResources.invitation.tab") || "Invitations",
+                          children: (
+                            <InvitationList
+                              tenantId={tenantId}
+                              refreshKey={invitationListRefreshKey}
+                            />
+                          ),
+                        },
+                      ]}
+                    />
+                  ) : (
+                    <div className="flex flex-col items-center justify-center py-12 text-center">
+                      <div className="w-16 h-16 bg-gray-100 dark:bg-gray-700 rounded-full flex items-center justify-center mb-4">
+                        <Users className="h-8 w-8 text-gray-400" />
+                      </div>
+                      <h3 className="text-lg font-medium text-gray-900 dark:text-gray-100">
+                        {t("tenantResources.selectTenantFirst") ||
+                          "Please select a tenant"}
+                      </h3>
+                      <p className="text-gray-500 dark:text-gray-400 max-w-sm">
+                        {t("tenantResources.selectTenantDescription") ||
+                          "Choose a tenant from the list to manage its users, groups, models, and knowledge base."}
+                      </p>
+                    </div>
+                  )}
                 </div>
-              )}
-            </div>
 
-            {tenantId ? (
-              <Tabs
-                defaultActiveKey="users"
-                className="h-full flex flex-col"
-                items={[
-                  {
-                    key: "users",
-                    label: t("tenantResources.tabs.users") || "Users",
-                    children: (
-                      <UserList
-                        tenantId={tenantId}
-                        refreshKey={userListRefreshKey}
-                      />
-                    ),
-                  },
-                  {
-                    key: "groups",
-                    label: t("tenantResources.tabs.groups") || "Groups",
-                    children: <GroupList tenantId={tenantId} />,
-                  },
-                  {
-                    key: "models",
-                    label: t("tenantResources.tabs.models") || "Models",
-                    children: <ModelList tenantId={tenantId} />,
-                  },
-                  {
-                    key: "knowledge",
-                    label:
-                      t("tenantResources.tabs.knowledge") || "Knowledge Base",
-                    children: <KnowledgeList tenantId={tenantId} />,
-                  },
-                  {
-                    key: "agents",
-                    label: t("tenantResources.tabs.agents") || "Agents",
-                    children: <AgentList tenantId={tenantId} />,
-                  },
-                  {
-                    key: "mcp",
-                    label: t("tenantResources.tabs.mcp") || "MCP",
-                    children: <McpList tenantId={tenantId} />,
-                  },
-                  {
-                    key: "skills",
-                    label: "Skills",
-                    children: <SkillList tenantId={tenantId} />,
-                  },
-                  {
-                    key: "invitations",
-                    label: t("tenantResources.invitation.tab") || "Invitations",
-                    children: (
-                      <InvitationList
-                        tenantId={tenantId}
-                        refreshKey={invitationListRefreshKey}
-                      />
-                    ),
-                  },
-                ]}
-              />
-            ) : (
-              <div className="flex flex-col items-center justify-center py-12 text-center">
-                <div className="w-16 h-16 bg-gray-100 dark:bg-gray-700 rounded-full flex items-center justify-center mb-4">
-                  <Users className="h-8 w-8 text-gray-400" />
-                </div>
-                <h3 className="text-lg font-medium text-gray-900 dark:text-gray-100">
-                  {t("tenantResources.selectTenantFirst") ||
-                    "Please select a tenant"}
-                </h3>
-                <p className="text-gray-500 dark:text-gray-400 max-w-sm">
-                  {t("tenantResources.selectTenantDescription") ||
-                    "Choose a tenant from the list to manage its users, groups, models, and knowledge base."}
-                </p>
               </div>
-            )}
-          </div>
-        </Col>
-      </Row>
+            </div>
+          </Col>
+        </div>
+      </div>
     </div>
   );
 }
+
+<style jsx global>{`
+  .tenant-resource-tabs .ant-tabs-content {
+    width: 100%;
+    max-width: 100%;
+    overflow: hidden;
+  }
+  .tenant-resource-tabs .ant-tabs-tabpane {
+    max-width: 100%;
+    overflow: hidden;
+  }
+`}</style>
diff --git a/frontend/app/[locale]/tenant-resources/components/resources/AgentList.tsx b/frontend/app/[locale]/tenant-resources/components/resources/AgentList.tsx
index 41fbf4c93..2e2383ad5 100644
--- a/frontend/app/[locale]/tenant-resources/components/resources/AgentList.tsx
+++ b/frontend/app/[locale]/tenant-resources/components/resources/AgentList.tsx
@@ -411,20 +411,19 @@ export default function AgentList({ tenantId }: { tenantId: string | null }) {
   ];
 
   return (
-    <div className="h-full flex flex-col overflow-hidden">
-      <div className="space-y-6 flex-1 overflow-auto">
-        <div className="min-w-0">
-          <Table
-            columns={columns}
-            dataSource={agents as AgentListRow[]}
-            rowKey="id"
-            loading={isLoading}
-            size="small"
-            pagination={{ pageSize: 10 }}
-            locale={{ emptyText: t("space.noAgents") }}
-            scroll={{ x: true }}
-          />
-        </div>
+    <div className="flex flex-col h-full overflow-hidden">
+      <div className="flex-1 overflow-hidden">
+        <Table
+          columns={columns}
+          dataSource={agents as AgentListRow[]}
+          rowKey="id"
+          loading={isLoading}
+          size="small"
+          pagination={{ pageSize: 10 }}
+          locale={{ emptyText: t("space.noAgents") }}
+          scroll={{ y: "calc(100vh - 480px)" }}
+          className="[&_.ant-table]:h-full"
+        />
       </div>
 
       {/* View Modal */}
diff --git a/frontend/app/[locale]/tenant-resources/components/resources/GroupList.tsx b/frontend/app/[locale]/tenant-resources/components/resources/GroupList.tsx
index ec3397219..32af131db 100644
--- a/frontend/app/[locale]/tenant-resources/components/resources/GroupList.tsx
+++ b/frontend/app/[locale]/tenant-resources/components/resources/GroupList.tsx
@@ -12,9 +12,9 @@ import {
   Popconfirm,
   message,
   Select,
+  Tooltip
 } from "antd";
 import { Edit, Trash2 } from "lucide-react";
-import { Tooltip } from "@/components/ui/tooltip";
 import { ColumnsType } from "antd/es/table";
 import { useGroupList } from "@/hooks/group/useGroupList";
 import { useUserList } from "@/hooks/user/useUserList";
@@ -278,7 +278,7 @@ export default function GroupList({ tenantId }: { tenantId: string | null }) {
   };
 
   return (
-    <div className="h-full flex flex-col overflow-hidden">
+    <div className="h-full w-full flex flex-col overflow-auto">
       <div className="flex items-center justify-between mb-4 flex-shrink-0">
         <div />
         <div>
diff --git a/frontend/app/[locale]/tenant-resources/components/resources/InvitationList.tsx b/frontend/app/[locale]/tenant-resources/components/resources/InvitationList.tsx
index 688fda8b1..6365ab68a 100644
--- a/frontend/app/[locale]/tenant-resources/components/resources/InvitationList.tsx
+++ b/frontend/app/[locale]/tenant-resources/components/resources/InvitationList.tsx
@@ -17,6 +17,7 @@ import {
   Collapse,
   DatePicker,
   Progress,
+  Tooltip 
 } from "antd";
 import { ColumnsType } from "antd/es/table";
 import { useInvitationList } from "@/hooks/invitation/useInvitationList";
@@ -41,7 +42,6 @@ import {
   Copy,
   CircleSlash,
 } from "lucide-react";
-import { Tooltip } from "@/components/ui/tooltip";
 import { formatDate } from "@/lib/date";
 import { useAuthorizationContext } from "@/components/providers/AuthorizationProvider";
 import {
@@ -443,7 +443,7 @@ export default function InvitationList({
   }, [invitations, tenantId]);
 
   return (
-    <div className="h-full flex flex-col overflow-hidden">
+    <div className="flex flex-col h-full overflow-hidden">
       <div className="mb-4 flex justify-between items-center flex-shrink-0">
         <div />
         <div>
@@ -465,8 +465,8 @@ export default function InvitationList({
           loading={isLoading}
           rowKey="invitation_id"
           pagination={{ pageSize: 10 }}
-          scroll={{ x: 1000 }}
-          className="flex-1"
+          scroll={{ y: "calc(100vh - 560px)" }}
+          className="flex-1 [&_.ant-table]:h-full"
         />
       ) : (
         // Multi-tenant view with collapse
diff --git a/frontend/app/[locale]/tenant-resources/components/resources/KnowledgeList.tsx b/frontend/app/[locale]/tenant-resources/components/resources/KnowledgeList.tsx
index 18d70ad51..7b1a703b1 100644
--- a/frontend/app/[locale]/tenant-resources/components/resources/KnowledgeList.tsx
+++ b/frontend/app/[locale]/tenant-resources/components/resources/KnowledgeList.tsx
@@ -2,11 +2,10 @@
 
 import React, { useMemo, useState } from "react";
 import { useTranslation } from "react-i18next";
-import { Table, Popconfirm, message, Button, Modal, Tag } from "antd";
+import { Table, Popconfirm, message, Button, Modal, Tag, Tooltip } from "antd";
 import { ColumnsType } from "antd/es/table";
 import { Edit, Trash2, BookOpen } from "lucide-react";
-import { Tooltip } from "@/components/ui/tooltip";
-import { MarkdownRenderer } from "@/components/ui/markdownRenderer";
+import { MarkdownRenderer } from "@/components/common/markdownRenderer";
 import { useKnowledgeList } from "@/hooks/knowledge/useKnowledgeList";
 import { useGroupList } from "@/hooks/group/useGroupList";
 import knowledgeBaseService from "@/services/knowledgeBaseService";
@@ -255,15 +254,15 @@ export default function KnowledgeList({
   ];
 
   return (
-    <div className="h-full flex flex-col overflow-hidden">
+    <div className="flex flex-col h-full overflow-hidden">
       <Table
         columns={columns}
         dataSource={knowledgeBases}
         loading={isLoading}
         rowKey="id"
         pagination={{ pageSize: 10 }}
-        scroll={{ x: 1400 }}
-        className="flex-1"
+        className="flex-1 [&_.ant-table]:h-full"
+        scroll={{ y: "calc(100vh - 510px)" }}
       />
 
       {/* Edit Knowledge Base Modal */}
diff --git a/frontend/app/[locale]/tenant-resources/components/resources/McpList.tsx b/frontend/app/[locale]/tenant-resources/components/resources/McpList.tsx
index ba2d20c0d..412ff402f 100644
--- a/frontend/app/[locale]/tenant-resources/components/resources/McpList.tsx
+++ b/frontend/app/[locale]/tenant-resources/components/resources/McpList.tsx
@@ -114,6 +114,7 @@ export default function McpList({ tenantId }: { tenantId: string | null }) {
   const [openApiJson, setOpenApiJson] = useState("");
   const [openApiServiceName, setOpenApiServiceName] = useState("");
   const [openApiServerUrl, setOpenApiServerUrl] = useState("");
+  const [openApiHeadersTemplate, setOpenApiHeadersTemplate] = useState("");
   const [importingOpenApi, setImportingOpenApi] = useState(false);
   const [openapiServices, setOpenapiServices] = useState<any[]>([]);
   const [loadingOpenapiServices, setLoadingOpenapiServices] = useState(false);
@@ -445,6 +446,7 @@ export default function McpList({ tenantId }: { tenantId: string | null }) {
           service_name: openApiServiceName.trim(),
           server_url: openApiServerUrl.trim(),
           openapi_json: parsedJson,
+          headers_template: openApiHeadersTemplate.trim() ? JSON.parse(openApiHeadersTemplate.trim()) : null,
         }),
       });
 
@@ -453,6 +455,7 @@ export default function McpList({ tenantId }: { tenantId: string | null }) {
         setOpenApiJson("");
         setOpenApiServiceName("");
         setOpenApiServerUrl("");
+        setOpenApiHeadersTemplate("");
         await loadOpenapiServices();
       } else {
         const errorData = await response.json();
@@ -757,7 +760,7 @@ export default function McpList({ tenantId }: { tenantId: string | null }) {
   ];
 
   return (
-    <div className="h-full flex flex-col overflow-hidden">
+    <div className="flex flex-col h-full overflow-hidden">
       <div className="flex justify-between items-center mb-4 flex-shrink-0">
         <div />
         <Button type="primary" icon={<Plus size={16} />} onClick={() => setAddModalVisible(true)}>
@@ -765,47 +768,45 @@ export default function McpList({ tenantId }: { tenantId: string | null }) {
         </Button>
       </div>
 
-      <div className="space-y-6 flex-1 overflow-auto">
-        <div className="min-w-0">
-          <Title level={5} style={{ marginBottom: 12 }}>{t("mcpConfig.serverList.title")}</Title>
-          <Table
-            columns={serverColumns}
-            dataSource={serverList}
-            rowKey={(record) => `${record.service_name}-${record.mcp_url}`}
-            loading={loading}
-            size="small"
-            pagination={{ pageSize: 7 }}
-            locale={{ emptyText: t("mcpConfig.serverList.empty") }}
-          />
-        </div>
+      <div className="flex-1 overflow-hidden">
+        <Title level={5} style={{ marginBottom: 12 }}>{t("mcpConfig.serverList.title")}</Title>
+        <Table
+          columns={serverColumns}
+          dataSource={serverList}
+          rowKey={(record) => `${record.service_name}-${record.mcp_url}`}
+          loading={loading}
+          size="small"
+          pagination={{ pageSize: 7 }}
+          locale={{ emptyText: t("mcpConfig.serverList.empty") }}
+          scroll={{ y: "calc(100vh - 560px)" }}
+          className="flex-1 [&_.ant-table]:h-full"
+        />
 
-        <div className="min-w-0">
-          <Title level={5} style={{ marginBottom: 12 }}>{t("mcpConfig.containerList.title")}</Title>
-          <Table
-            columns={containerColumns}
-            dataSource={containerList}
-            rowKey="container_id"
-            loading={loading}
-            size="small"
-            pagination={{ pageSize: 3 }}
-            locale={{ emptyText: t("mcpConfig.containerList.empty") }}
-            scroll={{ x: true }}
-          />
-        </div>
+        <Title level={5} style={{ marginTop: 24, marginBottom: 12 }}>{t("mcpConfig.containerList.title")}</Title>
+        <Table
+          columns={containerColumns}
+          dataSource={containerList}
+          rowKey="container_id"
+          loading={loading}
+          size="small"
+          pagination={{ pageSize: 3 }}
+          locale={{ emptyText: t("mcpConfig.containerList.empty") }}
+          scroll={{ y: 200 }}
+          className="[&_.ant-table]:h-full"
+        />
 
-        <div className="min-w-0">
-          <Title level={5} style={{ marginBottom: 12 }}>{t("mcpConfig.openapiService.list.title")}</Title>
-          <Table
-            columns={openapiServicesColumns}
-            dataSource={openapiServices}
-            rowKey="id"
-            loading={loadingOpenapiServices}
-            size="small"
-            pagination={{ pageSize: 5 }}
-            locale={{ emptyText: t("mcpConfig.openapiService.list.empty") }}
-            scroll={{ x: true }}
-          />
-        </div>
+        <Title level={5} style={{ marginTop: 24, marginBottom: 12 }}>{t("mcpConfig.openapiService.list.title")}</Title>
+        <Table
+          columns={openapiServicesColumns}
+          dataSource={openapiServices}
+          rowKey="id"
+          loading={loadingOpenapiServices}
+          size="small"
+          pagination={{ pageSize: 5 }}
+          locale={{ emptyText: t("mcpConfig.openapiService.list.empty") }}
+          scroll={{ y: 250 }}
+          className="[&_.ant-table]:h-full"
+        />
       </div>
 
       {/* Add Modal */}
@@ -1035,13 +1036,22 @@ export default function McpList({ tenantId }: { tenantId: string | null }) {
                         style={{ flex: 3 }}
                       />
                     </div>
-                    <Input.TextArea
-                      placeholder={t("mcpConfig.openApiToMcp.jsonPlaceholder")}
-                      value={openApiJson}
-                      onChange={(e) => setOpenApiJson(e.target.value)}
-                      rows={6}
-                      disabled={actionsLocked || importingOpenApi}
-                    />
+                    <div className="space-y-2">
+                      <Input.TextArea
+                        placeholder={t("mcpConfig.addServer.customHeadersPlaceholder")}
+                        value={openApiHeadersTemplate}
+                        onChange={(e) => setOpenApiHeadersTemplate(e.target.value)}
+                        rows={2}
+                        disabled={actionsLocked || importingOpenApi}
+                      />
+                      <Input.TextArea
+                        placeholder={t("mcpConfig.openApiToMcp.jsonPlaceholder")}
+                        value={openApiJson}
+                        onChange={(e) => setOpenApiJson(e.target.value)}
+                        rows={6}
+                        disabled={actionsLocked || importingOpenApi}
+                      />
+                    </div>
                     <div className="flex justify-end">
                       <Button
                         type="primary"
diff --git a/frontend/app/[locale]/tenant-resources/components/resources/ModelList.tsx b/frontend/app/[locale]/tenant-resources/components/resources/ModelList.tsx
index 560df8cb8..6715852f7 100644
--- a/frontend/app/[locale]/tenant-resources/components/resources/ModelList.tsx
+++ b/frontend/app/[locale]/tenant-resources/components/resources/ModelList.tsx
@@ -2,9 +2,8 @@
 
 import React, { useState, useMemo } from "react";
 import { useTranslation } from "react-i18next";
-import { Table, Button, Popconfirm, message, Tag, Segmented } from "antd";
+import { Table, Button, Popconfirm, message, Tag, Segmented, Tooltip } from "antd";
 import { Edit, Trash2, RefreshCw } from "lucide-react";
-import { Tooltip } from "@/components/ui/tooltip";
 import { ColumnsType } from "antd/es/table";
 import type { TablePaginationConfig } from "antd";
 import { FilterValue, SorterResult } from "antd/es/table/interface";
@@ -361,7 +360,7 @@ export default function ModelList({ tenantId }: { tenantId: string | null }) {
   ];
 
   return (
-    <div className="h-full flex flex-col overflow-auto">
+    <div className="flex flex-col h-full overflow-hidden">
       <div className="flex items-center justify-between mb-4 flex-shrink-0">
         <div className="flex items-center gap-3">
           <Segmented
@@ -398,8 +397,8 @@ export default function ModelList({ tenantId }: { tenantId: string | null }) {
           total: total,
         }}
         onChange={handlePageChange}
-        scroll={{ x: true }}
-        className="flex-1"
+        scroll={{ y: "calc(100vh - 580px)" }}
+        className="flex-1 [&_.ant-table]:h-full"
       />
 
       <ModelAddDialog
diff --git a/frontend/app/[locale]/tenant-resources/components/resources/SkillList.tsx b/frontend/app/[locale]/tenant-resources/components/resources/SkillList.tsx
index 04d45720d..c25f89b57 100644
--- a/frontend/app/[locale]/tenant-resources/components/resources/SkillList.tsx
+++ b/frontend/app/[locale]/tenant-resources/components/resources/SkillList.tsx
@@ -13,10 +13,10 @@ import {
   Form,
   Switch,
   InputNumber,
+  Tooltip
 } from "antd";
 import { ColumnsType } from "antd/es/table";
 import { Download } from "lucide-react";
-import { Tooltip } from "@/components/ui/tooltip";
 
 import {
   fetchSkillsList,
@@ -547,7 +547,6 @@ export default function SkillList({ tenantId }: { tenantId: string | null }) {
   const { t } = useTranslation("common");
   const { message } = App.useApp();
   const [form] = Form.useForm();
-
   const [paramsModalOpen, setParamsModalOpen] = useState(false);
   const [editingSkill, setEditingSkill] = useState<SkillListItem | null>(null);
   const [savingParams, setSavingParams] = useState(false);
@@ -730,8 +729,8 @@ export default function SkillList({ tenantId }: { tenantId: string | null }) {
     : "closed";
 
   return (
-    <div className="h-full flex flex-col overflow-hidden">
-      <div className="flex justify-end mb-2">
+    <div className="flex flex-col h-full overflow-hidden">
+      <div className="flex justify-end mb-2 flex-shrink-0">
         <Button
           type="primary"
           icon={<Download className="h-4 w-4" />}
@@ -748,7 +747,8 @@ export default function SkillList({ tenantId }: { tenantId: string | null }) {
         size="small"
         pagination={{ pageSize: 10 }}
         locale={{ emptyText: t("tenantResources.skills.empty") }}
-        scroll={{ x: true }}
+        scroll={{ y: "calc(100vh - 500px)" }}
+        className="flex-1 [&_.ant-table]:h-full"
       />
 
       <Modal
diff --git a/frontend/app/[locale]/tenant-resources/components/resources/UserList.tsx b/frontend/app/[locale]/tenant-resources/components/resources/UserList.tsx
index 64f4e6760..13d54ee5c 100644
--- a/frontend/app/[locale]/tenant-resources/components/resources/UserList.tsx
+++ b/frontend/app/[locale]/tenant-resources/components/resources/UserList.tsx
@@ -12,9 +12,9 @@ import {
   Popconfirm,
   message,
   Tag,
+  Tooltip 
 } from "antd";
 import { Edit, Trash2 } from "lucide-react";
-import { Tooltip } from "@/components/ui/tooltip";
 import { ColumnsType } from "antd/es/table";
 import { useUserList } from "@/hooks/user/useUserList";
 import { useGroupList } from "@/hooks/group/useGroupList";
@@ -141,6 +141,7 @@ export default function UserList({ tenantId, refreshKey }: { tenantId: string |
         title: t("common.email"),
         dataIndex: "username",
         key: "username",
+        width: "50%"
       },
       {
         title: t("common.type"),
@@ -164,6 +165,7 @@ export default function UserList({ tenantId, refreshKey }: { tenantId: string |
               {roleLabels[role] || role}
             </Tag>;
         },
+        width: "20%"
       },
       {
         title: t("common.actions"),
@@ -197,6 +199,7 @@ export default function UserList({ tenantId, refreshKey }: { tenantId: string |
             </Popconfirm>
           </div>
         ),
+        width: "20%"
       },
     ],
     []
@@ -207,7 +210,7 @@ export default function UserList({ tenantId, refreshKey }: { tenantId: string |
   };
 
   return (
-    <div className="h-full flex flex-col overflow-hidden">
+    <div className="flex flex-col h-full overflow-hidden">
       <Table
         dataSource={users}
         columns={columns}
@@ -219,10 +222,9 @@ export default function UserList({ tenantId, refreshKey }: { tenantId: string |
           total: total,
           onChange: handlePageChange,
         }}
-        scroll={{ x: true }}
-        className="flex-1"
+        className="flex-1 [&_.ant-table]:h-full"
+        scroll={{ y: "calc(100vh - 480px)" }}
       />
-
       <Modal
         title={t("tenantResources.users.editUser")}
         open={modalVisible}
diff --git a/frontend/app/[locale]/users/components/UserProfileComp.tsx b/frontend/app/[locale]/users/components/UserProfileComp.tsx
index 67b34d250..41cfeb0a0 100644
--- a/frontend/app/[locale]/users/components/UserProfileComp.tsx
+++ b/frontend/app/[locale]/users/components/UserProfileComp.tsx
@@ -39,6 +39,7 @@ import { OAuthAccountsSection } from "@/components/settings/OAuthAccountsSection
 import log from "@/lib/logger";
 import { authService } from "@/services/authService";
 import { getPasswordChecks, getStrengthLevel } from "@/lib/utils";
+import { useConfirmModal } from "@/hooks/useConfirmModal";
 import {
   getUserTokens,
   deleteUserToken,
@@ -61,6 +62,7 @@ export default function UserProfileComp() {
   const { message: antdMessage } = App.useApp();
   const { logout, revoke, isLoading } = useAuthenticationContext();
   const { user, groupIds } = useAuthorizationContext();
+  const { confirm } = useConfirmModal();
 
   // Fetch groups for group name mapping
   const { data: groupData } = useGroupList(user?.tenantId || null);
@@ -107,6 +109,7 @@ export default function UserProfileComp() {
   // Check if user is admin or super admin (cannot delete account)
   const isAdminOrSuperAdmin =
     user?.role === USER_ROLES.ADMIN || user?.role === USER_ROLES.SU;
+  const isCasUser = user?.authProvider === "cas";
   const getRoleDisplayName = (role: string) => {
     switch (role) {
       case USER_ROLES.SPEED:
@@ -125,17 +128,20 @@ export default function UserProfileComp() {
   };
 
   // Handle logout
-  const handleLogout = async () => {
-    try {
-      await logout();
-      window.location.href = "/";
-    } catch (error) {
-      antdMessage.error(t("auth.logoutFailed"));
-    }
+  const handleLogout = () => {
+    confirm({
+      title: t("auth.confirmLogout"),
+      content: t("auth.confirmLogoutPrompt"),
+      onOk: () => {
+        logout();
+      },
+    });
   };
 
   // Handle delete account
   const handleDeleteAccount = async () => {
+    if (isAdminOrSuperAdmin || isCasUser) return;
+
     try {
       await revoke();
       antdMessage.success(t("auth.revokeSuccess"));
@@ -469,8 +475,16 @@ export default function UserProfileComp() {
                 </div>
 
                 <button
-                  onClick={() => setIsDeleteModalOpen(true)}
-                  className="w-full px-6 py-3 flex items-center justify-between hover:bg-red-50 dark:hover:bg-red-900/20 transition-colors text-left"
+                  disabled={isCasUser}
+                  onClick={() => {
+                    if (isCasUser) return;
+                    setIsDeleteModalOpen(true);
+                  }}
+                  className={`w-full px-6 py-3 flex items-center justify-between transition-colors text-left ${
+                    isCasUser
+                      ? "cursor-not-allowed opacity-50"
+                      : "hover:bg-red-50 dark:hover:bg-red-900/20"
+                  }`}
                 >
                   <div className="flex items-center gap-3">
                     <div className="w-8 h-8 rounded-lg bg-red-50 dark:bg-red-900/20 flex items-center justify-center">
@@ -695,7 +709,7 @@ export default function UserProfileComp() {
         onOk={handleDeleteAccount}
         onCancel={() => setIsDeleteModalOpen(false)}
         loading={isLoading}
-        disabled={isAdminOrSuperAdmin}
+        disabled={isAdminOrSuperAdmin || isCasUser}
       />
 
       {/* OAuth Linked Accounts */}
diff --git a/frontend/components/agent/AgentImportWizard.tsx b/frontend/components/agent/AgentImportWizard.tsx
index 5ccf79033..504237c1c 100644
--- a/frontend/components/agent/AgentImportWizard.tsx
+++ b/frontend/components/agent/AgentImportWizard.tsx
@@ -393,7 +393,6 @@ export default function AgentImportWizard({
         items: agentsWithConflicts.map(([agentKey, conflict]) => {
           const agentInfo = initialData.agent_info[agentKey] as any;
           return {
-            agent_id: agentInfo?.agent_id,
             name: conflict.renamedName || agentInfo?.name || "",
             display_name: conflict.renamedDisplayName || agentInfo?.display_name || "",
             task_description: agentInfo?.business_description || agentInfo?.description || "",
diff --git a/frontend/components/auth/avatarDropdown.tsx b/frontend/components/auth/avatarDropdown.tsx
index e77f5f1e2..f52f59119 100644
--- a/frontend/components/auth/avatarDropdown.tsx
+++ b/frontend/components/auth/avatarDropdown.tsx
@@ -3,7 +3,14 @@
 import React, { useState } from "react";
 import { useTranslation } from "react-i18next";
 import { Dropdown, Avatar, Spin, Button, Tag, ConfigProvider } from "antd";
-import { UserRound, LogOut, LogIn, UserRoundPlus, UserCircle, Power } from "lucide-react";
+import {
+  UserRound,
+  LogOut,
+  LogIn,
+  UserRoundPlus,
+  UserCircle,
+  Power,
+} from "lucide-react";
 import type { ItemType } from "antd/es/menu/interface";
 import Link from "next/link";
 
@@ -106,6 +113,8 @@ export function AvatarDropdown() {
     );
   }
 
+  const isCasUser = user.authProvider === "cas";
+
   // User has logged in, show user menu
   const menuItems: ItemType[] = [
     {
@@ -159,8 +168,12 @@ export function AvatarDropdown() {
       icon: <Power size={16} />,
       label: t("auth.revoke"),
       // danger: true,
-      className: "hover:!bg-red-100 focus:!bg-red-400 focus:!text-white",
+      disabled: isCasUser,
+      className: isCasUser
+        ? "cursor-not-allowed opacity-50"
+        : "hover:!bg-red-100 focus:!bg-red-400 focus:!text-white",
       onClick: () => {
+        if (isCasUser) return;
         setIsDeleteModalOpen(true);
       },
     },
@@ -195,7 +208,11 @@ export function AvatarDropdown() {
         }}
         onCancel={() => setIsDeleteModalOpen(false)}
         loading={isLoading}
-        disabled={user.role === USER_ROLES.ADMIN || user.role === USER_ROLES.SU}
+        disabled={
+          isCasUser ||
+          user.role === USER_ROLES.ADMIN ||
+          user.role === USER_ROLES.SU
+        }
       />
     </ConfigProvider>
   );
diff --git a/frontend/components/auth/loginModal.tsx b/frontend/components/auth/loginModal.tsx
index 3a4b94a90..7425c3ff8 100644
--- a/frontend/components/auth/loginModal.tsx
+++ b/frontend/components/auth/loginModal.tsx
@@ -3,13 +3,14 @@
 import { useCallback, useState, useEffect } from "react";
 import { useTranslation } from "react-i18next";
 import { Modal, Form, Input, Button, Typography, Space, Divider, Alert } from "antd";
-import { UserRound, LockKeyhole, Github, Link2 } from "lucide-react";
+import { UserRound, LockKeyhole, Github, Link2, KeyRound } from "lucide-react";
 import { usePathname, useRouter, useSearchParams } from "next/navigation";
 
 import { useAuthenticationContext } from "@/components/providers/AuthenticationProvider";
 import { useDeployment } from "@/components/providers/deploymentProvider";
 import { getEffectiveRoutePath } from "@/lib/auth";
 import { oauthService } from "@/services/oauthService";
+import { casService, CasConfig } from "@/services/casService";
 import log from "@/lib/logger";
 
 const { Text } = Typography;
@@ -48,6 +49,30 @@ function OAuthLoginButtons() {
   );
 }
 
+function CasLoginButton() {
+  const { t } = useTranslation("common");
+  const [config, setConfig] = useState<CasConfig | null>(null);
+
+  useEffect(() => {
+    casService.getConfig().then(setConfig);
+  }, []);
+
+  if (!config?.enabled || config.login_mode !== "button") return null;
+
+  return (
+    <div className="mt-2 mb-2">
+      <Button
+        block
+        size="large"
+        icon={<KeyRound size={18} />}
+        onClick={() => casService.startLogin()}
+      >
+        {t("auth.casLogin", { provider: config.display_name }) || `${config.display_name} Login`}
+      </Button>
+    </div>
+  );
+}
+
 /**
  * LoginModal Component
  * Handles user authentication through a modal interface
@@ -95,6 +120,15 @@ export function LoginModal() {
     }
   }, [searchParams, router, getOAuthLoginErrorMessage]);
 
+  useEffect(() => {
+    if (!isLoginModalOpen || isAuthenticated || isSpeedMode) return;
+    casService.getConfig().then((config) => {
+      if (config.enabled && config.login_mode === "force") {
+        casService.startLogin();
+      }
+    });
+  }, [isLoginModalOpen, isAuthenticated, isSpeedMode]);
+
   const resetForm = () => {
     setEmailError("");
     setPasswordError(false);
@@ -308,6 +342,8 @@ export function LoginModal() {
             </Button>
           </Form.Item>
 
+          <CasLoginButton />
+
           {/* OAuth login section */}
           <OAuthLoginButtons />
 
diff --git a/frontend/components/ui/Diagram.tsx b/frontend/components/common/Diagram.tsx
similarity index 100%
rename from frontend/components/ui/Diagram.tsx
rename to frontend/components/common/Diagram.tsx
diff --git a/frontend/components/ui/PdfViewer.tsx b/frontend/components/common/PdfViewer.tsx
similarity index 100%
rename from frontend/components/ui/PdfViewer.tsx
rename to frontend/components/common/PdfViewer.tsx
diff --git a/frontend/components/ui/copyButton.tsx b/frontend/components/common/copyButton.tsx
similarity index 100%
rename from frontend/components/ui/copyButton.tsx
rename to frontend/components/common/copyButton.tsx
diff --git a/frontend/components/ui/filePreviewDrawer.tsx b/frontend/components/common/filePreviewDrawer.tsx
similarity index 50%
rename from frontend/components/ui/filePreviewDrawer.tsx
rename to frontend/components/common/filePreviewDrawer.tsx
index 7f7f08c4a..409352e15 100644
--- a/frontend/components/ui/filePreviewDrawer.tsx
+++ b/frontend/components/common/filePreviewDrawer.tsx
@@ -1,12 +1,28 @@
 "use client";
 
-import { useState, useEffect, useCallback, useMemo, useRef, type PointerEvent as ReactPointerEvent, type WheelEvent as ReactWheelEvent } from 'react';
-import { useTranslation } from 'react-i18next';
-import dynamic from 'next/dynamic';
-import { Drawer, Spin, Button, Table } from 'antd';
-import { Download, Maximize2, Minimize2, Minus, Plus, RotateCw, X } from 'lucide-react';
-import { FilePreviewProps } from '@/types/chat';
-import { DetectedFileType, ImageBaseMode } from '@/types/file';
+import {
+  useState,
+  useEffect,
+  useCallback,
+  useMemo,
+  useRef,
+  type PointerEvent as ReactPointerEvent,
+  type WheelEvent as ReactWheelEvent,
+} from "react";
+import { useTranslation } from "react-i18next";
+import dynamic from "next/dynamic";
+import { Drawer, Modal, Spin, Button, Table } from "antd";
+import {
+  Download,
+  Maximize2,
+  Minimize2,
+  Minus,
+  Plus,
+  RotateCw,
+  X,
+} from "lucide-react";
+import { FilePreviewProps } from "@/types/chat";
+import { DetectedFileType, ImageBaseMode } from "@/types/file";
 import {
   CHUNK_SIZE,
   TEXT_RENDER_BLOCK_SIZE,
@@ -26,40 +42,63 @@ import {
   clamp,
   ignoreAbortError,
   getPageWrapperStyle,
-} from '@/lib/filePreviewUtils';
-import { storageService } from '@/services/storageService';
-import { MarkdownRenderer, extractMarkdownHeadings, type MarkdownHeading } from '@/components/ui/markdownRenderer';
-import { formatFileSize } from '@/lib/utils';
-import log from '@/lib/logger';
-
-const PdfViewer = dynamic(() => import('@/components/ui/PdfViewer').then(mod => ({ default: mod.PdfViewer })), {
-  ssr: false,
-  loading: () => (
-    <div className="flex items-center justify-center h-full">
-      <Spin size="large" />
-    </div>
-  ),
-});
+  fetchPreviewBlob,
+  PreviewAccessError,
+  getPreviewAccessReasonFromStatus,
+  type PreviewAccessReason,
+} from "@/lib/filePreviewUtils";
+import { storageService } from "@/services/storageService";
+import {
+  MarkdownRenderer,
+  extractMarkdownHeadings,
+  type MarkdownHeading,
+} from "@/components/common/markdownRenderer";
+import { formatFileSize } from "@/lib/utils";
+import log from "@/lib/logger";
+
+const PdfViewer = dynamic(
+  () =>
+    import("@/components/common/PdfViewer").then((mod) => ({
+      default: mod.PdfViewer,
+    })),
+  {
+    ssr: false,
+    loading: () => (
+      <div className="flex items-center justify-center h-full">
+        <Spin size="large" />
+      </div>
+    ),
+  }
+);
 
 export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
-  const { open, onClose } = props;
-  const { t } = useTranslation('common');
-  const isLocalSource = props.source === 'local';
+  const { open, onClose, previewContext } = props;
+  const { t } = useTranslation("common");
+  const isLocalSource = props.source === "local";
   const localFile = isLocalSource ? props.file : null;
-  const objectName = !isLocalSource ? props.objectName : '';
-  const fileName = isLocalSource && localFile
-    ? localFile.name
-    : ('fileName' in props ? props.fileName : '');
-  const providedFileType = isLocalSource && localFile
-    ? localFile.type
-    : ('fileType' in props ? props.fileType : undefined);
-  const fileSize = isLocalSource && localFile
-    ? localFile.size
-    : ('fileSize' in props ? props.fileSize : undefined);
+  const objectName = !isLocalSource ? props.objectName : "";
+  const fileName =
+    isLocalSource && localFile
+      ? localFile.name
+      : "fileName" in props
+        ? props.fileName
+        : "";
+  const providedFileType =
+    isLocalSource && localFile
+      ? localFile.type
+      : "fileType" in props
+        ? props.fileType
+        : undefined;
+  const fileSize =
+    isLocalSource && localFile
+      ? localFile.size
+      : "fileSize" in props
+        ? props.fileSize
+        : undefined;
   const [loading, setLoading] = useState(true);
   const [error, setError] = useState<string | null>(null);
-  const [textContent, setTextContent] = useState<string>('');
-  const [previewUrl, setPreviewUrl] = useState<string>('');
+  const [textContent, setTextContent] = useState<string>("");
+  const [previewUrl, setPreviewUrl] = useState<string>("");
   const [loadingMore, setLoadingMore] = useState(false);
   const [showMarkdownToc, setShowMarkdownToc] = useState(false);
 
@@ -73,9 +112,15 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
   const [imageScale, setImageScale] = useState(1);
   const [imageRotation, setImageRotation] = useState(0);
   const [imageLoadError, setImageLoadError] = useState(false);
-  const [imageNaturalSize, setImageNaturalSize] = useState({ width: 0, height: 0 });
-  const [imageViewportSize, setImageViewportSize] = useState({ width: 0, height: 0 });
-  const [imageBaseMode, setImageBaseMode] = useState<ImageBaseMode>('fit');
+  const [imageNaturalSize, setImageNaturalSize] = useState({
+    width: 0,
+    height: 0,
+  });
+  const [imageViewportSize, setImageViewportSize] = useState({
+    width: 0,
+    height: 0,
+  });
+  const [imageBaseMode, setImageBaseMode] = useState<ImageBaseMode>("fit");
   const imageViewportResizeObserverRef = useRef<ResizeObserver | null>(null);
   const [imagePan, setImagePan] = useState({ x: 0, y: 0 });
   const [isImageDragging, setIsImageDragging] = useState(false);
@@ -101,9 +146,9 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
 
   const byteOffsetRef = useRef(0);
   const totalBytesRef = useRef<number | null>(null);
-  const remainderRef = useRef('');
+  const remainderRef = useRef("");
   const isFetchingRef = useRef(false);
-  const previewUrlRef = useRef('');
+  const previewUrlRef = useRef("");
   const textDecoderRef = useRef<TextDecoder | null>(null);
   const decoderEncodingRef = useRef<string | null>(null);
   const decoderHasExplicitCharsetRef = useRef(false);
@@ -111,71 +156,99 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
   const observerRef = useRef<IntersectionObserver | null>(null);
   const markdownContainerRef = useRef<HTMLDivElement | null>(null);
   const textFetchSessionRef = useRef(0);
-  const csvDelimiterRef = useRef<string>(',');
+  const csvDelimiterRef = useRef<string>(",");
+
+  const handleKnowledgePreviewAccessError = useCallback(
+    (reason: PreviewAccessReason) => {
+      if (previewContext !== "knowledgeBase") {
+        return false;
+      }
+      const key =
+        reason === "forbidden"
+          ? "filePreview.knowledge.accessDenied"
+          : "filePreview.knowledge.noStoredCopy";
+      Modal.info({
+        title: t(`${key}.title`),
+        content: t(`${key}.content`),
+        okText: t("common.confirm"),
+        centered: true,
+      });
+      onClose();
+      return true;
+    },
+    [previewContext, t, onClose]
+  );
 
   const resetTextPreviewState = useCallback(() => {
-    setTextContent('');
+    setTextContent("");
     setTxtLines([]);
     setCsvRows([]);
     setLoadingMore(false);
 
     byteOffsetRef.current = 0;
     totalBytesRef.current = null;
-    remainderRef.current = '';
+    remainderRef.current = "";
     isFetchingRef.current = false;
     textDecoderRef.current = null;
     decoderEncodingRef.current = null;
     decoderHasExplicitCharsetRef.current = false;
     decoderAllowGbFallbackRef.current = false;
-    csvDelimiterRef.current = ',';
+    csvDelimiterRef.current = ",";
 
     observerRef.current?.disconnect();
     observerRef.current = null;
   }, []);
 
   const getDetectedFileType = useCallback((): DetectedFileType => {
-    const mime = providedFileType?.toLowerCase() || '';
-
-    if (mime === 'application/pdf') return 'pdf';
-    
-    if (mime === 'application/msword' || 
-        mime === 'application/vnd.openxmlformats-officedocument.wordprocessingml.document' ||
-        mime === 'application/vnd.ms-excel' || 
-        mime === 'application/vnd.openxmlformats-officedocument.spreadsheetml.sheet' ||
-        mime === 'application/vnd.ms-powerpoint' || 
-        mime === 'application/vnd.openxmlformats-officedocument.presentationml.presentation') {
-      return isLocalSource ? 'office' : 'pdf';
+    const mime = providedFileType?.toLowerCase() || "";
+
+    if (mime === "application/pdf") return "pdf";
+
+    if (
+      mime === "application/msword" ||
+      mime ===
+        "application/vnd.openxmlformats-officedocument.wordprocessingml.document" ||
+      mime === "application/vnd.ms-excel" ||
+      mime ===
+        "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" ||
+      mime === "application/vnd.ms-powerpoint" ||
+      mime ===
+        "application/vnd.openxmlformats-officedocument.presentationml.presentation"
+    ) {
+      return isLocalSource ? "office" : "pdf";
     }
-    
-    if (mime.startsWith('image/')) return 'image';
-    
-    if (mime === 'text/markdown') return 'markdown';
 
-    if (mime === 'text/csv') return 'csv';
+    if (mime.startsWith("image/")) return "image";
 
-    if (mime === 'text/html') return 'html';
+    if (mime === "text/markdown") return "markdown";
 
-    if (mime === 'text/plain') return 'text';
+    if (mime === "text/csv") return "csv";
 
-    const extension = fileName.split('.').pop()?.toLowerCase() || '';
-    
-    if (extension === 'pdf') return 'pdf';
-    if (['doc', 'docx', 'xls', 'xlsx', 'ppt', 'pptx'].includes(extension)) {
-      return isLocalSource ? 'office' : 'pdf';
-    }
-    if (['jpg', 'jpeg', 'png', 'gif', 'webp', 'svg', 'bmp'].includes(extension)) return 'image';
-    if (['md', 'markdown'].includes(extension)) return 'markdown';
-    if (extension === 'csv') return 'csv';
-    if (['html', 'htm'].includes(extension)) return 'html';
-    if (['txt', 'log', 'json', 'xml', 'yaml', 'yml'].includes(extension)) return 'text';
+    if (mime === "text/html") return "html";
+
+    if (mime === "text/plain") return "text";
 
-    return 'unknown';
+    const extension = fileName.split(".").pop()?.toLowerCase() || "";
+
+    if (extension === "pdf") return "pdf";
+    if (["doc", "docx", "xls", "xlsx", "ppt", "pptx"].includes(extension)) {
+      return isLocalSource ? "office" : "pdf";
+    }
+    if (["jpg", "jpeg", "png", "gif", "webp", "svg", "bmp"].includes(extension))
+      return "image";
+    if (["md", "markdown"].includes(extension)) return "markdown";
+    if (extension === "csv") return "csv";
+    if (["html", "htm"].includes(extension)) return "html";
+    if (["txt", "log", "json", "xml", "yaml", "yml"].includes(extension))
+      return "text";
+
+    return "unknown";
   }, [providedFileType, fileName, isLocalSource]);
 
   const detectedFileType = getDetectedFileType();
 
   const markdownHeadings = useMemo<MarkdownHeading[]>(() => {
-    if (detectedFileType !== 'markdown' || !textContent) {
+    if (detectedFileType !== "markdown" || !textContent) {
       return [];
     }
     return extractMarkdownHeadings(textContent);
@@ -188,16 +261,21 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
     }
     return blocks;
   }, [txtLines]);
-  
+
   const isEmptyFile = fileSize === 0;
   const isTooLargeToPreview = !!(fileSize && fileSize > 100 * 1024 * 1024);
 
   const normalizedImageRotation = ((imageRotation % 360) + 360) % 360;
   const imageFitScale = useMemo(
-    () => computeRotateFitScale(normalizedImageRotation, imageNaturalSize, imageViewportSize),
-    [imageNaturalSize, imageViewportSize, normalizedImageRotation],
+    () =>
+      computeRotateFitScale(
+        normalizedImageRotation,
+        imageNaturalSize,
+        imageViewportSize
+      ),
+    [imageNaturalSize, imageViewportSize, normalizedImageRotation]
   );
-  const imageBaseScale = imageBaseMode === 'fit' ? imageFitScale : 1;
+  const imageBaseScale = imageBaseMode === "fit" ? imageFitScale : 1;
   const effectiveImageScale = imageScale * imageBaseScale;
   const imageScaleMin = imageBaseScale > 0 ? 0.25 / imageBaseScale : 0.25;
   const imageScaleMax = imageBaseScale > 0 ? 6 / imageBaseScale : 6;
@@ -207,26 +285,38 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
     if (naturalWidth <= 0 || naturalHeight <= 0) {
       return { width: 0, height: 0 };
     }
-    const isQuarterTurn = normalizedImageRotation === 90 || normalizedImageRotation === 270;
-    const displayWidth = (isQuarterTurn ? naturalHeight : naturalWidth) * effectiveImageScale;
-    const displayHeight = (isQuarterTurn ? naturalWidth : naturalHeight) * effectiveImageScale;
+    const isQuarterTurn =
+      normalizedImageRotation === 90 || normalizedImageRotation === 270;
+    const displayWidth =
+      (isQuarterTurn ? naturalHeight : naturalWidth) * effectiveImageScale;
+    const displayHeight =
+      (isQuarterTurn ? naturalWidth : naturalHeight) * effectiveImageScale;
     return { width: displayWidth, height: displayHeight };
   }, [imageNaturalSize, normalizedImageRotation, effectiveImageScale]);
 
-  const clampImagePan = useCallback((pan: { x: number; y: number }) => {
-    const { width: viewportWidth, height: viewportHeight } = imageViewportSize;
-    const { width: displayWidth, height: displayHeight } = imageDisplaySize;
-    if (viewportWidth <= 0 || viewportHeight <= 0 || displayWidth <= 0 || displayHeight <= 0) {
-      return { x: 0, y: 0 };
-    }
+  const clampImagePan = useCallback(
+    (pan: { x: number; y: number }) => {
+      const { width: viewportWidth, height: viewportHeight } =
+        imageViewportSize;
+      const { width: displayWidth, height: displayHeight } = imageDisplaySize;
+      if (
+        viewportWidth <= 0 ||
+        viewportHeight <= 0 ||
+        displayWidth <= 0 ||
+        displayHeight <= 0
+      ) {
+        return { x: 0, y: 0 };
+      }
 
-    const maxPanX = Math.max(0, (displayWidth - viewportWidth) / 2);
-    const maxPanY = Math.max(0, (displayHeight - viewportHeight) / 2);
-    return {
-      x: clamp(pan.x, -maxPanX, maxPanX),
-      y: clamp(pan.y, -maxPanY, maxPanY),
-    };
-  }, [imageDisplaySize, imageViewportSize]);
+      const maxPanX = Math.max(0, (displayWidth - viewportWidth) / 2);
+      const maxPanY = Math.max(0, (displayHeight - viewportHeight) / 2);
+      return {
+        x: clamp(pan.x, -maxPanX, maxPanX),
+        y: clamp(pan.y, -maxPanY, maxPanY),
+      };
+    },
+    [imageDisplaySize, imageViewportSize]
+  );
 
   useEffect(() => {
     imagePanRef.current = imagePan;
@@ -241,13 +331,21 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
     if (imageNaturalSize.width === 0 || imageNaturalSize.height === 0) return;
     if (imageViewportSize.width === 0 || imageViewportSize.height === 0) return;
     const normalizedRotation = ((imageRotation % 360) + 360) % 360;
-    const isQuarterTurn = normalizedRotation === 90 || normalizedRotation === 270;
-    const rotatedWidth = isQuarterTurn ? imageNaturalSize.height : imageNaturalSize.width;
-    const rotatedHeight = isQuarterTurn ? imageNaturalSize.width : imageNaturalSize.height;
-    if (rotatedWidth > imageViewportSize.width || rotatedHeight > imageViewportSize.height) {
-      setImageBaseMode('fit');
+    const isQuarterTurn =
+      normalizedRotation === 90 || normalizedRotation === 270;
+    const rotatedWidth = isQuarterTurn
+      ? imageNaturalSize.height
+      : imageNaturalSize.width;
+    const rotatedHeight = isQuarterTurn
+      ? imageNaturalSize.width
+      : imageNaturalSize.height;
+    if (
+      rotatedWidth > imageViewportSize.width ||
+      rotatedHeight > imageViewportSize.height
+    ) {
+      setImageBaseMode("fit");
     } else {
-      setImageBaseMode('actual');
+      setImageBaseMode("actual");
     }
   }, [open, imageNaturalSize, imageViewportSize, imageRotation]);
 
@@ -277,109 +375,128 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
     setIsImageDragging(false);
   }, []);
 
-  const applyImageScale = useCallback((nextScale: number, anchorX = 0, anchorY = 0) => {
-    const currentScale = imageScaleRef.current;
-    if (nextScale === currentScale) {
-      return;
-    }
-    const scaleRatio = nextScale / currentScale;
-    const currentPan = imagePanRef.current;
-    const nextPan = clampImagePan({
-      x: anchorX - scaleRatio * (anchorX - currentPan.x),
-      y: anchorY - scaleRatio * (anchorY - currentPan.y),
-    });
-    imagePanRef.current = nextPan;
-    setImagePan(nextPan);
-    imageScaleRef.current = nextScale;
-    setImageScale(nextScale);
-  }, [clampImagePan]);
+  const applyImageScale = useCallback(
+    (nextScale: number, anchorX = 0, anchorY = 0) => {
+      const currentScale = imageScaleRef.current;
+      if (nextScale === currentScale) {
+        return;
+      }
+      const scaleRatio = nextScale / currentScale;
+      const currentPan = imagePanRef.current;
+      const nextPan = clampImagePan({
+        x: anchorX - scaleRatio * (anchorX - currentPan.x),
+        y: anchorY - scaleRatio * (anchorY - currentPan.y),
+      });
+      imagePanRef.current = nextPan;
+      setImagePan(nextPan);
+      imageScaleRef.current = nextScale;
+      setImageScale(nextScale);
+    },
+    [clampImagePan]
+  );
 
-  const handleImageWheel = useCallback((event: ReactWheelEvent<HTMLDivElement>) => {
-    if (imageLoadError) {
-      return;
-    }
+  const handleImageWheel = useCallback(
+    (event: ReactWheelEvent<HTMLDivElement>) => {
+      if (imageLoadError) {
+        return;
+      }
 
-    event.preventDefault();
+      event.preventDefault();
 
-    const currentScale = imageScaleRef.current;
-    const zoomFactor = Math.exp(-event.deltaY * 0.0015);
-    const nextScale = clamp(currentScale * zoomFactor, imageScaleMin, imageScaleMax);
-    if (nextScale === currentScale) {
-      return;
-    }
+      const currentScale = imageScaleRef.current;
+      const zoomFactor = Math.exp(-event.deltaY * 0.0015);
+      const nextScale = clamp(
+        currentScale * zoomFactor,
+        imageScaleMin,
+        imageScaleMax
+      );
+      if (nextScale === currentScale) {
+        return;
+      }
 
-    const rect = event.currentTarget.getBoundingClientRect();
-    const cursorX = event.clientX - rect.left - rect.width / 2;
-    const cursorY = event.clientY - rect.top - rect.height / 2;
-    applyImageScale(nextScale, cursorX, cursorY);
-  }, [applyImageScale, imageLoadError, imageScaleMin, imageScaleMax]);
+      const rect = event.currentTarget.getBoundingClientRect();
+      const cursorX = event.clientX - rect.left - rect.width / 2;
+      const cursorY = event.clientY - rect.top - rect.height / 2;
+      applyImageScale(nextScale, cursorX, cursorY);
+    },
+    [applyImageScale, imageLoadError, imageScaleMin, imageScaleMax]
+  );
 
-  const handleImagePointerDown = useCallback((event: ReactPointerEvent<HTMLDivElement>) => {
-    if (imageLoadError || event.button !== 0) {
-      return;
-    }
+  const handleImagePointerDown = useCallback(
+    (event: ReactPointerEvent<HTMLDivElement>) => {
+      if (imageLoadError || event.button !== 0) {
+        return;
+      }
 
-    event.preventDefault();
-    event.currentTarget.setPointerCapture(event.pointerId);
-    setIsImageDragging(true);
-    dragStateRef.current = {
-      isDragging: true,
-      pointerId: event.pointerId,
-      startX: event.clientX,
-      startY: event.clientY,
-      startPanX: imagePanRef.current.x,
-      startPanY: imagePanRef.current.y,
-    };
-  }, [imageLoadError]);
+      event.preventDefault();
+      event.currentTarget.setPointerCapture(event.pointerId);
+      setIsImageDragging(true);
+      dragStateRef.current = {
+        isDragging: true,
+        pointerId: event.pointerId,
+        startX: event.clientX,
+        startY: event.clientY,
+        startPanX: imagePanRef.current.x,
+        startPanY: imagePanRef.current.y,
+      };
+    },
+    [imageLoadError]
+  );
 
-  const handleImagePointerMove = useCallback((event: ReactPointerEvent<HTMLDivElement>) => {
-    const dragState = dragStateRef.current;
-    if (!dragState.isDragging || dragState.pointerId !== event.pointerId) {
-      return;
-    }
+  const handleImagePointerMove = useCallback(
+    (event: ReactPointerEvent<HTMLDivElement>) => {
+      const dragState = dragStateRef.current;
+      if (!dragState.isDragging || dragState.pointerId !== event.pointerId) {
+        return;
+      }
 
-    event.preventDefault();
-    const nextPan = {
-      x: dragState.startPanX + (event.clientX - dragState.startX),
-      y: dragState.startPanY + (event.clientY - dragState.startY),
-    };
-    const clamped = clampImagePan(nextPan);
-    imagePanRef.current = clamped;
-    setImagePan(clamped);
-  }, [clampImagePan]);
+      event.preventDefault();
+      const nextPan = {
+        x: dragState.startPanX + (event.clientX - dragState.startX),
+        y: dragState.startPanY + (event.clientY - dragState.startY),
+      };
+      const clamped = clampImagePan(nextPan);
+      imagePanRef.current = clamped;
+      setImagePan(clamped);
+    },
+    [clampImagePan]
+  );
 
-  const handleImagePointerEnd = useCallback((event: ReactPointerEvent<HTMLDivElement>) => {
-    const dragState = dragStateRef.current;
-    if (dragState.pointerId !== event.pointerId) {
-      return;
-    }
+  const handleImagePointerEnd = useCallback(
+    (event: ReactPointerEvent<HTMLDivElement>) => {
+      const dragState = dragStateRef.current;
+      if (dragState.pointerId !== event.pointerId) {
+        return;
+      }
 
-    dragStateRef.current = {
-      isDragging: false,
-      pointerId: null,
-      startX: 0,
-      startY: 0,
-      startPanX: 0,
-      startPanY: 0,
-    };
-    setIsImageDragging(false);
-  }, []);
+      dragStateRef.current = {
+        isDragging: false,
+        pointerId: null,
+        startX: 0,
+        startY: 0,
+        startPanX: 0,
+        startPanY: 0,
+      };
+      setIsImageDragging(false);
+    },
+    []
+  );
 
   const handleImageDoubleClick = useCallback(() => {
-    if (imageScale !== 1 || imageBaseMode !== 'fit') {
-      setImageBaseMode('fit');
+    if (imageScale !== 1 || imageBaseMode !== "fit") {
+      setImageBaseMode("fit");
       setImageScale(1);
       imageScaleRef.current = 1;
     } else {
-      setImageBaseMode('actual');
+      setImageBaseMode("actual");
     }
   }, [imageBaseMode, imageScale]);
 
   const toggleImageBaseMode = useCallback(() => {
-    if (imageBaseMode === 'fit') {
-      setImageBaseMode('actual');
+    if (imageBaseMode === "fit") {
+      setImageBaseMode("actual");
     } else {
-      setImageBaseMode('fit');
+      setImageBaseMode("fit");
     }
     setImageScale(1);
     imageScaleRef.current = 1;
@@ -390,118 +507,178 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
     const clamped = clampImagePan(imagePanRef.current);
     imagePanRef.current = clamped;
     setImagePan(clamped);
-  }, [clampImagePan, effectiveImageScale, normalizedImageRotation, imageViewportSize]);
-
-  const fetchTextChunk = useCallback(async (url: string, isFirst = false, sessionId?: number): Promise<void> => {
-    const activeSessionId = sessionId ?? textFetchSessionRef.current;
-    if (!url) {
-      if (isFirst) setLoading(false);
-      else setLoadingMore(false);
-      return;
-    }
-    if (isFetchingRef.current) return;
-    if (totalBytesRef.current !== null && byteOffsetRef.current >= totalBytesRef.current) return;
-
-    isFetchingRef.current = true;
-    if (!isFirst) setLoadingMore(true);
-
-    try {
-      const start = byteOffsetRef.current;
-      const end   = start + CHUNK_SIZE - 1;
-      const resp = await fetch(url, {
-        headers: { Range: `bytes=${start}-${end}` },
-        cache: 'no-store',
-      });
-      if (shouldStopFetchingChunk(activeSessionId, textFetchSessionRef.current)) return;
-      if (handlePreviewChunkBoundaryResponse(
-        resp.status,
-        isFirst,
-        setServerTooLarge,
-        setLoading,
-        setLoadingMore,
-        observerRef,
-        isFetchingRef,
-      )) {
+  }, [
+    clampImagePan,
+    effectiveImageScale,
+    normalizedImageRotation,
+    imageViewportSize,
+  ]);
+
+  const fetchTextChunk = useCallback(
+    async (
+      url: string,
+      isFirst = false,
+      sessionId?: number,
+      signal?: AbortSignal
+    ): Promise<void> => {
+      const activeSessionId = sessionId ?? textFetchSessionRef.current;
+      if (!url) {
+        if (isFirst) setLoading(false);
+        else setLoadingMore(false);
         return;
       }
-      if (!resp.ok && resp.status !== 206) throw new Error(`HTTP ${resp.status}`);
-
-      const contentRange = resp.headers.get('Content-Range');
-      const buf = await resp.arrayBuffer();
-      if (shouldStopFetchingChunk(activeSessionId, textFetchSessionRef.current)) return;
-      const hasMore = updateChunkRangeState(contentRange, buf.byteLength, byteOffsetRef, totalBytesRef);
-      ensurePreviewTextDecoder(
-        resp.headers.get('Content-Type'),
-        textDecoderRef,
-        decoderEncodingRef,
-        decoderHasExplicitCharsetRef,
-        decoderAllowGbFallbackRef,
-      );
-      const raw = decodePreviewChunk(
-        buf,
-        hasMore,
-        textDecoderRef,
-        decoderEncodingRef,
-        decoderAllowGbFallbackRef,
-      );
-      const { remainder, safeText } = splitPreviewSafeText(
-        raw,
-        remainderRef.current,
-        hasMore,
-        detectedFileType,
-      );
-      if (shouldStopFetchingChunk(activeSessionId, textFetchSessionRef.current)) return;
-      remainderRef.current = remainder;
-      appendTextPreviewContent({
-        detectedFileType,
-        safeText,
-        byteOffset: byteOffsetRef.current,
-        currentChunkLength: buf.byteLength,
-        csvDelimiterRef,
-        setTxtLines,
-        setCsvRows,
-        setTextContent,
-      });
-      if (!hasMore) observerRef.current?.disconnect();
-    } finally {
-      if (shouldStopFetchingChunk(activeSessionId, textFetchSessionRef.current)) {
+      if (isFetchingRef.current) return;
+      if (
+        totalBytesRef.current !== null &&
+        byteOffsetRef.current >= totalBytesRef.current
+      )
         return;
-      }
-      isFetchingRef.current = false;
-      if (isFirst) setLoading(false);
-      else setLoadingMore(false);
-    }
-  }, [detectedFileType]);
 
-  const setupSentinelObserver = useCallback((node: HTMLDivElement | null) => {
-    observerRef.current?.disconnect();
-    observerRef.current = null;
-    if (!isValidContainerElement(node)) return;
-    const observer = new IntersectionObserver(entries => {
-      if (entries[0].isIntersecting) {
-        if (!isLocalSource && previewUrlRef.current && (totalBytesRef.current === null || byteOffsetRef.current < totalBytesRef.current)) {
-          fetchTextChunk(previewUrlRef.current).catch(err =>
-            log.error('Failed to fetch next text chunk:', err)
-          );
+      isFetchingRef.current = true;
+      if (!isFirst) setLoadingMore(true);
+
+      try {
+        const start = byteOffsetRef.current;
+        const end = start + CHUNK_SIZE - 1;
+        const resp = await fetch(url, {
+          headers: { Range: `bytes=${start}-${end}` },
+          cache: "no-store",
+          credentials: "include",
+          signal,
+        });
+        if (
+          shouldStopFetchingChunk(activeSessionId, textFetchSessionRef.current)
+        )
+          return;
+        if (
+          handlePreviewChunkBoundaryResponse(
+            resp.status,
+            isFirst,
+            setServerTooLarge,
+            setLoading,
+            setLoadingMore,
+            observerRef,
+            isFetchingRef
+          )
+        ) {
+          return;
+        }
+        const accessReason = getPreviewAccessReasonFromStatus(resp.status);
+        if (accessReason) {
+          if (handleKnowledgePreviewAccessError(accessReason)) {
+            return;
+          }
+          throw new Error(`HTTP ${resp.status}`);
+        }
+        if (!resp.ok && resp.status !== 206)
+          throw new Error(`HTTP ${resp.status}`);
+
+        const contentRange = resp.headers.get("Content-Range");
+        const buf = await resp.arrayBuffer();
+        if (
+          shouldStopFetchingChunk(activeSessionId, textFetchSessionRef.current)
+        )
+          return;
+        const hasMore = updateChunkRangeState(
+          contentRange,
+          buf.byteLength,
+          byteOffsetRef,
+          totalBytesRef
+        );
+        ensurePreviewTextDecoder(
+          resp.headers.get("Content-Type"),
+          textDecoderRef,
+          decoderEncodingRef,
+          decoderHasExplicitCharsetRef,
+          decoderAllowGbFallbackRef
+        );
+        const raw = decodePreviewChunk(
+          buf,
+          hasMore,
+          textDecoderRef,
+          decoderEncodingRef,
+          decoderAllowGbFallbackRef
+        );
+        const { remainder, safeText } = splitPreviewSafeText(
+          raw,
+          remainderRef.current,
+          hasMore,
+          detectedFileType
+        );
+        if (
+          shouldStopFetchingChunk(activeSessionId, textFetchSessionRef.current)
+        )
+          return;
+        remainderRef.current = remainder;
+        appendTextPreviewContent({
+          detectedFileType,
+          safeText,
+          byteOffset: byteOffsetRef.current,
+          currentChunkLength: buf.byteLength,
+          csvDelimiterRef,
+          setTxtLines,
+          setCsvRows,
+          setTextContent,
+        });
+        if (!hasMore) observerRef.current?.disconnect();
+      } finally {
+        if (
+          shouldStopFetchingChunk(activeSessionId, textFetchSessionRef.current)
+        ) {
+          return;
         }
+        isFetchingRef.current = false;
+        if (isFirst) setLoading(false);
+        else setLoadingMore(false);
       }
-    }, { threshold: 0.1 });
-    observer.observe(node);
-    observerRef.current = observer;
-  }, [fetchTextChunk, isLocalSource]);
+    },
+    [detectedFileType, handleKnowledgePreviewAccessError]
+  );
+
+  const setupSentinelObserver = useCallback(
+    (node: HTMLDivElement | null) => {
+      observerRef.current?.disconnect();
+      observerRef.current = null;
+      if (!isValidContainerElement(node)) return;
+      const observer = new IntersectionObserver(
+        (entries) => {
+          if (entries[0].isIntersecting) {
+            if (
+              !isLocalSource &&
+              previewUrlRef.current &&
+              (totalBytesRef.current === null ||
+                byteOffsetRef.current < totalBytesRef.current)
+            ) {
+              fetchTextChunk(previewUrlRef.current).catch((err) =>
+                log.error("Failed to fetch next text chunk:", err)
+              );
+            }
+          }
+        },
+        { threshold: 0.1 }
+      );
+      observer.observe(node);
+      observerRef.current = observer;
+    },
+    [fetchTextChunk, isLocalSource]
+  );
 
   useEffect(() => {
     if (!open || (!isLocalSource && !objectName)) {
       return;
     }
 
+    let cancelled = false;
+    const abortController = new AbortController();
+    const { signal } = abortController;
+
     const loadPreview = async () => {
       setLoading(true);
       setError(null);
 
       try {
         if (isEmptyFile) {
-          setPreviewUrl('');
+          setPreviewUrl("");
           setLoading(false);
           return;
         }
@@ -511,17 +688,20 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
         if (isLocalSource && localFile) {
           resetTextPreviewState();
           const previousPreviewUrl = previewUrlRef.current;
-          if (previousPreviewUrl.startsWith('blob:')) {
+          if (previousPreviewUrl.startsWith("blob:")) {
             URL.revokeObjectURL(previousPreviewUrl);
           }
-          previewUrlRef.current = '';
+          previewUrlRef.current = "";
 
-          if (isTooLargeToPreview && ['text', 'markdown', 'csv', 'html'].includes(detectedFileType)) {
+          if (
+            isTooLargeToPreview &&
+            ["text", "markdown", "csv", "html"].includes(detectedFileType)
+          ) {
             setLoading(false);
             return;
           }
-          
-          if (detectedFileType === 'image' || detectedFileType === 'pdf') {
+
+          if (detectedFileType === "image" || detectedFileType === "pdf") {
             localPreviewUrl = URL.createObjectURL(localFile);
             setPreviewUrl(localPreviewUrl);
             previewUrlRef.current = localPreviewUrl;
@@ -529,10 +709,10 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
             return;
           }
 
-          if (detectedFileType === 'text') {
+          if (detectedFileType === "text") {
             const text = await decodeLocalTextFile(localFile);
-            const newLines = text.split('\n');
-            if (newLines.at(-1) === '') {
+            const newLines = text.split("\n");
+            if (newLines.at(-1) === "") {
               newLines.pop();
             }
             setTxtLines(newLines);
@@ -540,24 +720,26 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
             return;
           }
 
-          if (detectedFileType === 'markdown') {
+          if (detectedFileType === "markdown") {
             setTextContent(await decodeLocalTextFile(localFile));
             setLoading(false);
             return;
           }
 
-          if (detectedFileType === 'html') {
+          if (detectedFileType === "html") {
             const html = await decodeLocalTextFile(localFile);
             setTextContent(html);
             setLoading(false);
             return;
           }
 
-          if (detectedFileType === 'csv') {
+          if (detectedFileType === "csv") {
             const text = await decodeLocalTextFile(localFile);
             const delimiter = detectCsvDelimiter(text);
             csvDelimiterRef.current = delimiter;
-            const newLines = text.split('\n').filter(line => line.trim().length > 0);
+            const newLines = text
+              .split("\n")
+              .filter((line) => line.trim().length > 0);
             setCsvRows(newLines.map((line) => parseCsvLine(line, delimiter)));
             setLoading(false);
             return;
@@ -569,34 +751,87 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
 
         const url = storageService.getPreviewUrl(objectName, fileName);
 
-          if (['markdown', 'csv', 'text', 'html'].includes(detectedFileType)) {
-            textFetchSessionRef.current += 1;
-            const sessionId = textFetchSessionRef.current;
-            resetTextPreviewState();
-            setPreviewUrl(url);
-            previewUrlRef.current = url;
-            await fetchTextChunk(url, true, sessionId);
+        if (["markdown", "csv", "text", "html"].includes(detectedFileType)) {
+          if (cancelled) return;
+          textFetchSessionRef.current += 1;
+          const sessionId = textFetchSessionRef.current;
+          resetTextPreviewState();
+          setPreviewUrl(url);
+          previewUrlRef.current = url;
+          await fetchTextChunk(url, true, sessionId, signal);
+          return;
+        }
+
+        if (detectedFileType === "pdf" || detectedFileType === "image") {
+          if (cancelled) return;
+          if (isTooLargeToPreview) {
+            setLoading(false);
             return;
           }
+          const previousPreviewUrl = previewUrlRef.current;
+          if (previousPreviewUrl.startsWith("blob:")) {
+            URL.revokeObjectURL(previousPreviewUrl);
+          }
+          previewUrlRef.current = "";
+
+          const blob = await fetchPreviewBlob(url, signal);
+          if (cancelled) return;
+
+          const blobUrl = URL.createObjectURL(blob);
+          previewUrlRef.current = blobUrl;
+          setPreviewUrl(blobUrl);
+          setLoading(false);
+          return;
+        }
 
         setPreviewUrl(url);
         previewUrlRef.current = url;
-
         setLoading(false);
       } catch (err) {
-        log.error('Failed to load preview:', err);
-        setError(err instanceof Error ? err.message : t('filePreview.previewFailed'));
+        if (ignoreAbortError(err) || cancelled) {
+          return;
+        }
+        if (
+          err instanceof PreviewAccessError &&
+          handleKnowledgePreviewAccessError(err.reason)
+        ) {
+          setLoading(false);
+          return;
+        }
+        log.error("Failed to load preview:", err);
+        setError(
+          err instanceof Error ? err.message : t("filePreview.previewFailed")
+        );
         setLoading(false);
       }
     };
 
     void loadPreview();
-  }, [open, objectName, fileName, detectedFileType, t, fetchTextChunk, resetTextPreviewState, isEmptyFile, isLocalSource, localFile]);
+
+    return () => {
+      cancelled = true;
+      abortController.abort();
+      textFetchSessionRef.current += 1;
+    };
+  }, [
+    open,
+    objectName,
+    fileName,
+    detectedFileType,
+    t,
+    fetchTextChunk,
+    resetTextPreviewState,
+    isEmptyFile,
+    isLocalSource,
+    localFile,
+    handleKnowledgePreviewAccessError,
+    isTooLargeToPreview,
+  ]);
 
   useEffect(() => {
     return () => {
       const currentPreviewUrl = previewUrlRef.current;
-      if (currentPreviewUrl.startsWith('blob:')) {
+      if (currentPreviewUrl.startsWith("blob:")) {
         URL.revokeObjectURL(currentPreviewUrl);
       }
     };
@@ -610,13 +845,13 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
       setImageRotation(0);
       setImageNaturalSize({ width: 0, height: 0 });
       setImageViewportSize({ width: 0, height: 0 });
-      setImageBaseMode('fit');
+      setImageBaseMode("fit");
       handleImagePanReset();
-      setTextContent('');
+      setTextContent("");
       setTxtLines([]);
       setCsvRows([]);
       setCsvTableHeight(400);
-      setPreviewUrl('');
+      setPreviewUrl("");
       setError(null);
       setImageLoadError(false);
       setLoadingMore(false);
@@ -624,7 +859,7 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
       textFetchSessionRef.current += 1;
       byteOffsetRef.current = 0;
       totalBytesRef.current = null;
-      remainderRef.current = '';
+      remainderRef.current = "";
       isFetchingRef.current = false;
       textDecoderRef.current = null;
       decoderEncodingRef.current = null;
@@ -634,10 +869,10 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
       observerRef.current = null;
       imageViewportResizeObserverRef.current?.disconnect();
       imageViewportResizeObserverRef.current = null;
-      if (previousPreviewUrl.startsWith('blob:')) {
+      if (previousPreviewUrl.startsWith("blob:")) {
         URL.revokeObjectURL(previousPreviewUrl);
       }
-      previewUrlRef.current = '';
+      previewUrlRef.current = "";
     }
   }, [open]);
 
@@ -652,20 +887,20 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
     if (!open) return;
 
     const handleKeyDown = (e: KeyboardEvent) => {
-      if (e.key === 'Escape') {
+      if (e.key === "Escape") {
         onClose();
       }
     };
 
-    globalThis.addEventListener('keydown', handleKeyDown);
-    return () => globalThis.removeEventListener('keydown', handleKeyDown);
+    globalThis.addEventListener("keydown", handleKeyDown);
+    return () => globalThis.removeEventListener("keydown", handleKeyDown);
   }, [open, onClose]);
 
   const handleDownload = async () => {
     try {
       if (isLocalSource && localFile) {
         const url = URL.createObjectURL(localFile);
-        const link = document.createElement('a');
+        const link = document.createElement("a");
         link.href = url;
         link.download = fileName;
         link.click();
@@ -675,7 +910,7 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
 
       await storageService.downloadFile(objectName, fileName);
     } catch (err) {
-      log.error('Failed to download file:', err);
+      log.error("Failed to download file:", err);
     }
   };
 
@@ -690,19 +925,22 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
 
     if (
       isFetchingRef.current ||
-      (totalBytesRef.current !== null && byteOffsetRef.current >= totalBytesRef.current)
+      (totalBytesRef.current !== null &&
+        byteOffsetRef.current >= totalBytesRef.current)
     ) {
       return;
     }
 
-    fetchTextChunk(previewUrlRef.current).catch(err =>
-      log.error('Failed to fetch next text chunk:', err)
+    fetchTextChunk(previewUrlRef.current).catch((err) =>
+      log.error("Failed to fetch next text chunk:", err)
     );
   }, [fetchTextChunk, isLocalSource]);
 
   const handleMarkdownHeadingClick = useCallback((headingId: string) => {
     const container = markdownContainerRef.current;
-    const target = container?.querySelector<HTMLElement>(`#${CSS.escape(headingId)}`) ?? null;
+    const target =
+      container?.querySelector<HTMLElement>(`#${CSS.escape(headingId)}`) ??
+      null;
 
     if (!container || !target) {
       return;
@@ -710,9 +948,10 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
 
     const containerRect = container.getBoundingClientRect();
     const targetRect = target.getBoundingClientRect();
-    const nextScrollTop = container.scrollTop + targetRect.top - containerRect.top;
+    const nextScrollTop =
+      container.scrollTop + targetRect.top - containerRect.top;
 
-    container.scrollTo({ top: Math.max(nextScrollTop, 0), behavior: 'smooth' });
+    container.scrollTo({ top: Math.max(nextScrollTop, 0), behavior: "smooth" });
 
     if (globalThis.innerWidth < 768) {
       setShowMarkdownToc(false);
@@ -723,7 +962,7 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
     <div className="flex items-center justify-center h-full">
       <div className="text-center">
         <div className="animate-spin rounded-full h-8 w-8 border-b-2 border-blue-500 mx-auto mb-2"></div>
-        <p className="text-sm text-gray-600">{t('filePreview.loading')}</p>
+        <p className="text-sm text-gray-600">{t("filePreview.loading")}</p>
       </div>
     </div>
   );
@@ -731,7 +970,7 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
   const renderCenteredErrorState = () => (
     <div className="flex items-center justify-center h-full">
       <div className="text-center max-w-md px-4">
-        <p className="text-red-500 text-sm">{t('filePreview.previewFailed')}</p>
+        <p className="text-red-500 text-sm">{t("filePreview.previewFailed")}</p>
       </div>
     </div>
   );
@@ -739,10 +978,7 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
   const renderError = () => renderCenteredErrorState();
 
   const renderPdfViewer = () => (
-    <PdfViewer
-      url={previewUrl}
-      fileName={fileName}
-    />
+    <PdfViewer url={previewUrl} fileName={fileName} />
   );
 
   const renderImageViewer = () => (
@@ -765,14 +1001,16 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
             <div
               className="absolute inset-0 flex items-center justify-center"
               style={{
-                perspective: '1000px',
+                perspective: "1000px",
               }}
             >
               <div
                 style={{
                   transform: `translate(${imagePan.x}px, ${imagePan.y}px) scale(${effectiveImageScale}) rotate(${imageRotation}deg)`,
-                  willChange: 'transform',
-                  transition: isImageDragging ? 'none' : 'transform 0.2s ease-in-out',
+                  willChange: "transform",
+                  transition: isImageDragging
+                    ? "none"
+                    : "transform 0.2s ease-in-out",
                 }}
               >
                 <img
@@ -782,7 +1020,10 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
                   draggable={false}
                   onLoad={(e) => {
                     const img = e.currentTarget;
-                    setImageNaturalSize({ width: img.naturalWidth, height: img.naturalHeight });
+                    setImageNaturalSize({
+                      width: img.naturalWidth,
+                      height: img.naturalHeight,
+                    });
                   }}
                   onError={() => setImageLoadError(true)}
                 />
@@ -797,12 +1038,16 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
           <div className="flex items-center gap-1 bg-white/70 backdrop-blur-sm border border-gray-200/60 rounded-full shadow-lg px-3 py-1">
             <button
               onClick={() => {
-                const nextScale = clamp(imageScaleRef.current - 0.25, imageScaleMin, imageScaleMax);
+                const nextScale = clamp(
+                  imageScaleRef.current - 0.25,
+                  imageScaleMin,
+                  imageScaleMax
+                );
                 applyImageScale(nextScale, 0, 0);
               }}
               disabled={effectiveImageScale <= 0.25}
               className="p-1.5 rounded-lg hover:bg-gray-100 transition-colors disabled:opacity-30 text-gray-600"
-              title={t('filePreview.zoomOut')}
+              title={t("filePreview.zoomOut")}
             >
               <Minus size={16} />
             </button>
@@ -813,12 +1058,16 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
 
             <button
               onClick={() => {
-                const nextScale = clamp(imageScaleRef.current + 0.25, imageScaleMin, imageScaleMax);
+                const nextScale = clamp(
+                  imageScaleRef.current + 0.25,
+                  imageScaleMin,
+                  imageScaleMax
+                );
                 applyImageScale(nextScale, 0, 0);
               }}
               disabled={effectiveImageScale >= 6}
               className="p-1.5 rounded-lg hover:bg-gray-100 transition-colors disabled:opacity-30 text-gray-600"
-              title={t('filePreview.zoomIn')}
+              title={t("filePreview.zoomIn")}
             >
               <Plus size={16} />
             </button>
@@ -829,21 +1078,25 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
               onClick={toggleImageBaseMode}
               className="p-1.5 rounded-lg hover:bg-gray-100 transition-colors text-gray-600"
               title={
-                imageBaseMode === 'fit'
-                  ? t('filePreview.image.actualSize')
-                  : t('filePreview.image.fitPage')
+                imageBaseMode === "fit"
+                  ? t("filePreview.image.actualSize")
+                  : t("filePreview.image.fitPage")
               }
             >
-              {imageBaseMode === 'fit' ? <Maximize2 size={16} /> : <Minimize2 size={16} />}
+              {imageBaseMode === "fit" ? (
+                <Maximize2 size={16} />
+              ) : (
+                <Minimize2 size={16} />
+              )}
             </button>
 
             <button
               onClick={() => {
-                setImageRotation(prev => prev + 90);
+                setImageRotation((prev) => prev + 90);
                 handleImagePanReset();
               }}
               className="p-1.5 rounded-lg hover:bg-gray-100 transition-colors text-gray-600"
-              title={t('filePreview.rotate')}
+              title={t("filePreview.rotate")}
             >
               <RotateCw size={16} />
             </button>
@@ -856,10 +1109,12 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
   const renderMarkdownViewer = () => (
     <div className="flex h-full min-h-0 bg-white">
       {markdownHeadings.length > 0 && (
-        <aside className={`${showMarkdownToc ? 'flex' : 'hidden'} md:flex w-64 flex-shrink-0 flex-col border-r border-gray-200 bg-gray-50/70`}>
+        <aside
+          className={`${showMarkdownToc ? "flex" : "hidden"} md:flex w-64 flex-shrink-0 flex-col border-r border-gray-200 bg-gray-50/70`}
+        >
           <div className="flex items-center justify-between border-b border-gray-200 px-3 py-3">
             <span className="text-sm font-medium text-gray-700">
-              {t('filePreview.markdownOutline', { defaultValue: '目录' })}
+              {t("filePreview.markdownOutline", { defaultValue: "目录" })}
             </span>
             <Button
               type="text"
@@ -892,13 +1147,20 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
       <div className="flex min-w-0 flex-1 flex-col">
         {markdownHeadings.length > 0 && (
           <div className="border-b border-gray-200 px-4 py-2 md:hidden">
-            <Button type="default" size="small" onClick={() => setShowMarkdownToc(prev => !prev)}>
-              {t('filePreview.markdownOutline', { defaultValue: '目录' })}
+            <Button
+              type="default"
+              size="small"
+              onClick={() => setShowMarkdownToc((prev) => !prev)}
+            >
+              {t("filePreview.markdownOutline", { defaultValue: "目录" })}
             </Button>
           </div>
         )}
-        <div ref={markdownContainerRef} className="flex-1 overflow-auto px-6 pb-6 pt-0">
-          <MarkdownRenderer 
+        <div
+          ref={markdownContainerRef}
+          className="flex-1 overflow-auto px-6 pb-6 pt-0"
+        >
+          <MarkdownRenderer
             content={textContent}
             enableMultimodal={true}
             resolveS3Media={false}
@@ -922,9 +1184,11 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
           const el = e.currentTarget;
           if (
             !isLocalSource &&
-            el.scrollTop + el.clientHeight >= el.scrollHeight - el.clientHeight * 0.5 &&
+            el.scrollTop + el.clientHeight >=
+              el.scrollHeight - el.clientHeight * 0.5 &&
             !isFetchingRef.current &&
-            (totalBytesRef.current === null || byteOffsetRef.current < totalBytesRef.current)
+            (totalBytesRef.current === null ||
+              byteOffsetRef.current < totalBytesRef.current)
           ) {
             fetchNextTextChunk();
           }
@@ -954,14 +1218,16 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
     const columns = headerRow.map((col, i) => ({
       key: String(i),
       dataIndex: String(i),
-      title: col || `${t('filePreview.csv.column')} ${i + 1}`,
+      title: col || `${t("filePreview.csv.column")} ${i + 1}`,
       ellipsis: true,
       width: 160,
     }));
 
     const dataSource = dataRows.map((row, rowIdx) => {
       const record: Record<string, string> = { _key: String(rowIdx) };
-      headerRow.forEach((_, i) => { record[String(i)] = row[i] ?? ''; });
+      headerRow.forEach((_, i) => {
+        record[String(i)] = row[i] ?? "";
+      });
       return record;
     });
 
@@ -994,12 +1260,14 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
             const el = e.currentTarget as HTMLElement;
             if (
               !isLocalSource &&
-              el.scrollTop + el.clientHeight >= el.scrollHeight - CSV_ROW_HEIGHT * 30 &&
+              el.scrollTop + el.clientHeight >=
+                el.scrollHeight - CSV_ROW_HEIGHT * 30 &&
               !isFetchingRef.current &&
-              (totalBytesRef.current === null || byteOffsetRef.current < totalBytesRef.current)
+              (totalBytesRef.current === null ||
+                byteOffsetRef.current < totalBytesRef.current)
             ) {
-              fetchTextChunk(previewUrlRef.current).catch(err =>
-                log.error('Failed to fetch next CSV chunk:', err)
+              fetchTextChunk(previewUrlRef.current).catch((err) =>
+                log.error("Failed to fetch next CSV chunk:", err)
               );
             }
           }}
@@ -1007,7 +1275,9 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
         {loadingMore && (
           <div className="flex items-center justify-center py-3 border-t border-gray-100">
             <div className="animate-spin rounded-full h-5 w-5 border-b-2 border-blue-500 mr-2" />
-            <span className="text-sm text-gray-500">{t('filePreview.loading')}</span>
+            <span className="text-sm text-gray-500">
+              {t("filePreview.loading")}
+            </span>
           </div>
         )}
         <div ref={setupSentinelObserver} className="h-1" />
@@ -1023,9 +1293,11 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
           const el = e.currentTarget;
           if (
             !isLocalSource &&
-            el.scrollTop + el.clientHeight >= el.scrollHeight - el.clientHeight * 0.5 &&
+            el.scrollTop + el.clientHeight >=
+              el.scrollHeight - el.clientHeight * 0.5 &&
             !isFetchingRef.current &&
-            (totalBytesRef.current === null || byteOffsetRef.current < totalBytesRef.current)
+            (totalBytesRef.current === null ||
+              byteOffsetRef.current < totalBytesRef.current)
           ) {
             fetchNextTextChunk();
           }
@@ -1037,11 +1309,11 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
               key={index}
               className="m-0 whitespace-pre-wrap break-words"
               style={{
-                contentVisibility: 'auto',
+                contentVisibility: "auto",
                 containIntrinsicSize: `${Math.max(block.length, 1) * 24}px`,
               }}
             >
-              {block.join('\n') || '\u00A0'}
+              {block.join("\n") || "\u00A0"}
             </pre>
           ))}
         </div>
@@ -1056,25 +1328,29 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
 
   const renderTooLarge = () => (
     <div className="flex items-center justify-center h-full">
-      <p className="text-gray-500">{t('filePreview.tooLargeToPreview')}</p>
+      <p className="text-gray-500">{t("filePreview.tooLargeToPreview")}</p>
     </div>
   );
 
   const renderEmptyFile = () => (
     <div className="flex items-center justify-center h-full">
-      <p className="text-gray-500 text-sm">{t('filePreview.emptyFile')}</p>
+      <p className="text-gray-500 text-sm">{t("filePreview.emptyFile")}</p>
     </div>
   );
 
   const renderUnsupported = () => (
     <div className="flex items-center justify-center h-full">
-      <p className="text-gray-500 text-sm">{t('filePreview.unsupportedSingleLine')}</p>
+      <p className="text-gray-500 text-sm">
+        {t("filePreview.unsupportedSingleLine")}
+      </p>
     </div>
   );
 
   const renderUploadToPreview = () => (
     <div className="flex items-center justify-center h-full">
-      <p className="text-gray-500 text-sm">{t('filePreview.uploadToPreview')}</p>
+      <p className="text-gray-500 text-sm">
+        {t("filePreview.uploadToPreview")}
+      </p>
     </div>
   );
 
@@ -1085,19 +1361,19 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
     if (error) return renderError();
 
     switch (detectedFileType) {
-      case 'pdf':
+      case "pdf":
         return renderPdfViewer();
-      case 'image':
+      case "image":
         return renderImageViewer();
-      case 'markdown':
+      case "markdown":
         return renderMarkdownViewer();
-      case 'csv':
+      case "csv":
         return renderCsvViewer();
-      case 'text':
+      case "text":
         return renderTextViewer();
-      case 'html':
+      case "html":
         return renderHtmlViewer();
-      case 'office':
+      case "office":
         return renderUploadToPreview();
       default:
         return renderUnsupported();
@@ -1111,8 +1387,14 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
       placement="right"
       size="65%"
       styles={{
-        body: { padding: 0, height: '100%', minHeight: 0, display: 'flex', flexDirection: 'column' },
-        header: { padding: '12px 16px', borderBottom: '1px solid #e5e7eb' },
+        body: {
+          padding: 0,
+          height: "100%",
+          minHeight: 0,
+          display: "flex",
+          flexDirection: "column",
+        },
+        header: { padding: "12px 16px", borderBottom: "1px solid #e5e7eb" },
       }}
       closeIcon={<X size={20} />}
       title={
@@ -1133,14 +1415,12 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
           icon={<Download size={14} />}
           onClick={handleDownload}
         >
-          {t('filePreview.download')}
+          {t("filePreview.download")}
         </Button>
       }
     >
       <div className="flex h-full flex-col">
-        <div className="flex-1 min-h-0 overflow-hidden">
-        {renderContent()}
-        </div>
+        <div className="flex-1 min-h-0 overflow-hidden">{renderContent()}</div>
       </div>
     </Drawer>
   );
diff --git a/frontend/components/ui/markdownRenderer.tsx b/frontend/components/common/markdownRenderer.tsx
similarity index 99%
rename from frontend/components/ui/markdownRenderer.tsx
rename to frontend/components/common/markdownRenderer.tsx
index 53dfb6962..93dbcce11 100644
--- a/frontend/components/ui/markdownRenderer.tsx
+++ b/frontend/components/common/markdownRenderer.tsx
@@ -16,8 +16,8 @@ import { visit } from "unist-util-visit";
 import { SearchResult } from "@/types/chat";
 import { resolveS3UrlToDataUrl } from "@/services/storageService";
 import { Tooltip, TooltipProvider } from "@/components/ui/tooltip";
-import { CopyButton } from "@/components/ui/copyButton";
-import { Diagram } from "@/components/ui/Diagram";
+import { CopyButton } from "@/components/common/copyButton";
+import { Diagram } from "@/components/common/Diagram";
 
 interface MarkdownRendererProps {
   content: string;
diff --git a/frontend/components/ui/tokenUsageIndicator.tsx b/frontend/components/common/tokenUsageIndicator.tsx
similarity index 98%
rename from frontend/components/ui/tokenUsageIndicator.tsx
rename to frontend/components/common/tokenUsageIndicator.tsx
index 826787e2b..adde20fbf 100644
--- a/frontend/components/ui/tokenUsageIndicator.tsx
+++ b/frontend/components/common/tokenUsageIndicator.tsx
@@ -1,8 +1,8 @@
 "use client";
 
 import React from "react";
-import { Tooltip } from "@/components/ui/tooltip";
 import { TokenMetrics } from "@/types/chat";
+import { Tooltip } from "antd"
 
 interface TokenUsageIndicatorProps {
   latestMetrics: TokenMetrics | null;
diff --git a/frontend/components/navigation/SideNavigation.tsx b/frontend/components/navigation/SideNavigation.tsx
index 77b74fee1..dbef5ace0 100644
--- a/frontend/components/navigation/SideNavigation.tsx
+++ b/frontend/components/navigation/SideNavigation.tsx
@@ -27,6 +27,8 @@ import { SIDER_CONFIG } from "@/const/layoutConstants";
 import { AUTH_EVENTS } from "@/const/auth";
 import { getEffectiveRoutePath } from "@/lib/auth";
 import { authEvents } from "@/lib/authEvents";
+import { authFlowState } from "@/lib/authFlow";
+import { casService } from "@/services/casService";
 
 interface SideNavigationProps {
   collapsed?: boolean;
@@ -51,15 +53,50 @@ const ROUTE_CONFIG: RouteConfig[] = [
   { path: "/chat", Icon: Bot, labelKey: "sidebar.startChat", order: 1 },
   { path: "/setup", Icon: Zap, labelKey: "sidebar.quickConfig", order: 2 },
   { path: "/space", Icon: Globe, labelKey: "sidebar.agentSpace", order: 3 },
-  { path: "/market", Icon: ShoppingBag, labelKey: "sidebar.agentMarket", order: 4 },
+  {
+    path: "/market",
+    Icon: ShoppingBag,
+    labelKey: "sidebar.agentMarket",
+    order: 4,
+  },
   { path: "/agents", Icon: Code, labelKey: "sidebar.agentDev", order: 5 },
-  { path: "/knowledges", Icon: BookOpen, labelKey: "sidebar.knowledgeBase", order: 6 },
-  { path: "/mcp-tools", Icon: Puzzle, labelKey: "sidebar.mcpToolsManagement", order: 7 },
-  { path: "/monitoring", Icon: Activity, labelKey: "sidebar.monitoringManagement", order: 8 },
-  { path: "/models", Icon: Settings, labelKey: "sidebar.modelManagement", order: 9 },
-  { path: "/memory", Icon: Database, labelKey: "sidebar.memoryManagement", order: 10 },
+  {
+    path: "/knowledges",
+    Icon: BookOpen,
+    labelKey: "sidebar.knowledgeBase",
+    order: 6,
+  },
+  {
+    path: "/mcp-tools",
+    Icon: Puzzle,
+    labelKey: "sidebar.mcpToolsManagement",
+    order: 7,
+  },
+  {
+    path: "/monitoring",
+    Icon: Activity,
+    labelKey: "sidebar.monitoringManagement",
+    order: 8,
+  },
+  {
+    path: "/models",
+    Icon: Settings,
+    labelKey: "sidebar.modelManagement",
+    order: 9,
+  },
+  {
+    path: "/memory",
+    Icon: Database,
+    labelKey: "sidebar.memoryManagement",
+    order: 10,
+  },
   { path: "/users", Icon: User, labelKey: "sidebar.userManagement", order: 11 },
-  { path: "/tenant-resources", Icon: Building2, labelKey: "sidebar.tenantResources", order: 12 },
+  {
+    path: "/tenant-resources",
+    Icon: Building2,
+    labelKey: "sidebar.tenantResources",
+    order: 12,
+  },
   { path: "/asset-owner-resources", Icon: Building2, labelKey: "sidebar.assetOwnerResources", order: 13 },
 ];
 
@@ -72,9 +109,7 @@ const ROUTE_PATHS = ROUTE_CONFIG.map((route) => route.path);
  * Side navigation component with collapsible menu
  * Displays main navigation items for the application based on user's accessible routes
  */
-export function SideNavigation({
-  collapsed,
-}: SideNavigationProps) {
+export function SideNavigation({ collapsed }: SideNavigationProps) {
   const { t } = useTranslation("common");
   const { accessibleRoutes } = useAuthorizationContext();
   const { isAuthenticated, openAuthPromptModal } = useAuthenticationContext();
@@ -83,7 +118,9 @@ export function SideNavigation({
   const pathname = usePathname();
 
   const [selectedKey, setSelectedKey] = useState("/");
-  const [pendingNavigationPath, setPendingNavigationPath] = useState<string | null>(null);
+  const [pendingNavigationPath, setPendingNavigationPath] = useState<
+    string | null
+  >(null);
   const isCollapsed = typeof collapsed === "boolean" ? collapsed : false;
 
   // Update selected key when pathname changes
@@ -105,7 +142,10 @@ export function SideNavigation({
       }
     };
 
-    const cleanup = authEvents.on(AUTH_EVENTS.LOGIN_SUCCESS, handleLoginSuccess);
+    const cleanup = authEvents.on(
+      AUTH_EVENTS.LOGIN_SUCCESS,
+      handleLoginSuccess
+    );
     return cleanup;
   }, [pendingNavigationPath, isAuthenticated, router]);
 
@@ -148,7 +188,17 @@ export function SideNavigation({
         // Pre-check authentication - show auth prompt if user is not authenticated
         if (!isAuthenticated && !isSpeedMode && route.path !== "/") {
           setPendingNavigationPath(route.path);
-          openAuthPromptModal();
+          casService.getConfig().then((config) => {
+            if (
+              !authFlowState.isExplicitLogoutInProgress() &&
+              config.enabled &&
+              config.login_mode === "force"
+            ) {
+              casService.startLogin(route.path);
+              return;
+            }
+            openAuthPromptModal();
+          });
           return; // Prevent navigation
         }
 
diff --git a/frontend/components/skill/InstallOfficialSkillsModal.tsx b/frontend/components/skill/InstallOfficialSkillsModal.tsx
index e3cc83d1f..b8e8d4ce6 100644
--- a/frontend/components/skill/InstallOfficialSkillsModal.tsx
+++ b/frontend/components/skill/InstallOfficialSkillsModal.tsx
@@ -1,13 +1,12 @@
 "use client";
 
 import React, { useState, useEffect } from "react";
-import { Modal, Spin, message } from "antd";
+import { Modal, Spin, message, Tooltip } from "antd";
 import { useTranslation } from "react-i18next";
 import { CircleCheckBig, CircleOff, CircleDot, LoaderCircle } from "lucide-react";
 
 import { fetchOfficialSkillsWithStatus, installOfficialSkills } from "@/services/skillService";
 import { InstallableSkill } from "@/types/agentConfig";
-import { Tooltip } from "@/components/ui/tooltip";
 
 interface InstallOfficialSkillsModalProps {
   open: boolean;
diff --git a/frontend/const/agentConfig.ts b/frontend/const/agentConfig.ts
index aed7b6404..4c8b96a7f 100644
--- a/frontend/const/agentConfig.ts
+++ b/frontend/const/agentConfig.ts
@@ -53,6 +53,8 @@ export const GENERATE_PROMPT_STREAM_TYPES = {
   AGENT_VAR_NAME: "agent_var_name",
   AGENT_DESCRIPTION: "agent_description",
   AGENT_DISPLAY_NAME: "agent_display_name",
+  GREETING_MESSAGE: "greeting_message",
+  EXAMPLE_QUESTIONS: "example_questions",
 } as const;
 
 export const TOOL_PARAM_TYPES = {
diff --git a/frontend/const/chatConfig.ts b/frontend/const/chatConfig.ts
index 27b3b887d..c206fa752 100644
--- a/frontend/const/chatConfig.ts
+++ b/frontend/const/chatConfig.ts
@@ -117,9 +117,11 @@ messageTypes: {
   STEP_COUNT: "step_count" as const,
   TOKEN_COUNT: "token_count" as const,
   MAX_STEPS_REACHED: "max_steps_reached" as const,
+  VERIFICATION: "verification" as const,
   SEARCH_CONTENT_PLACEHOLDER: "search_content_placeholder" as const,
   VIRTUAL: "virtual" as const,
   PREPROCESS: "preprocess" as const,
+  SKILL_FILES: "skill_files" as const,
 },
 
 // Content type constants for last content type tracking
@@ -133,6 +135,7 @@ contentTypes: {
   SEARCH_CONTENT: "search_content" as const,
   CARD: "card" as const,
   MEMORY_SEARCH: "memory_search" as const,
+  VERIFICATION: "verification" as const,
   PREPROCESS: "preprocess" as const,
 },
 
diff --git a/frontend/hooks/agent/useAgentGeneration.ts b/frontend/hooks/agent/useAgentGeneration.ts
index 4ffa31adb..cfd350e91 100644
--- a/frontend/hooks/agent/useAgentGeneration.ts
+++ b/frontend/hooks/agent/useAgentGeneration.ts
@@ -151,11 +151,16 @@ export function useAgentGeneration({
               }
               break;
             case GENERATE_PROMPT_STREAM_TYPES.AGENT_DISPLAY_NAME:
-              // Only save to cache if user hasn't filled in agent display name themselves
               if (!editedAgent.display_name) {
                 saveGeneratedField(generationAgentId, 'agentDisplayName', data.content);
               }
               break;
+            case GENERATE_PROMPT_STREAM_TYPES.GREETING_MESSAGE:
+              saveGeneratedField(generationAgentId, 'greetingMessage', data.content);
+              break;
+            case GENERATE_PROMPT_STREAM_TYPES.EXAMPLE_QUESTIONS:
+              saveGeneratedField(generationAgentId, 'exampleQuestions', data.content);
+              break;
           }
         },
         (error) => {
@@ -211,6 +216,12 @@ export function useAgentGeneration({
             duty_prompt: cached?.dutyPrompt || editedAgent.duty_prompt || "",
             constraint_prompt: cached?.constraintPrompt || editedAgent.constraint_prompt || "",
             few_shots_prompt: cached?.fewShotsPrompt || editedAgent.few_shots_prompt || "",
+            greeting_message: cached?.greetingMessage || editedAgent.greeting_message || "",
+            example_questions: cached?.exampleQuestions
+              ? (typeof cached.exampleQuestions === "string"
+                ? (() => { try { return JSON.parse(cached.exampleQuestions); } catch { return []; } })()
+                : cached.exampleQuestions)
+              : editedAgent.example_questions || [],
           };
           // Update agent config in store
           updateAgentConfig(configUpdates);
diff --git a/frontend/hooks/agent/useSaveGuard.ts b/frontend/hooks/agent/useSaveGuard.ts
index 6d948deff..2f644e0bc 100644
--- a/frontend/hooks/agent/useSaveGuard.ts
+++ b/frontend/hooks/agent/useSaveGuard.ts
@@ -135,6 +135,7 @@ export const useSaveGuard = () => {
         model_id: currentEditedAgent.model_id ?? undefined,
         max_steps: currentEditedAgent.max_step,
         provide_run_summary: currentEditedAgent.provide_run_summary,
+        verification_config: currentEditedAgent.verification_config,
         enabled: true,
         business_description: currentEditedAgent.business_description,
         duty_prompt: currentEditedAgent.duty_prompt,
@@ -149,6 +150,8 @@ export const useSaveGuard = () => {
         related_agent_ids: relatedAgentIds,
         related_external_agent_ids: relatedExternalAgentIds,
         ingroup_permission: currentEditedAgent.ingroup_permission ?? "READ_ONLY",
+        greeting_message: currentEditedAgent.greeting_message,
+        example_questions: currentEditedAgent.example_questions,
       });
 
       if (result.success) {
diff --git a/frontend/hooks/auth/useAuthenticationState.ts b/frontend/hooks/auth/useAuthenticationState.ts
index 3f8923ca7..402b5c717 100644
--- a/frontend/hooks/auth/useAuthenticationState.ts
+++ b/frontend/hooks/auth/useAuthenticationState.ts
@@ -1,13 +1,20 @@
 "use client";
 
-import { useState, useEffect, useCallback } from "react";
+import { useState, useEffect, useCallback, useRef } from "react";
 import { useTranslation } from "react-i18next";
 import { App } from "antd";
 
 import { useDeployment } from "@/components/providers/deploymentProvider";
 import { useQueryClient } from "@tanstack/react-query";
 import { authService } from "@/services/authService";
-import { getSessionFromStorage, removeSessionFromStorage, checkSessionValid, hasAuthCookies } from "@/lib/session";
+import { casService } from "@/services/casService";
+import {
+  getSessionFromStorage,
+  removeSessionFromStorage,
+  checkSessionValid,
+  getTokenExpiresAt,
+} from "@/lib/session";
+import { authFlowState } from "@/lib/authFlow";
 import { Session, AuthenticationStateReturn } from "@/types/auth";
 import { STATUS_CODES } from "@/const/auth";
 import { authEventUtils } from "@/lib/authEvents";
@@ -30,6 +37,7 @@ export function useAuthenticationState(): AuthenticationStateReturn {
   const [session, setSession] = useState<Session | null>(null);
   const [authServiceUnavailable, setAuthServiceUnavailable] =
     useState<boolean>(false);
+  const isCasLoginInProgressRef = useRef(false);
 
   // Speed mode: skip authentication checks, consider user as authenticated
   useEffect(() => {
@@ -51,6 +59,68 @@ export function useAuthenticationState(): AuthenticationStateReturn {
     setIsAuthChecking(false);
   }, [isSpeedMode]);
 
+  useEffect(() => {
+    if (isSpeedMode || isAuthChecking || isAuthenticated) return;
+    if (isCasLoginInProgressRef.current) return;
+    if (authFlowState.isExplicitLogoutInProgress()) return;
+    if (typeof window === "undefined") return;
+
+    const pathname = window.location.pathname;
+    if (pathname.includes("/oauth/complete")) return;
+
+    let cancelled = false;
+    casService.getConfig().then((config) => {
+      if (
+        cancelled ||
+        isCasLoginInProgressRef.current ||
+        authFlowState.isExplicitLogoutInProgress() ||
+        !config.enabled ||
+        config.login_mode !== "force"
+      ) {
+        return;
+      }
+
+      isCasLoginInProgressRef.current = true;
+      casService.startLogin();
+    });
+
+    return () => {
+      cancelled = true;
+    };
+  }, [isSpeedMode, isAuthChecking, isAuthenticated]);
+
+  useEffect(() => {
+    if (isSpeedMode || !isAuthenticated) return;
+
+    let timeoutId: ReturnType<typeof setTimeout> | null = null;
+    let cancelled = false;
+
+    casService.getConfig().then((config) => {
+      if (cancelled || !config.enabled || config.login_mode === "disabled")
+        return;
+      const expiresAt = getTokenExpiresAt();
+      if (!expiresAt) return;
+
+      const renewAtMs = expiresAt * 1000 - config.renew_before_seconds * 1000;
+      const delayMs = Math.max(0, renewAtMs - Date.now());
+      timeoutId = setTimeout(async () => {
+        const ok = await casService.renewInIframe(config.renew_timeout_seconds);
+        if (!ok || cancelled) return;
+        const renewedSession = getSessionFromStorage();
+        if (renewedSession) {
+          setSession(renewedSession);
+          setIsAuthenticated(true);
+          authEventUtils.emitTokenRefreshed();
+        }
+      }, delayMs);
+    });
+
+    return () => {
+      cancelled = true;
+      if (timeoutId) clearTimeout(timeoutId);
+    };
+  }, [isAuthenticated, session?.expires_at, isSpeedMode]);
+
   const clearLocalSession = useCallback(() => {
     removeSessionFromStorage();
     setSession(null);
@@ -114,11 +184,7 @@ export function useAuthenticationState(): AuthenticationStateReturn {
 
   // Register method
   const register = useCallback(
-    async (
-      email: string,
-      password: string,
-      inviteCode?: string
-    ) => {
+    async (email: string, password: string, inviteCode?: string) => {
       setIsLoading(true);
 
       try {
@@ -157,47 +223,44 @@ export function useAuthenticationState(): AuthenticationStateReturn {
   );
 
   // Logout method
-  const logout = useCallback(
-    async (options: { silent?: boolean } = {}) => {
-      const { silent = false } = options;
+  const logout = useCallback(async (options: { silent?: boolean } = {}) => {
+    const { silent = false } = options;
 
-      try {
-        setIsLoading(true);
+    try {
+      setIsLoading(true);
 
-        if (!silent) {
-          // Call logout API
-          await authService.signOut();
-        }
+      if (!silent) {
+        // Call logout API
+        await authService.signOut();
+      }
 
-        // Clear local session
-        removeSessionFromStorage();
-        setSession(null);
-        setIsAuthenticated(false);
+      // Clear local session
+      removeSessionFromStorage();
+      setSession(null);
+      setIsAuthenticated(false);
 
-        queryClient.clear();
-        if (!silent) {
-          message.success(t("auth.logoutSuccess"));
-        }
+      queryClient.clear();
+      if (!silent) {
+        message.success(t("auth.logoutSuccess"));
+      }
 
-        // Emit logout event
-        authEventUtils.emitLogout();
-      } catch (error: any) {
-        log.error("Logout failed:", error?.message || error);
-        // Even if API call fails, clear local session
-        removeSessionFromStorage();
-        setSession(null);
-        setIsAuthenticated(false);
+      // Emit logout event
+      authEventUtils.emitLogout();
+    } catch (error: any) {
+      log.error("Logout failed:", error?.message || error);
+      // Even if API call fails, clear local session
+      removeSessionFromStorage();
+      setSession(null);
+      setIsAuthenticated(false);
 
-        queryClient.clear();
-        if (!silent) {
-          message.error(t("auth.logoutFailed"));
-        }
-      } finally {
-        setIsLoading(false);
+      queryClient.clear();
+      if (!silent) {
+        message.error(t("auth.logoutFailed"));
       }
-    },
-    []
-  );
+    } finally {
+      setIsLoading(false);
+    }
+  }, []);
 
   // Revoke method
   const revoke = useCallback(async () => {
@@ -233,6 +296,6 @@ export function useAuthenticationState(): AuthenticationStateReturn {
     register,
     logout,
     clearLocalSession,
-    revoke
+    revoke,
   };
 }
diff --git a/frontend/hooks/auth/useAuthenticationUI.ts b/frontend/hooks/auth/useAuthenticationUI.ts
index 2b42641da..748d6d359 100644
--- a/frontend/hooks/auth/useAuthenticationUI.ts
+++ b/frontend/hooks/auth/useAuthenticationUI.ts
@@ -1,6 +1,6 @@
 "use client";
 
-import { useState, useCallback, useEffect } from "react";
+import { useState, useCallback, useEffect, useRef } from "react";
 import { useRouter, usePathname, useSearchParams } from "next/navigation";
 import { App } from "antd";
 import { useTranslation } from "react-i18next";
@@ -9,6 +9,8 @@ import { useDeployment } from "@/components/providers/deploymentProvider";
 import { AUTH_EVENTS } from "@/const/auth";
 import { getEffectiveRoutePath } from "@/lib/auth";
 import { authEvents, authEventUtils } from "@/lib/authEvents";
+import { authFlowState } from "@/lib/authFlow";
+import { casService } from "@/services/casService";
 import { AuthenticationUIReturn, RegisterModalOptions } from "@/types/auth";
 
 /**
@@ -33,6 +35,7 @@ export function useAuthenticationUI({
   const { message } = App.useApp();
   const effectivePath = pathname ? getEffectiveRoutePath(pathname) : "/";
   const isOAuthCompletePage = effectivePath === "/oauth/complete";
+  const isRedirectingToCasRef = useRef(false);
 
   // UI state for modals - managed locally within the hook
   const [isLoginModalOpen, setIsLoginModalOpen] = useState(false);
@@ -40,12 +43,12 @@ export function useAuthenticationUI({
   const [registerModalOptions, setRegisterModalOptions] =
     useState<RegisterModalOptions | null>(null);
   const [isAuthPromptModalOpen, setIsAuthPromptModalOpen] = useState(false);
-  const [isSessionExpiredModalOpen, setIsSessionExpiredModalOpen] = useState(false);
+  const [isSessionExpiredModalOpen, setIsSessionExpiredModalOpen] =
+    useState(false);
 
-  const handleUnauthenticatedModalClose = (() => {
+  const handleUnauthenticatedModalClose = () => {
     // Only emit back to home event and redirect if user is not authenticated
     if (!isAuthenticated && !isSpeedMode) {
-        
       // Emit event to notify SideNavigation to reset selected key
       authEventUtils.emitBackToHome();
       // Redirect to home page if not already there
@@ -53,7 +56,7 @@ export function useAuthenticationUI({
         router.push("/");
       }
     }
-  });
+  };
 
   // Modal control functions
   const openLoginModal = useCallback(() => setIsLoginModalOpen(true), []);
@@ -74,14 +77,37 @@ export function useAuthenticationUI({
     handleUnauthenticatedModalClose();
   }, [handleUnauthenticatedModalClose]);
 
-  const openAuthPromptModal = useCallback(() => setIsAuthPromptModalOpen(true), []);
+  const redirectToCasIfForced = useCallback(
+    async (redirect?: string): Promise<boolean> => {
+      if (isRedirectingToCasRef.current) return true;
+      if (authFlowState.isExplicitLogoutInProgress()) return true;
+
+      const config = await casService.getConfig();
+      if (authFlowState.isExplicitLogoutInProgress()) return true;
+      if (!config.enabled || config.login_mode !== "force") return false;
+
+      isRedirectingToCasRef.current = true;
+      casService.startLogin(redirect);
+      return true;
+    },
+    []
+  );
+
+  const openAuthPromptModal = useCallback(() => {
+    redirectToCasIfForced(effectivePath).then((redirected) => {
+      if (!redirected) setIsAuthPromptModalOpen(true);
+    });
+  }, [effectivePath, redirectToCasIfForced]);
 
   const closeAuthPromptModal = useCallback(() => {
     setIsAuthPromptModalOpen(false);
     handleUnauthenticatedModalClose();
   }, [handleUnauthenticatedModalClose]);
 
-  const openSessionExpiredModal = useCallback(() => setIsSessionExpiredModalOpen(true), []);
+  const openSessionExpiredModal = useCallback(
+    () => setIsSessionExpiredModalOpen(true),
+    []
+  );
 
   const closeSessionExpiredModal = useCallback(() => {
     clearLocalSession();
@@ -105,13 +131,15 @@ export function useAuthenticationUI({
     if (isSpeedMode) return;
 
     const handleSessionExpired = () => {
-      // Prevent showing session expired modal when login/register modal is already open
-      // This avoids race conditions when mousemove events trigger session checks
-      // while the user is already filling in the login form
+      // Prevent showing session expired modal when login/register modal is already open.
+      // This avoids race conditions while the user is filling in an auth form.
       if (isLoginModalOpen || isRegisterModalOpen) {
         return;
       }
-      setIsSessionExpiredModalOpen(true);
+
+      redirectToCasIfForced(effectivePath).then((redirected) => {
+        if (!redirected) setIsSessionExpiredModalOpen(true);
+      });
     };
 
     const handleRegisterSuccess = () => {
@@ -134,7 +162,13 @@ export function useAuthenticationUI({
       cleanup();
       cleanupRegister();
     };
-  }, [isSpeedMode, isLoginModalOpen, isRegisterModalOpen]);
+  }, [
+    effectivePath,
+    isSpeedMode,
+    redirectToCasIfForced,
+    isLoginModalOpen,
+    isRegisterModalOpen,
+  ]);
 
   // Auto-open login modal when returning from a failed OAuth redirect
   useEffect(() => {
@@ -154,7 +188,17 @@ export function useAuthenticationUI({
     if (oauthError && !isLoginModalOpen) {
       setIsLoginModalOpen(true);
     }
-  }, [searchParams, isAuthChecking, isAuthenticated, isSpeedMode, isLoginModalOpen, router, isOAuthCompletePage, message, getOAuthErrorMessage]);
+  }, [
+    searchParams,
+    isAuthChecking,
+    isAuthenticated,
+    isSpeedMode,
+    isLoginModalOpen,
+    router,
+    isOAuthCompletePage,
+    message,
+    getOAuthErrorMessage,
+  ]);
 
   useEffect(() => {
     if (!isOAuthCompletePage) return;
@@ -175,9 +219,28 @@ export function useAuthenticationUI({
     if (isSessionExpiredModalOpen) return;
     if (isLoginModalOpen) return;
     if (isRegisterModalOpen) return;
-    openAuthPromptModal();
-  }, [pathname, isAuthenticated, isSpeedMode, isAuthChecking, isSessionExpiredModalOpen, openAuthPromptModal, isOAuthCompletePage]);
+    let cancelled = false;
 
+    redirectToCasIfForced(effectivePath).then((redirected) => {
+      if (!cancelled && !redirected) {
+        setIsAuthPromptModalOpen(true);
+      }
+    });
+
+    return () => {
+      cancelled = true;
+    };
+  }, [
+    effectivePath,
+    isAuthenticated,
+    isSpeedMode,
+    isAuthChecking,
+    isSessionExpiredModalOpen,
+    isLoginModalOpen,
+    isRegisterModalOpen,
+    isOAuthCompletePage,
+    redirectToCasIfForced,
+  ]);
 
   return {
     // Login/Register Modal
diff --git a/frontend/lib/agentGenerationCache.ts b/frontend/lib/agentGenerationCache.ts
index 6799f3d2f..d8dbfb045 100644
--- a/frontend/lib/agentGenerationCache.ts
+++ b/frontend/lib/agentGenerationCache.ts
@@ -30,6 +30,10 @@ export interface AgentGenerationCache {
   agentDisplayName: string;
   /** Generated agent description */
   agentDescription: string;
+  /** Generated greeting message */
+  greetingMessage: string;
+  /** Generated example questions */
+  exampleQuestions: string;
 }
 
 /**
@@ -46,6 +50,8 @@ const DEFAULT_CACHE: AgentGenerationCache = {
   agentName: "",
   agentDisplayName: "",
   agentDescription: "",
+  greetingMessage: "",
+  exampleQuestions: "",
 };
 
 /**
@@ -173,7 +179,7 @@ export function setAgentGenerationStatus(
 export function saveGeneratedField<
   K extends keyof Pick<
     AgentGenerationCache,
-    'dutyPrompt' | 'constraintPrompt' | 'fewShotsPrompt' | 'agentName' | 'agentDisplayName' | 'agentDescription'
+    'dutyPrompt' | 'constraintPrompt' | 'fewShotsPrompt' | 'agentName' | 'agentDisplayName' | 'agentDescription' | 'greetingMessage' | 'exampleQuestions'
   >
 >(
   agentId: number,
diff --git a/frontend/lib/auth.ts b/frontend/lib/auth.ts
index 7c6cafa11..330028bc3 100644
--- a/frontend/lib/auth.ts
+++ b/frontend/lib/auth.ts
@@ -15,6 +15,7 @@ import {
   hasAuthCookies,
   handleSessionExpired,
 } from "@/lib/session";
+import { authFlowState } from "@/lib/authFlow";
 
 /**
  * Role color mapping - Ant Design color presets
@@ -49,7 +50,11 @@ export function generateAvatarUrl(email: string): string {
 export const fetchWithAuth = async (url: string, options: RequestInit = {}) => {
   // Frontend pre-check: detect session expiry without hitting backend
   if (typeof window !== "undefined") {
-    if (hasAuthCookies() && !checkSessionValid()) {
+    if (
+      !authFlowState.isExplicitLogoutInProgress() &&
+      hasAuthCookies() &&
+      !checkSessionValid()
+    ) {
       handleSessionExpired();
       throw new ApiError(
         STATUS_CODES.TOKEN_EXPIRED,
diff --git a/frontend/lib/authFlow.ts b/frontend/lib/authFlow.ts
new file mode 100644
index 000000000..329157120
--- /dev/null
+++ b/frontend/lib/authFlow.ts
@@ -0,0 +1,13 @@
+let explicitLogoutInProgress = false;
+
+export const authFlowState = {
+  beginExplicitLogout: (): void => {
+    explicitLogoutInProgress = true;
+  },
+
+  endExplicitLogout: (): void => {
+    explicitLogoutInProgress = false;
+  },
+
+  isExplicitLogoutInProgress: (): boolean => explicitLogoutInProgress,
+};
diff --git a/frontend/lib/chat/chatMessageExtractor.ts b/frontend/lib/chat/chatMessageExtractor.ts
deleted file mode 100644
index f7d172be4..000000000
--- a/frontend/lib/chat/chatMessageExtractor.ts
+++ /dev/null
@@ -1,292 +0,0 @@
-import { chatConfig, MESSAGE_ROLES } from "@/const/chatConfig";
-import {
-  ApiMessage,
-  SearchResult,
-  AgentStep,
-  ApiMessageItem,
-  ChatMessageType,
-  MinioFileItem,
-} from "@/types/chat";
-import log from "@/lib/logger";
-
-// Replace <user_break> tag with the localized natural language string
-const processSpecialTag = (content: string, t: any): string => {
-  if (!content || typeof content !== "string") {
-    return content;
-  }
-
-  if (content == "<user_break>") {
-    return t("chatStreamHandler.userInterrupted");
-  }
-
-  return content;
-};
-
-export function extractAssistantMsgFromResponse(
-  dialog_msg: ApiMessage,
-  index: number,
-  create_time: number,
-  t: any
-) {
-  let searchResultsContent: SearchResult[] = [];
-  if (
-    dialog_msg.search &&
-    Array.isArray(dialog_msg.search) &&
-    dialog_msg.search.length > 0
-  ) {
-    searchResultsContent = dialog_msg.search.map((item) => ({
-      title: item.title || t("extractMsg.unknownTitle"),
-      url: item.url || "#",
-      text: item.text || t("extractMsg.noContentDescription"),
-      published_date: item.published_date || "",
-      source_type: item.source_type || "",
-      filename: item.filename || "",
-      score: typeof item.score === "number" ? item.score : undefined,
-      score_details: item.score_details || {},
-      tool_sign: item.tool_sign || "",
-      cite_index: typeof item.cite_index === "number" ? item.cite_index : -1,
-    }));
-  }
-
-  // handle images
-  let imagesContent: string[] = [];
-  if (
-    dialog_msg.picture &&
-    Array.isArray(dialog_msg.picture) &&
-    dialog_msg.picture.length > 0
-  ) {
-    imagesContent = dialog_msg.picture;
-  }
-
-  // extract the content of the Message
-  let finalAnswer = "";
-  let steps: AgentStep[] = [];
-  if (dialog_msg.message && Array.isArray(dialog_msg.message)) {
-    dialog_msg.message.forEach((msg: ApiMessageItem) => {
-      switch (msg.type) {
-        case chatConfig.messageTypes.FINAL_ANSWER: {
-          finalAnswer += processSpecialTag(msg.content, t);
-          break;
-        }
-
-        case chatConfig.messageTypes.STEP_COUNT: {
-          steps.push({
-            id: `step-${steps.length + 1}`,
-            title: msg.content.trim(),
-            content: "",
-            expanded: false,
-            contents: [],
-            metrics: null,
-            thinking: { content: "", expanded: false },
-            code: { content: "", expanded: false },
-            output: { content: "", expanded: false },
-          });
-          break;
-        }
-
-        case chatConfig.messageTypes.MODEL_OUTPUT_THINKING: {
-          const currentStep = steps[steps.length - 1];
-          if (currentStep) {
-            const contentId = `model-${Date.now()}-${Math.random()
-              .toString(36)
-              .substring(2, 7)}`;
-            currentStep.contents.push({
-              id: contentId,
-              type: "model_output",
-              subType: "thinking",
-              content: msg.content,
-              expanded: true,
-              timestamp: Date.now(),
-            });
-          }
-          break;
-        }
-
-        case chatConfig.messageTypes.EXECUTION_LOGS: {
-          const currentStep = steps[steps.length - 1];
-          if (currentStep) {
-            const contentId = `execution-${Date.now()}-${Math.random()
-              .toString(36)
-              .substring(2, 7)}`;
-            currentStep.contents.push({
-              id: contentId,
-              type: "execution",
-              content: msg.content,
-              expanded: true,
-              timestamp: Date.now(),
-            });
-          }
-          break;
-        }
-
-        case chatConfig.messageTypes.ERROR: {
-          const currentStep = steps[steps.length - 1];
-          if (currentStep) {
-            const contentId = `error-${Date.now()}-${Math.random()
-              .toString(36)
-              .substring(2, 7)}`;
-            currentStep.contents.push({
-              id: contentId,
-              type: "error",
-              content: msg.content,
-              expanded: true,
-              timestamp: Date.now(),
-            });
-          }
-          break;
-        }
-
-        case chatConfig.messageTypes.SEARCH_CONTENT_PLACEHOLDER: {
-          const currentStep = steps[steps.length - 1];
-          if (currentStep) {
-            try {
-              const placeholderData = JSON.parse(msg.content);
-              const unitId = placeholderData.unit_id;
-
-              if (
-                unitId &&
-                dialog_msg.search_unit_id &&
-                dialog_msg.search_unit_id[unitId.toString()]
-              ) {
-                const unitSearchResults =
-                  dialog_msg.search_unit_id[unitId.toString()];
-                const searchContent = JSON.stringify(unitSearchResults);
-
-                const contentId = `search-content-${Date.now()}-${Math.random()
-                  .toString(36)
-                  .substring(2, 7)}`;
-                currentStep.contents.push({
-                  id: contentId,
-                  type: "search_content",
-                  content: searchContent,
-                  expanded: true,
-                  timestamp: Date.now(),
-                });
-              }
-            } catch (e) {
-              log.error(t("extractMsg.cannotParseSearchPlaceholder"), e);
-            }
-          }
-          break;
-        }
-
-        case chatConfig.messageTypes.TOKEN_COUNT: {
-          const currentStep = steps[steps.length - 1];
-          if (currentStep) {
-            try {
-              currentStep.metrics = JSON.parse(msg.content);
-            } catch {
-              currentStep.metrics = null;
-            }
-          }
-          break;
-        }
-
-        case chatConfig.messageTypes.CARD: {
-          const currentStep = steps[steps.length - 1];
-          if (currentStep) {
-            const contentId = `card-${Date.now()}-${Math.random()
-              .toString(36)
-              .substring(2, 7)}`;
-            currentStep.contents.push({
-              id: contentId,
-              type: "card",
-              content: msg.content,
-              expanded: true,
-              timestamp: Date.now(),
-            });
-          }
-          break;
-        }
-
-        case chatConfig.messageTypes.TOOL: {
-          const currentStep = steps[steps.length - 1];
-          if (currentStep) {
-            const contentId = `tool-${Date.now()}-${Math.random()
-              .toString(36)
-              .substring(2, 7)}`;
-            currentStep.contents.push({
-              id: contentId,
-              type: "executing", // use the existing executing type to represent the tool call
-              content: msg.content,
-              expanded: true,
-              timestamp: Date.now(),
-            });
-          }
-          break;
-        }
-
-        default:
-          break;
-      }
-    });
-  }
-
-  const formattedAssistantMsg: ChatMessageType = {
-    id: `assistant-${index}-${Date.now()}`,
-    role: MESSAGE_ROLES.ASSISTANT,
-    message_id: dialog_msg.message_id,
-    content: "",
-    opinion_flag: dialog_msg.opinion_flag,
-    timestamp: new Date(create_time),
-    steps: steps,
-    finalAnswer: finalAnswer,
-    agentRun: "",
-    isComplete: true,
-    showRawContent: false,
-    searchResults: searchResultsContent,
-    images: imagesContent,
-    attachments: undefined,
-  };
-  return formattedAssistantMsg;
-}
-
-export function extractUserMsgFromResponse(
-  dialog_msg: ApiMessage,
-  index: number,
-  create_time: number
-) {
-  let userContent = "";
-  if (Array.isArray(dialog_msg.message)) {
-    const stringMessage = dialog_msg.message.find(
-      (m: { type: string; content: string }) => m.type === "string"
-    );
-    userContent = stringMessage?.content || "";
-  } else if (typeof dialog_msg.message === "string") {
-    userContent = dialog_msg.message;
-  } else if (dialog_msg.message && typeof dialog_msg.message === "object") {
-    const msgObj = dialog_msg.message as { content?: string };
-    userContent = msgObj.content || "";
-  }
-
-  let userAttachments: MinioFileItem[] = [];
-  if (
-    dialog_msg.minio_files &&
-    Array.isArray(dialog_msg.minio_files) &&
-    dialog_msg.minio_files.length > 0
-  ) {
-    userAttachments = dialog_msg.minio_files.map((item) => {
-      return {
-        type: item.type || "",
-        name: item.name || "",
-        size: item.size || 0,
-        object_name: item.object_name,
-        url: item.url,
-        description: item.description,
-      };
-    });
-  }
-
-  const formattedUserMsg: ChatMessageType = {
-    id: `user-${index}-${Date.now()}`,
-    role: MESSAGE_ROLES.USER,
-    message_id: dialog_msg.message_id,
-    content: userContent,
-    opinion_flag: dialog_msg.opinion_flag,
-    timestamp: new Date(create_time),
-    showRawContent: true,
-    isComplete: true,
-    attachments: userAttachments.length > 0 ? userAttachments : undefined,
-  };
-  return formattedUserMsg;
-}
diff --git a/frontend/lib/chatMessageExtractor.ts b/frontend/lib/chatMessageExtractor.ts
index 08f73de82..eb0f79aec 100644
--- a/frontend/lib/chatMessageExtractor.ts
+++ b/frontend/lib/chatMessageExtractor.ts
@@ -22,6 +22,40 @@ const processSpecialTag = (content: string, t: any): string => {
   return content;
 };
 
+const createAgentStep = (
+  id: string,
+  title: string,
+  expanded = false
+): AgentStep => ({
+  id,
+  title,
+  content: "",
+  expanded,
+  contents: [],
+  metrics: null,
+  thinking: { content: "", expanded },
+  code: { content: "", expanded },
+  output: { content: "", expanded },
+});
+
+const getOrCreateCurrentStep = (
+  steps: AgentStep[],
+  fallbackTitle: string
+): AgentStep => {
+  const currentStep = steps[steps.length - 1];
+  if (currentStep) {
+    return currentStep;
+  }
+
+  const recoveredStep = createAgentStep(
+    `step-history-${Date.now()}-${Math.random().toString(36).substring(2, 9)}`,
+    fallbackTitle,
+    true
+  );
+  steps.push(recoveredStep);
+  return recoveredStep;
+};
+
 export function extractAssistantMsgFromResponse(
   dialog_msg: ApiMessage,
   index: number,
@@ -70,17 +104,9 @@ export function extractAssistantMsgFromResponse(
         }
 
         case chatConfig.messageTypes.STEP_COUNT: {
-          steps.push({
-            id: `step-${steps.length + 1}`,
-            title: msg.content.trim(),
-            content: "",
-            expanded: false,
-            contents: [],
-            metrics: null,
-            thinking: { content: "", expanded: false },
-            code: { content: "", expanded: false },
-            output: { content: "", expanded: false },
-          });
+          steps.push(
+            createAgentStep(`step-${steps.length + 1}`, msg.content.trim())
+          );
           break;
         }
 
@@ -216,6 +242,22 @@ export function extractAssistantMsgFromResponse(
           break;
         }
 
+        case chatConfig.messageTypes.VERIFICATION: {
+          const currentStep = getOrCreateCurrentStep(steps, "Verification");
+          const contentId = `verification-${Date.now()}-${Math.random()
+            .toString(36)
+            .substring(2, 7)}`;
+          currentStep.contents.push({
+            id: contentId,
+            type: chatConfig.messageTypes.VERIFICATION,
+            subType: "verification",
+            content: msg.content,
+            expanded: true,
+            timestamp: Date.now(),
+          });
+          break;
+        }
+
         case chatConfig.messageTypes.MAX_STEPS_REACHED: {
           // Parse the max steps reached event data for historical messages
           try {
@@ -250,6 +292,24 @@ export function extractAssistantMsgFromResponse(
     });
   }
 
+  let assistantAttachments: MinioFileItem[] = [];
+  if (
+    dialog_msg.minio_files &&
+    Array.isArray(dialog_msg.minio_files) &&
+    dialog_msg.minio_files.length > 0
+  ) {
+    assistantAttachments = dialog_msg.minio_files.map((item) => {
+      return {
+        type: item.type || "",
+        name: item.name || "",
+        size: item.size || 0,
+        object_name: item.object_name,
+        url: item.url,
+        description: item.description,
+      };
+    });
+  }
+
   const formattedAssistantMsg: ChatMessageType = {
     id: `assistant-${index}-${Date.now()}`,
     role: MESSAGE_ROLES.ASSISTANT,
@@ -264,7 +324,7 @@ export function extractAssistantMsgFromResponse(
     showRawContent: false,
     searchResults: searchResultsContent,
     images: imagesContent,
-    attachments: undefined,
+    attachments: assistantAttachments.length > 0 ? assistantAttachments : undefined,
   };
   return formattedAssistantMsg;
 }
@@ -300,7 +360,7 @@ export function extractUserMsgFromResponse(
         size: item.size || 0,
         object_name: item.object_name,
         url: item.url,
-        presigned_url: item.presigned_url,  // Preserve presigned_url for MCP tool access
+        presigned_url: item.presigned_url, // Preserve presigned_url for MCP tool access
         description: item.description,
       };
     });
diff --git a/frontend/lib/filePreviewUtils.ts b/frontend/lib/filePreviewUtils.ts
index 0126241bf..929f01446 100644
--- a/frontend/lib/filePreviewUtils.ts
+++ b/frontend/lib/filePreviewUtils.ts
@@ -353,3 +353,43 @@ export function getPageWrapperStyle(
 
   return { minHeight: placeholderHeight, width: placeholderWidth };
 }
+
+export type PreviewAccessReason = 'forbidden' | 'not_found';
+
+export class PreviewAccessError extends Error {
+  readonly reason: PreviewAccessReason;
+
+  constructor(reason: PreviewAccessReason) {
+    super(reason);
+    this.name = 'PreviewAccessError';
+    this.reason = reason;
+  }
+}
+
+export function getPreviewAccessReasonFromStatus(
+  status: number,
+): PreviewAccessReason | null {
+  if (status === 403) return 'forbidden';
+  if (status === 404) return 'not_found';
+  return null;
+}
+
+/** Fetch remote preview content; throws PreviewAccessError on 403/404. */
+export async function fetchPreviewBlob(
+  url: string,
+  signal?: AbortSignal,
+): Promise<Blob> {
+  const resp = await fetch(url, {
+    cache: 'no-store',
+    credentials: 'include',
+    signal,
+  });
+  const accessReason = getPreviewAccessReasonFromStatus(resp.status);
+  if (accessReason) {
+    throw new PreviewAccessError(accessReason);
+  }
+  if (!resp.ok) {
+    throw new Error(`HTTP ${resp.status}`);
+  }
+  return resp.blob();
+}
diff --git a/frontend/pnpm-workspace.yaml b/frontend/pnpm-workspace.yaml
index 3d5d51424..07399aa05 100644
--- a/frontend/pnpm-workspace.yaml
+++ b/frontend/pnpm-workspace.yaml
@@ -1,2 +1,4 @@
-ignoredBuiltDependencies:
-  - unrs-resolver
+allowBuilds:
+  core-js: true
+  sharp: true
+  unrs-resolver: true
diff --git a/frontend/public/locales/en/common.json b/frontend/public/locales/en/common.json
index 9e1d3d8b8..c3ccbd6c0 100644
--- a/frontend/public/locales/en/common.json
+++ b/frontend/public/locales/en/common.json
@@ -17,6 +17,10 @@
   "filePreview.loadingDocument": "Loading document...",
   "filePreview.loadingPage": "Loading page...",
   "filePreview.previewFailed": "File preview failed",
+  "filePreview.knowledge.accessDenied.title": "Cannot preview",
+  "filePreview.knowledge.accessDenied.content": "You do not have permission to preview this document.",
+  "filePreview.knowledge.noStoredCopy.title": "Cannot preview",
+  "filePreview.knowledge.noStoredCopy.content": "This knowledge base does not keep a copy of the document; preview is unavailable.",
   "filePreview.emptyFile": "This file content is empty",
   "filePreview.uploadToPreview": "Please upload the file before previewing",
   "filePreview.download": "Download",
@@ -274,6 +278,13 @@
   "chatStreamHandler.parseMaxStepsDataFailed": "Failed to parse max steps data:",
 
   "taskWindow.maxStepsReached": "Max steps limit reached ({{completedSteps}} steps), summarizing current work...",
+  "taskWindow.verification.start": "Self-checking...",
+  "taskWindow.verification.pass": "Self-check passed",
+  "taskWindow.verification.warning": "Self-check needs attention",
+  "taskWindow.verification.blocked": "Self-check blocked this action",
+  "taskWindow.verification.repair": "Self-check failed, revising",
+  "taskWindow.verification.finalPass": "Final self-check passed",
+  "taskWindow.verification.finalFail": "Final self-check did not pass",
   "taskWindow.unknownSource": "Unknown Source",
   "taskWindow.knowledgeFile": "Knowledge Base File",
   "taskWindow.urlParseError": "URL parsing error:",
@@ -315,6 +326,12 @@
   "agent.contextMenu.copy": "Copy",
   "agent.copySuffix": "Copy",
   "agent.info.title": "Agent Information",
+  "agent.greeting.tabTitle": "Greeting",
+  "agent.greeting.messageTitle": "Greeting Message",
+  "agent.greeting.messagePlaceholder": "Enter agent greeting, e.g., Hello! I'm your data analysis assistant",
+  "agent.greeting.questionsTitle": "Example Questions",
+  "agent.greeting.addQuestion": "Add Example Question",
+  "agent.greeting.removeQuestion": "Remove",
   "agent.info.name.error.empty": "Name cannot be empty",
   "agent.info.name.error.format": "Name can only contain letters, numbers and underscores, and must start with a letter or underscore",
   "agent.info.name.error.length": "Name length cannot exceed 50 characters",
@@ -327,6 +344,8 @@
   "agent.author.hint": "Default: {{email}}",
   "agent.provideRunSummary": "Provide Run Summary",
   "agent.provideRunSummary.error": "Please select whether to provide run summary",
+  "agent.verification": "Self Verification",
+  "agent.verification.error": "Please select whether to enable self verification",
   "agent.description": "Agent Description",
   "agent.descriptionPlaceholder": "Please enter agent description",
   "agent.userGroup": "User Group",
@@ -367,6 +386,10 @@
   "agent.debug.stop": "Stop",
   "agent.debug.clear": "Clear",
   "agent.debug.send": "Send",
+  "agent.debug.optimizeTitle": "Prompt optimization",
+  "agent.debug.optimizeHint": "Select a reply and provide feedback. The system will optimize the agent's full system prompt.",
+  "agent.debug.selectedQuestion": "Selected question",
+  "agent.debug.selectedAnswer": "Selected answer",
   "agent.debug.userStop": "User manually stopped debugging",
   "agent.debug.cancelError": "Error while canceling request",
   "agent.debug.stopError": "Failed to stop debug mode Agent run, but frontend has stopped:",
@@ -385,6 +408,11 @@
   "agent.debug.compareEmpty": "No output yet",
   "agent.debug.defaultMode": "Default mode",
   "agent.debug.compareMode": "Compare mode",
+  "agent.debug.promptCompare.title": "Prompt compare",
+  "agent.debug.promptCompare.close": "Close",
+  "agent.debug.promptCompare.apply": "Replace with Optimized Content",
+  "agent.debug.promptCompare.original": "Original",
+  "agent.debug.promptCompare.optimized": "Optimized",
 
   "guide.steps.describeBusinessLogic.title": "Describe Business Logic",
 
@@ -406,6 +434,25 @@
   "systemPrompt.optimize.empty": "No optimized content yet",
   "systemPrompt.optimize.replace": "Replace with Optimized Content",
   "systemPrompt.optimize.error": "Failed to optimize this section",
+  "systemPrompt.optimize.generating": "Generating optimized prompt template...",
+  "systemPrompt.optimize.generatingPlaceholder": "Generating, please wait...",
+  "systemPrompt.button.badcase": "Bad Case Optimize",
+  "systemPrompt.finetune.title": "Fine-Tune",
+  "systemPrompt.finetune.modeLabel": "Adjustment Mode",
+  "systemPrompt.finetune.modeGeneral": "Global Optimize",
+  "systemPrompt.finetune.modeGeneralDesc": "Optimize the entire section based on feedback",
+  "systemPrompt.finetune.modeInsert": "Insert Content",
+  "systemPrompt.finetune.modeInsertDesc": "Insert new content at a specific position",
+  "systemPrompt.finetune.modeSelect": "Replace Selection",
+  "systemPrompt.finetune.modeSelectDesc": "Replace the selected range of content",
+  "systemPrompt.finetune.insertPositionLabel": "Insert Position (character index)",
+  "systemPrompt.finetune.insertPositionPlaceholder": "e.g. 50",
+  "systemPrompt.finetune.selectStartLabel": "Selection Start (character index)",
+  "systemPrompt.finetune.selectStartPlaceholder": "e.g. 10",
+  "systemPrompt.finetune.selectEndLabel": "Selection End (character index)",
+  "systemPrompt.finetune.selectEndPlaceholder": "e.g. 100",
+  "systemPrompt.finetune.selectTip": "Select text in the editor below to get position",
+  "systemPrompt.finetune.positionError": "Please enter a valid position number",
   "systemPrompt.expandEdit.backgroundInfo": "Background Info",
   "systemPrompt.expandEdit.close": "Save & Close",
   "systemPrompt.nonEditing.title": "Please Select an Agent First",
@@ -570,6 +617,7 @@
   "knowledgeBase.tag.createdAt": "Created on {{date}}",
   "knowledgeBase.tag.model": "{{model}} Model",
   "knowledgeBase.tag.modelMismatch": "Model Mismatch",
+  "knowledgeBase.tag.noPreserveSourceFile": "Document copy not preserved",
   "knowledgeBase.upload.modelMismatch.description": "The model of the current knowledge base does not match the configured model, file upload is not allowed, please switch the knowledge base or adjust the model configuration",
   "knowledgeBase.list.empty": "No knowledge bases yet, please create one first",
   "knowledgeBase.list.noResults": "No matching knowledge bases found",
@@ -618,6 +666,7 @@
   "knowledgeBase.name.new": "new_base",
   "knowledgeBase.message.getDocumentsFailed": "Failed to get documents",
   "knowledgeBase.create.permission.groupPlaceholder": "No user group",
+  "knowledgeBase.create.preserveSourceFile": "Preserve document copy",
   "knowledgeBase.ingroup.permission.EDIT": "In Group Read/Write",
   "knowledgeBase.ingroup.permission.READ_ONLY": "In Group Read Only",
   "knowledgeBase.ingroup.permission.PRIVATE": "Personal Private",
@@ -1059,6 +1108,7 @@
   "auth.accessDenied": "You do not have permission to access this page",
   "auth.oauthDivider": "or continue with",
   "auth.oauthLogin": "{{provider}} Login",
+  "auth.casLogin": "{{provider}} Login",
   "auth.oauthLoginFailed": "Third-party login failed: {{error}}",
   "auth.oauthLoginFailedGeneric": "Third-party login failed. Please try again.",
   "auth.oauthCompleteTitle": "Complete Account Setup",
diff --git a/frontend/public/locales/zh/common.json b/frontend/public/locales/zh/common.json
index 114984215..09b8bcd4a 100644
--- a/frontend/public/locales/zh/common.json
+++ b/frontend/public/locales/zh/common.json
@@ -17,6 +17,10 @@
   "filePreview.loadingDocument": "文档加载中...",
   "filePreview.loadingPage": "页面加载中...",
   "filePreview.previewFailed": "文件预览失败",
+  "filePreview.knowledge.accessDenied.title": "无法预览",
+  "filePreview.knowledge.accessDenied.content": "您没有权限访问该文档。",
+  "filePreview.knowledge.noStoredCopy.title": "无法预览",
+  "filePreview.knowledge.noStoredCopy.content": "当前知识库未保存该文档副本，无法预览。",
   "filePreview.emptyFile": "文件内容为空",
   "filePreview.uploadToPreview": "请上传文件后预览",
   "filePreview.download": "下载",
@@ -275,6 +279,13 @@
   "chatStreamHandler.parseMaxStepsDataFailed": "解析最大步数数据失败:",
 
   "taskWindow.maxStepsReached": "已达到最大步数限制（{{completedSteps}} 步），正在总结当前工作...",
+  "taskWindow.verification.start": "正在自检...",
+  "taskWindow.verification.pass": "自检通过",
+  "taskWindow.verification.warning": "自检发现需关注项",
+  "taskWindow.verification.blocked": "自检已阻断当前动作",
+  "taskWindow.verification.repair": "自检未通过，正在修正",
+  "taskWindow.verification.finalPass": "最终自检通过",
+  "taskWindow.verification.finalFail": "最终自检未通过",
   "taskWindow.unknownSource": "未知来源",
   "taskWindow.knowledgeFile": "知识库文件",
   "taskWindow.urlParseError": "URL解析错误:",
@@ -317,6 +328,12 @@
   "agent.contextMenu.copy": "复制",
   "agent.copySuffix": "副本",
   "agent.info.title": "智能体信息",
+  "agent.greeting.tabTitle": "开场白",
+  "agent.greeting.messageTitle": "问候语",
+  "agent.greeting.messagePlaceholder": "请输入智能体问候语，例如：你好！我是你的数据分析助手",
+  "agent.greeting.questionsTitle": "示例问题",
+  "agent.greeting.addQuestion": "添加示例问题",
+  "agent.greeting.removeQuestion": "删除",
   "agent.info.name.error.empty": "名称不能为空",
   "agent.info.name.error.format": "名称只能包含字母、数字和下划线，且必须以字母或下划线开头",
   "agent.info.name.error.length": "名称长度不能超过50个字符",
@@ -329,6 +346,8 @@
   "agent.author.hint": "默认：{{email}}",
   "agent.provideRunSummary": "提供运行摘要",
   "agent.provideRunSummary.error": "请选择是否提供运行摘要",
+  "agent.verification": "自验证",
+  "agent.verification.error": "请选择是否启用自验证",
   "agent.description": "智能体描述",
   "agent.userGroup": "用户组",
   "agent.userGroup.empty": "暂无用户组",
@@ -369,6 +388,10 @@
   "agent.debug.stop": "停止",
   "agent.debug.clear": "清空",
   "agent.debug.send": "发送",
+  "agent.debug.optimizeTitle": "提示词优化",
+  "agent.debug.optimizeHint": "选择一条回复，输入优化反馈，系统将自动优化智能体的完整系统提示词。",
+  "agent.debug.selectedQuestion": "选中的问题",
+  "agent.debug.selectedAnswer": "选中的回复",
   "agent.debug.userStop": "用户手动停止调试",
   "agent.debug.cancelError": "取消请求时出错",
   "agent.debug.stopError": "停止调试模式智能体运行失败，但前端已停止:",
@@ -387,6 +410,11 @@
   "agent.debug.compareEmpty": "暂无输出",
   "agent.debug.defaultMode": "默认模式",
   "agent.debug.compareMode": "对比模式",
+  "agent.debug.promptCompare.title": "提示词对比",
+  "agent.debug.promptCompare.close": "关闭",
+  "agent.debug.promptCompare.apply": "一键替换",
+  "agent.debug.promptCompare.original": "优化前",
+  "agent.debug.promptCompare.optimized": "优化后",
 
   "guide.steps.describeBusinessLogic.title": "描述业务逻辑",
 
@@ -562,6 +590,7 @@
   "knowledgeBase.tag.createdAt": "创建于{{date}}",
   "knowledgeBase.tag.model": "{{model}}模型",
   "knowledgeBase.tag.modelMismatch": "模型不匹配",
+  "knowledgeBase.tag.noPreserveSourceFile": "不保留文档副本",
   "knowledgeBase.upload.modelMismatch.description": "当前知识库的模型与配置模型不匹配，无法上传文件，请切换知识库或调整模型配置",
   "knowledgeBase.list.empty": "暂无知识库，请先创建知识库",
   "knowledgeBase.list.noResults": "没有找到匹配的知识库",
@@ -608,6 +637,7 @@
   "knowledgeBase.name.new": "新知识库",
   "knowledgeBase.message.getDocumentsFailed": "获取文档列表失败",
   "knowledgeBase.create.permission.groupPlaceholder": "无所属用户组",
+  "knowledgeBase.create.preserveSourceFile": "保留文档副本",
   "knowledgeBase.ingroup.permission.EDIT": "同组可编辑",
   "knowledgeBase.ingroup.permission.READ_ONLY": "同组只读",
   "knowledgeBase.ingroup.permission.PRIVATE": "私有",
@@ -1049,6 +1079,7 @@
   "auth.accessDenied": "您没有权限访问此页面",
   "auth.oauthDivider": "或使用第三方登录",
   "auth.oauthLogin": "{{provider}} 登录",
+  "auth.casLogin": "{{provider}} 登录",
   "auth.oauthLoginFailed": "第三方登录失败：{{error}}",
   "auth.oauthLoginFailedGeneric": "第三方登录失败，请重试",
   "auth.oauthCompleteTitle": "补充账号信息",
@@ -2802,5 +2833,16 @@
   "systemPrompt.optimize.optimized": "优化后",
   "systemPrompt.optimize.empty": "暂未生成优化内容",
   "systemPrompt.optimize.replace": "一键替换",
-  "systemPrompt.optimize.error": "该部分优化失败"
+  "systemPrompt.optimize.error": "该部分优化失败",
+  "systemPrompt.optimize.generating": "正在生成优化后的 prompt 模板...",
+  "systemPrompt.optimize.generatingPlaceholder": "正在生成中，请稍候...",
+
+  "systemPrompt.finetune.modeLabel": "使用要求",
+  "systemPrompt.finetune.modeGeneral": "全局优化",
+  "systemPrompt.finetune.modeGeneralDesc": "基于评价反馈对整个部分进行优化",
+  "systemPrompt.finetune.modeInsert": "插入内容",
+  "systemPrompt.finetune.modeInsertDesc": "在指定位置插入新的内容",
+  "systemPrompt.finetune.modeSelect": "替换选中",
+  "systemPrompt.finetune.modeSelectDesc": "替换选中的内容范围"
+
 }
diff --git a/frontend/server.js b/frontend/server.js
index f0e615577..e88304b8b 100644
--- a/frontend/server.js
+++ b/frontend/server.js
@@ -87,14 +87,10 @@ function setAuthCookies(res, session) {
 
   if (session.expires_at) {
     cookies.push(
-      cookie.serialize(
-        COOKIE_NAMES.EXPIRES_AT,
-        String(session.expires_at),
-        {
-          ...buildCookieOptions(false), // readable by frontend JS
-          maxAge: expiresInSeconds, // Same as access token
-        }
-      )
+      cookie.serialize(COOKIE_NAMES.EXPIRES_AT, String(session.expires_at), {
+        ...buildCookieOptions(false), // readable by frontend JS
+        maxAge: expiresInSeconds, // Same as access token
+      })
     );
   }
 
@@ -106,10 +102,19 @@ function setAuthCookies(res, session) {
 function clearAuthCookies(res) {
   const expired = { maxAge: 0, path: "/" };
   res.setHeader("Set-Cookie", [
-    cookie.serialize(COOKIE_NAMES.ACCESS_TOKEN, "", { ...expired, httpOnly: true }),
-    cookie.serialize(COOKIE_NAMES.REFRESH_TOKEN, "", { ...expired, httpOnly: true }),
+    cookie.serialize(COOKIE_NAMES.ACCESS_TOKEN, "", {
+      ...expired,
+      httpOnly: true,
+    }),
+    cookie.serialize(COOKIE_NAMES.REFRESH_TOKEN, "", {
+      ...expired,
+      httpOnly: true,
+    }),
     cookie.serialize(COOKIE_NAMES.EXPIRES_AT, "", expired),
-    cookie.serialize(COOKIE_NAMES.OAUTH_PENDING, "", { ...expired, httpOnly: true }),
+    cookie.serialize(COOKIE_NAMES.OAUTH_PENDING, "", {
+      ...expired,
+      httpOnly: true,
+    }),
   ]);
 }
 
@@ -154,6 +159,12 @@ const AUTH_INTERCEPT_ENDPOINTS = new Set([
   "/api/user/oauth/link",
   "/api/user/oauth/pending",
   "/api/user/oauth/complete",
+  "/api/user/cas/config",
+  "/api/user/cas/login",
+  "/api/user/cas/callback",
+  "/api/user/cas/renew",
+  "/api/user/cas/renew_callback",
+  "/api/user/cas/logout_callback",
 ]);
 
 function collectRequestBody(req) {
@@ -171,8 +182,11 @@ function collectRequestBody(req) {
  * If no refresh_token cookie exists, return 401 immediately.
  */
 function prepareAuthRequestBody(pathname, body, cookies, res) {
-  if (pathname === "/api/user/refresh_token") {
-    const refreshToken = cookies[COOKIE_NAMES.REFRESH_TOKEN];
+  if (
+    pathname === "/api/user/refresh_token" ) {
+    const refreshToken =
+    cookies[COOKIE_NAMES.REFRESH_TOKEN]
+  ;
     if (!refreshToken) {
       res.writeHead(401, { "Content-Type": "application/json" });
       res.end(JSON.stringify({ detail: "No refresh token cookie found" }));
@@ -194,144 +208,204 @@ function forwardAuthRequest(req, res, targetUrl) {
   const transport = parsedTarget.protocol === "https:" ? https : http;
   const cookies = parseCookies(req);
 
-  collectRequestBody(req).then((rawBody) => {
-    const body = prepareAuthRequestBody(req.parsedPathname, rawBody, cookies, res);
+  if (
+    req.parsedPathname === "/api/user/refresh_token" &&
+    !cookies[COOKIE_NAMES.REFRESH_TOKEN]
+  ) {
+    res.writeHead(204);
+    res.end();
+    return;
+  }
+
+  collectRequestBody(req)
+    .then((rawBody) => {
+      const body = prepareAuthRequestBody(req.parsedPathname, rawBody, cookies, res);
 
     // If body is null, prepareAuthRequestBody already sent the error response
     if (body === null) {
       return;
     }
 
-    const forwardHeaders = { ...req.headers, host: parsedTarget.host };
+      const forwardHeaders = { ...req.headers, host: parsedTarget.host };
 
-    // Inject access_token from cookie as Authorization header for the backend
-    if (cookies[COOKIE_NAMES.ACCESS_TOKEN] && !forwardHeaders["authorization"]) {
-      forwardHeaders["authorization"] = `Bearer ${cookies[COOKIE_NAMES.ACCESS_TOKEN]}`;
-    }
+      // Inject access_token from cookie as Authorization header for the backend
+      if (
+        cookies[COOKIE_NAMES.ACCESS_TOKEN] &&
+        !forwardHeaders["authorization"]
+      ) {
+        forwardHeaders["authorization"] =
+          `Bearer ${cookies[COOKIE_NAMES.ACCESS_TOKEN]}`;
+      }
 
-    if (
-      cookies[COOKIE_NAMES.OAUTH_PENDING] &&
-      (req.parsedPathname === "/api/user/oauth/pending" ||
-        req.parsedPathname === "/api/user/oauth/complete")
-    ) {
-      forwardHeaders["x-oauth-pending-token"] = cookies[COOKIE_NAMES.OAUTH_PENDING];
-    }
+      if (
+        cookies[COOKIE_NAMES.OAUTH_PENDING] &&
+        (req.parsedPathname === "/api/user/oauth/pending" ||
+          req.parsedPathname === "/api/user/oauth/complete")
+      ) {
+        forwardHeaders["x-oauth-pending-token"] =
+          cookies[COOKIE_NAMES.OAUTH_PENDING];
+      }
 
-    // Update content-length if body was modified
-    if (body.length !== rawBody.length) {
-      forwardHeaders["content-length"] = String(body.length);
-    }
+      // Update content-length if body was modified
+      if (body.length !== rawBody.length) {
+        forwardHeaders["content-length"] = String(body.length);
+      }
 
-    const options = {
-      hostname: parsedTarget.hostname,
-      port: parsedTarget.port,
-      path: req.url,
-      method: req.method,
-      headers: forwardHeaders,
-    };
-
-    const proxyReq = transport.request(options, (proxyRes) => {
-      const responseChunks = [];
-      proxyRes.on("data", (chunk) => responseChunks.push(chunk));
-      proxyRes.on("end", () => {
-        const responseBody = Buffer.concat(responseChunks);
-        let finalBody = responseBody;
-
-        try {
-          const contentType = proxyRes.headers["content-type"] || "";
-          if (contentType.includes("application/json") && responseBody.length > 0) {
-            const data = JSON.parse(responseBody.toString());
-
-            const isLogout = req.parsedPathname === "/api/user/logout";
-            const isRevoke = req.parsedPathname === "/api/user/revoke";
-
-            if (isLogout || isRevoke) {
-              clearAuthCookies(res);
-            } else if (
-              req.parsedPathname === "/api/user/oauth/callback" &&
-              data.data &&
-              data.data.requires_account_completion &&
-              data.data.pending_token
+      const options = {
+        hostname: parsedTarget.hostname,
+        port: parsedTarget.port,
+        path: req.url,
+        method: req.method,
+        headers: forwardHeaders,
+      };
+
+      const proxyReq = transport.request(options, (proxyRes) => {
+        const responseChunks = [];
+        proxyRes.on("data", (chunk) => responseChunks.push(chunk));
+        proxyRes.on("end", () => {
+          const responseBody = Buffer.concat(responseChunks);
+          let finalBody = responseBody;
+
+          try {
+            const contentType = proxyRes.headers["content-type"] || "";
+            if (
+              contentType.includes("application/json") &&
+              responseBody.length > 0
             ) {
-              setPendingOAuthCookie(res, data.data.pending_token);
-              const locale = getPreferredLocale(cookies);
-              res.writeHead(302, { Location: `/${locale}/oauth/complete` });
-              res.end();
-              return;
-            } else if (data.data && data.data.session) {
-              const session = data.data.session;
-              setAuthCookies(res, session);
-
-              const isOAuthCallback = req.parsedPathname === "/api/user/oauth/callback";
-              if (isOAuthCallback) {
-                res.writeHead(302, { Location: "/" });
+              const data = JSON.parse(responseBody.toString());
+
+              const isLogout = req.parsedPathname === "/api/user/logout";
+              const isRevoke = req.parsedPathname === "/api/user/revoke";
+
+              if (isLogout || isRevoke) {
+                clearAuthCookies(res);
+              } else if (
+                req.parsedPathname === "/api/user/oauth/callback" &&
+                data.data &&
+                data.data.requires_account_completion &&
+                data.data.pending_token
+              ) {
+                setPendingOAuthCookie(res, data.data.pending_token);
+                const locale = getPreferredLocale(cookies);
+                res.writeHead(302, { Location: `/${locale}/oauth/complete` });
+                res.end();
+                return;
+              } else if (data.data && data.data.session) {
+                const session = data.data.session;
+                setAuthCookies(res, session);
+
+                const isOAuthCallback =
+                  req.parsedPathname === "/api/user/oauth/callback";
+                const isCasCallback =
+                  req.parsedPathname === "/api/user/cas/callback";
+                const isCasRenewCallback =
+                  req.parsedPathname === "/api/user/cas/renew_callback";
+                if (isOAuthCallback) {
+                  res.writeHead(302, { Location: "/" });
+                  res.end();
+                  return;
+                }
+                if (isCasCallback) {
+                  res.writeHead(302, {
+                    Location: data.data.redirect_url || "/",
+                  });
+                  res.end();
+                  return;
+                }
+                if (isCasRenewCallback) {
+                  const html = Buffer.from(`<!doctype html><html><body><script>
+window.parent && window.parent.postMessage({ type: "cas-renew-success" }, window.location.origin);
+</script></body></html>`);
+                  const responseHeaders = {
+                    "content-type": "text/html; charset=utf-8",
+                    "content-length": String(html.length),
+                  };
+                  const existingSetCookie = res.getHeader("Set-Cookie") || [];
+                  const cookiesToSend = Array.isArray(existingSetCookie)
+                    ? existingSetCookie
+                    : [existingSetCookie];
+                  if (cookiesToSend.filter(Boolean).length > 0) {
+                    responseHeaders["set-cookie"] =
+                      cookiesToSend.filter(Boolean);
+                  }
+                  res.writeHead(200, responseHeaders);
+                  res.end(html);
+                  return;
+                }
+
+                if (req.parsedPathname === "/api/user/oauth/complete") {
+                  clearPendingOAuthCookie(res);
+                }
+
+                const sanitized = { ...data };
+                sanitized.data = { ...data.data };
+                sanitized.data.session = {
+                  expires_at: session.expires_at,
+                  expires_in_seconds: session.expires_in_seconds,
+                };
+                finalBody = Buffer.from(JSON.stringify(sanitized));
+              } else if (
+                req.parsedPathname === "/api/user/oauth/callback" &&
+                data.data &&
+                data.data.oauth_error
+              ) {
+                const errorParams = new URLSearchParams({
+                  oauth_error: data.data.oauth_error,
+                  oauth_error_description:
+                    data.data.oauth_error_description || "",
+                });
+                res.writeHead(302, { Location: `/?${errorParams.toString()}` });
                 res.end();
                 return;
               }
-
-              if (req.parsedPathname === "/api/user/oauth/complete") {
-                clearPendingOAuthCookie(res);
-              }
-
-              const sanitized = { ...data };
-              sanitized.data = { ...data.data };
-              sanitized.data.session = {
-                expires_at: session.expires_at,
-                expires_in_seconds: session.expires_in_seconds,
-              };
-              finalBody = Buffer.from(JSON.stringify(sanitized));
-            } else if (req.parsedPathname === "/api/user/oauth/callback" && data.data && data.data.oauth_error) {
-              const errorParams = new URLSearchParams({
-                oauth_error: data.data.oauth_error,
-                oauth_error_description: data.data.oauth_error_description || "",
-              });
-              res.writeHead(302, { Location: `/?${errorParams.toString()}` });
-              res.end();
-              return;
             }
+          } catch {
+            // If JSON parsing fails, pass through unchanged
           }
-        } catch {
-          // If JSON parsing fails, pass through unchanged
-        }
 
-        // Copy response headers, but override content-length and set cookies
-        const responseHeaders = { ...proxyRes.headers };
-        responseHeaders["content-length"] = String(finalBody.length);
-        // Merge Set-Cookie: proxyRes cookies + our auth cookies
-        const existingSetCookie = res.getHeader("Set-Cookie") || [];
-        const upstreamSetCookie = proxyRes.headers["set-cookie"] || [];
-        const mergedCookies = [
-          ...(Array.isArray(existingSetCookie) ? existingSetCookie : [existingSetCookie]),
-          ...(Array.isArray(upstreamSetCookie) ? upstreamSetCookie : [upstreamSetCookie]),
-        ].filter(Boolean);
-
-        delete responseHeaders["set-cookie"];
-        if (mergedCookies.length > 0) {
-          responseHeaders["set-cookie"] = mergedCookies;
-        }
+          // Copy response headers, but override content-length and set cookies
+          const responseHeaders = { ...proxyRes.headers };
+          responseHeaders["content-length"] = String(finalBody.length);
+          // Merge Set-Cookie: proxyRes cookies + our auth cookies
+          const existingSetCookie = res.getHeader("Set-Cookie") || [];
+          const upstreamSetCookie = proxyRes.headers["set-cookie"] || [];
+          const mergedCookies = [
+            ...(Array.isArray(existingSetCookie)
+              ? existingSetCookie
+              : [existingSetCookie]),
+            ...(Array.isArray(upstreamSetCookie)
+              ? upstreamSetCookie
+              : [upstreamSetCookie]),
+          ].filter(Boolean);
+
+          delete responseHeaders["set-cookie"];
+          if (mergedCookies.length > 0) {
+            responseHeaders["set-cookie"] = mergedCookies;
+          }
 
-        res.writeHead(proxyRes.statusCode, responseHeaders);
-        res.end(finalBody);
+          res.writeHead(proxyRes.statusCode, responseHeaders);
+          res.end(finalBody);
+        });
+      });
+
+      proxyReq.on("error", (err) => {
+        console.error("[Auth Proxy] Forward error:", err.message);
+        if (!res.headersSent) {
+          res.writeHead(502, { "Content-Type": "application/json" });
+          res.end(JSON.stringify({ detail: "Backend unavailable" }));
+        }
       });
-    });
 
-    proxyReq.on("error", (err) => {
-      console.error("[Auth Proxy] Forward error:", err.message);
+      proxyReq.write(body);
+      proxyReq.end();
+    })
+    .catch((err) => {
+      console.error("[Auth Proxy] Body read error:", err.message);
       if (!res.headersSent) {
-        res.writeHead(502, { "Content-Type": "application/json" });
-        res.end(JSON.stringify({ detail: "Backend unavailable" }));
+        res.writeHead(500, { "Content-Type": "application/json" });
+        res.end(JSON.stringify({ detail: "Internal proxy error" }));
       }
     });
-
-    proxyReq.write(body);
-    proxyReq.end();
-  }).catch((err) => {
-    console.error("[Auth Proxy] Body read error:", err.message);
-    if (!res.headersSent) {
-      res.writeHead(500, { "Content-Type": "application/json" });
-      res.end(JSON.stringify({ detail: "Internal proxy error" }));
-    }
-  });
 }
 
 // ============================================================================
@@ -339,8 +413,14 @@ function forwardAuthRequest(req, res, targetUrl) {
 // ============================================================================
 proxy.on("proxyReq", (proxyReq, req) => {
   const cookies = parseCookies(req);
-  if (cookies[COOKIE_NAMES.ACCESS_TOKEN] && !proxyReq.getHeader("authorization")) {
-    proxyReq.setHeader("Authorization", `Bearer ${cookies[COOKIE_NAMES.ACCESS_TOKEN]}`);
+  if (
+    cookies[COOKIE_NAMES.ACCESS_TOKEN] &&
+    !proxyReq.getHeader("authorization")
+  ) {
+    proxyReq.setHeader(
+      "Authorization",
+      `Bearer ${cookies[COOKIE_NAMES.ACCESS_TOKEN]}`
+    );
   }
 });
 
@@ -375,12 +455,18 @@ app.prepare().then(() => {
           pathname.startsWith("/api/file/storage") ||
           pathname.startsWith("/api/file/preprocess");
         if (isRuntime) {
-          proxy.web(req, res, { target: RUNTIME_HTTP_BACKEND, changeOrigin: true });
+          proxy.web(req, res, {
+            target: RUNTIME_HTTP_BACKEND,
+            changeOrigin: true,
+          });
         } else if (
           pathname === "/api/skills/create" ||
           pathname.startsWith("/api/skills/stop/")
         ) {
-          proxy.web(req, res, { target: RUNTIME_HTTP_BACKEND, changeOrigin: true });
+          proxy.web(req, res, {
+            target: RUNTIME_HTTP_BACKEND,
+            changeOrigin: true,
+          });
         } else {
           proxy.web(req, res, { target: HTTP_BACKEND, changeOrigin: true });
         }
diff --git a/frontend/services/agentConfigService.ts b/frontend/services/agentConfigService.ts
index 8e0f9da0d..a955aa410 100644
--- a/frontend/services/agentConfigService.ts
+++ b/frontend/services/agentConfigService.ts
@@ -200,7 +200,9 @@ export const fetchPublishedAgentList = async () => {
       group_ids: agent.group_ids || [],
       is_new: agent.is_new || false,
       permission: agent.permission,
-      published_version_no: agent.published_version_no,
+      current_version_no: agent.current_version_no,
+      greeting_message: agent.greeting_message,
+      example_questions: agent.example_questions || [],
     }));
 
     return {
@@ -407,6 +409,7 @@ export interface UpdateAgentInfoPayload {
   max_steps?: number;
   provide_run_summary?: boolean;
   enable_context_manager?: boolean;
+  verification_config?: Record<string, any>;
   enabled?: boolean;
   business_description?: string;
   business_logic_model_name?: string;
@@ -418,6 +421,8 @@ export interface UpdateAgentInfoPayload {
   related_agent_ids?: number[];
   related_external_agent_ids?: number[];
   ingroup_permission?: string;
+  greeting_message?: string;
+  example_questions?: string[];
 }
 
 export const updateAgentInfo = async (payload: UpdateAgentInfoPayload) => {
@@ -769,6 +774,7 @@ export const searchAgentInfo = async (
       prompt_template_id: data.prompt_template_id ?? 0,
       prompt_template_name: data.prompt_template_name ?? "system_default",
       provide_run_summary: data.provide_run_summary,
+      verification_config: data.verification_config,
       enabled: data.enabled,
       is_available: data.is_available,
       unavailable_reasons: data.unavailable_reasons || [],
@@ -806,6 +812,8 @@ export const searchAgentInfo = async (
           })
         : [],
       skills: data.skills || [],
+      greeting_message: data.greeting_message || "",
+      example_questions: data.example_questions || [],
       current_version_no: data.current_version_no,
     };
 
diff --git a/frontend/services/agentVersionService.ts b/frontend/services/agentVersionService.ts
index 31dec3eb0..d520e05cb 100644
--- a/frontend/services/agentVersionService.ts
+++ b/frontend/services/agentVersionService.ts
@@ -33,6 +33,7 @@ export interface Agent {
   tenant_id: string;
   enabled: boolean;
   provide_run_summary: boolean;
+  verification_config?: Record<string, any>;
   business_description?: string;
   business_logic_model_name?: string;
   business_logic_model_id?: number;
@@ -547,4 +548,4 @@ export async function updateVersion(
       message: error instanceof Error ? error.message : "Failed to update version",
     };
   }
-}
\ No newline at end of file
+}
diff --git a/frontend/services/api.ts b/frontend/services/api.ts
index 490b3c56d..ef8b97ff4 100644
--- a/frontend/services/api.ts
+++ b/frontend/services/api.ts
@@ -30,6 +30,11 @@ export const API_ENDPOINTS = {
     accounts: `${API_BASE_URL}/user/oauth/accounts`,
     unlink: (provider: string) => `${API_BASE_URL}/user/oauth/accounts/${provider}`,
   },
+  cas: {
+    config: `${API_BASE_URL}/user/cas/config`,
+    login: `${API_BASE_URL}/user/cas/login`,
+    renew: `${API_BASE_URL}/user/cas/renew`,
+  },
   conversation: {
     list: `${API_BASE_URL}/conversation/list`,
     create: `${API_BASE_URL}/conversation/create`,
diff --git a/frontend/services/authService.ts b/frontend/services/authService.ts
index 1735adc1a..7589622b4 100644
--- a/frontend/services/authService.ts
+++ b/frontend/services/authService.ts
@@ -14,6 +14,7 @@ import { ASSET_OWNER_TENANT_ID, STATUS_CODES, USER_ROLES } from "@/const/auth";
 
 import { generateAvatarUrl } from "@/lib/auth";
 import { fetchWithAuth } from "@/lib/auth";
+import { authFlowState } from "@/lib/authFlow";
 import {
   removeSessionFromStorage,
   getSessionFromStorage,
@@ -162,7 +163,9 @@ export const authService = {
       return {
         error: {
           message:
-            error instanceof Error ? error.message : "Network error, please try again later",
+            error instanceof Error
+              ? error.message
+              : "Network error, please try again later",
           code:
             error instanceof Error && "code" in error
               ? (error as any).code
@@ -268,19 +271,29 @@ export const authService = {
   },
 
   signOut: async (): Promise<{ error: null }> => {
+    authFlowState.beginExplicitLogout();
     try {
-      await fetchWithAuth(API_ENDPOINTS.user.logout, {
+      const response = await fetchWithAuth(API_ENDPOINTS.user.logout, {
         method: "POST",
+        keepalive: true,
       });
+      const data = await response.json().catch(() => null);
+      const casLogoutUrl = data?.data?.cas_logout_url;
 
       // server.js clears HttpOnly cookies; clear local user info
       removeSessionFromStorage();
+      if (casLogoutUrl && typeof window !== "undefined") {
+        window.location.href = casLogoutUrl;
+      } else {
+        authFlowState.endExplicitLogout();
+      }
 
       return { error: null };
     } catch (error) {
       log.error("Logout failed:", error);
 
       removeSessionFromStorage();
+      authFlowState.endExplicitLogout();
 
       return { error: null };
     }
@@ -331,11 +344,16 @@ export const authService = {
           ),
           email: data.data.user.user_email,
           role: data.data.user.user_role,
+          authProvider: data.data.user.auth_provider,
           avatarUrl: data.data.user.avatarUrl,
-          permissions: data.data.user.permissions.map((permission:string) => permission.toLowerCase()),
-          accessibleRoutes: data.data.user.accessibleRoutes.map((router:string) => router.toLowerCase()),
-        }
-      }
+          permissions: data.data.user.permissions.map((permission: string) =>
+            permission.toLowerCase()
+          ),
+          accessibleRoutes: data.data.user.accessibleRoutes.map(
+            (router: string) => router.toLowerCase()
+          ),
+        },
+      };
       return userData as AuthInfoResponse;
     } catch (error) {
       log.error("Failed to get user Info:", error);
@@ -374,7 +392,9 @@ export const authService = {
       if (errorCode === ErrorCode.INVALID_CREDENTIALS) {
         return {
           errorCode: ErrorCode.INVALID_CREDENTIALS,
-          error: error?.message || getI18nErrorMessage(ErrorCode.INVALID_CREDENTIALS),
+          error:
+            error?.message ||
+            getI18nErrorMessage(ErrorCode.INVALID_CREDENTIALS),
         };
       }
       if (errorCode === ErrorCode.PASSWORD_WEAK) {
@@ -386,7 +406,9 @@ export const authService = {
       if (errorCode === ErrorCode.PASSWORD_SAME_AS_OLD) {
         return {
           errorCode: ErrorCode.PASSWORD_SAME_AS_OLD,
-          error: error?.message || getI18nErrorMessage(ErrorCode.PASSWORD_SAME_AS_OLD),
+          error:
+            error?.message ||
+            getI18nErrorMessage(ErrorCode.PASSWORD_SAME_AS_OLD),
         };
       }
 
diff --git a/frontend/services/casService.ts b/frontend/services/casService.ts
new file mode 100644
index 000000000..2c2dd2cb0
--- /dev/null
+++ b/frontend/services/casService.ts
@@ -0,0 +1,69 @@
+import { API_ENDPOINTS } from "@/services/api";
+import log from "@/lib/logger";
+
+export interface CasConfig {
+  enabled: boolean;
+  login_mode: "button" | "force" | "disabled";
+  renew_before_seconds: number;
+  renew_timeout_seconds: number;
+  display_name: string;
+}
+
+const disabledConfig: CasConfig = {
+  enabled: false,
+  login_mode: "disabled",
+  renew_before_seconds: 300,
+  renew_timeout_seconds: 10,
+  display_name: "CAS",
+};
+
+export const casService = {
+  getConfig: async (): Promise<CasConfig> => {
+    try {
+      const response = await fetch(API_ENDPOINTS.cas.config);
+      if (!response.ok) return disabledConfig;
+      const data = await response.json();
+      return { ...disabledConfig, ...(data.data || {}) };
+    } catch (error) {
+      log.warn("Failed to fetch CAS config:", error);
+      return disabledConfig;
+    }
+  },
+
+  startLogin: (redirect?: string): void => {
+    const target = redirect || window.location.pathname + window.location.search;
+    window.location.href = `${API_ENDPOINTS.cas.login}?redirect=${encodeURIComponent(target)}`;
+  },
+
+  renewInIframe: (timeoutSeconds: number): Promise<boolean> => {
+    if (typeof window === "undefined") return Promise.resolve(false);
+
+    return new Promise((resolve) => {
+      const iframe = document.createElement("iframe");
+      iframe.src = API_ENDPOINTS.cas.renew;
+      iframe.style.display = "none";
+      iframe.setAttribute("aria-hidden", "true");
+
+      let settled = false;
+      const cleanup = () => {
+        window.removeEventListener("message", onMessage);
+        iframe.remove();
+      };
+      const finish = (ok: boolean) => {
+        if (settled) return;
+        settled = true;
+        cleanup();
+        resolve(ok);
+      };
+      const onMessage = (event: MessageEvent) => {
+        if (event.origin !== window.location.origin) return;
+        if (event.data?.type === "cas-renew-success") finish(true);
+        if (event.data?.type === "cas-renew-failed") finish(false);
+      };
+
+      window.addEventListener("message", onMessage);
+      document.body.appendChild(iframe);
+      window.setTimeout(() => finish(false), Math.max(1, timeoutSeconds) * 1000);
+    });
+  },
+};
diff --git a/frontend/services/knowledgeBaseService.ts b/frontend/services/knowledgeBaseService.ts
index bd13de32d..da760e0bf 100644
--- a/frontend/services/knowledgeBaseService.ts
+++ b/frontend/services/knowledgeBaseService.ts
@@ -155,7 +155,10 @@ class KnowledgeBaseService {
     userId: string
   ): Promise<Array<{ id: string; name: string }>> {
     try {
-      const url = new URL(API_ENDPOINTS.idata.knowledgeSpaces, window.location.origin);
+      const url = new URL(
+        API_ENDPOINTS.idata.knowledgeSpaces,
+        window.location.origin
+      );
       url.searchParams.set("idata_api_base", idataApiBase);
       url.searchParams.set("api_key", apiKey);
       url.searchParams.set("user_id", userId);
@@ -170,8 +173,12 @@ class KnowledgeBaseService {
       // Check for error response from middleware (has code field)
       if (result.code !== undefined && result.code !== 0) {
         const errorCode = result.code || response.status;
-        const errorMessage = result.message || "Failed to fetch iData knowledge spaces";
-        log.error("iData API error:", { code: errorCode, message: errorMessage });
+        const errorMessage =
+          result.message || "Failed to fetch iData knowledge spaces";
+        log.error("iData API error:", {
+          code: errorCode,
+          message: errorMessage,
+        });
         throw new ApiError(errorCode, errorMessage);
       }
 
@@ -212,7 +219,10 @@ class KnowledgeBaseService {
       if (result.code !== undefined && result.code !== 0) {
         const errorCode = result.code || response.status;
         const errorMessage = result.message || "Failed to fetch iData datasets";
-        log.error("iData API error:", { code: errorCode, message: errorMessage });
+        log.error("iData API error:", {
+          code: errorCode,
+          message: errorMessage,
+        });
         throw new ApiError(errorCode, errorMessage);
       }
 
@@ -367,7 +377,10 @@ class KnowledgeBaseService {
   /**
    * Fetch Haotian knowledge sets via backend proxy.
    */
-  async getHaotianKnowledgeSets(listUrl: string, externalAuthorization: string): Promise<{
+  async getHaotianKnowledgeSets(
+    listUrl: string,
+    externalAuthorization: string
+  ): Promise<{
     knowledge_sets: Array<{
       name: string;
       knowledge_bases: Array<{ dify_dataset_id: string; name: string }>;
@@ -394,7 +407,10 @@ class KnowledgeBaseService {
   /**
    * Test Haotian connection via backend proxy.
    */
-  async testHaotianConnection(listUrl: string, externalAuthorization: string): Promise<{
+  async testHaotianConnection(
+    listUrl: string,
+    externalAuthorization: string
+  ): Promise<{
     success: boolean;
     error?: string;
   }> {
@@ -416,7 +432,8 @@ class KnowledgeBaseService {
     } catch (error) {
       return {
         success: false,
-        error: error instanceof Error ? error.message : "Connection test failed",
+        error:
+          error instanceof Error ? error.message : "Connection test failed",
       };
     }
   }
@@ -561,7 +578,10 @@ class KnowledgeBaseService {
                       null,
                     is_multimodal: resolveIsMultimodal(indexInfo, stats),
                     // Use embedding_model_name (display_name) from backend, fallback to ES stats
-                    embeddingModel: indexInfo.embedding_model_name || stats.embedding_model || "unknown",
+                    embeddingModel:
+                      indexInfo.embedding_model_name ||
+                      stats.embedding_model ||
+                      "unknown",
                     summaryFrequency: indexInfo.summary_frequency || null,
                     lastSummaryTime: indexInfo.last_summary_time || null,
                     knowledge_sources:
@@ -579,6 +599,7 @@ class KnowledgeBaseService {
                     tokenNum: 0,
                     source: "nexent",
                     tenant_id: indexInfo.tenant_id,
+                    preserve_source_file: indexInfo.preserve_source_file ?? true,
                   };
                 }
               );
@@ -758,6 +779,7 @@ class KnowledgeBaseService {
         ingroup_permission?: string;
         group_ids?: number[];
         is_multimodal?: boolean;
+        preserve_source_file?: boolean;
       } = {
         name: params.name,
         description: params.description || "",
@@ -772,6 +794,9 @@ class KnowledgeBaseService {
       if (params.group_ids && params.group_ids.length > 0) {
         requestBody.group_ids = params.group_ids;
       }
+      if (params.preserve_source_file !== undefined) {
+        requestBody.preserve_source_file = params.preserve_source_file;
+      }
 
       const response = await fetch(
         API_ENDPOINTS.knowledgeBase.indexDetail(params.name),
@@ -1525,9 +1550,7 @@ class KnowledgeBaseService {
   }
 
   // Embedding model status and configuration
-  async getEmbeddingModelStatus(
-    indexName: string
-  ): Promise<{
+  async getEmbeddingModelStatus(indexName: string): Promise<{
     status: "configured" | "legacy" | "missing";
     needs_config: boolean;
     index_name: string;
@@ -1554,7 +1577,9 @@ class KnowledgeBaseService {
         const errorData = await response.json().catch(() => ({}));
         throw new ApiError(
           response.status,
-          errorData.detail || errorData.message || "Failed to get embedding model status"
+          errorData.detail ||
+            errorData.message ||
+            "Failed to get embedding model status"
         );
       }
 
diff --git a/frontend/services/promptService.ts b/frontend/services/promptService.ts
index 2899fd370..399511a72 100644
--- a/frontend/services/promptService.ts
+++ b/frontend/services/promptService.ts
@@ -4,6 +4,8 @@ import {
   GeneratePromptParams,
   OptimizePromptSectionParams,
   OptimizePromptSectionResponse,
+  OptimizePromptBadCaseParams,
+  OptimizePromptBadCaseResponse,
   StreamResponseData,
 } from '@/types/agentConfig';
 import { fetchWithAuth, getAuthHeaders } from '@/lib/auth';
@@ -81,3 +83,5 @@ export const optimizePromptSection = async (
   const result = await response.json();
   return result.data as OptimizePromptSectionResponse;
 };
+
+// optimizePromptBadCase removed: badcase optimization is now fully automated in agent debug.
diff --git a/frontend/services/sessionService.ts b/frontend/services/sessionService.ts
index 273f3c9bd..817eede03 100644
--- a/frontend/services/sessionService.ts
+++ b/frontend/services/sessionService.ts
@@ -26,6 +26,10 @@ export const sessionService = {
         body: JSON.stringify({}),
       });
 
+      if (response.status === 204) {
+        return null;
+      }
+
       if (!response.ok) {
         return null;
       }
diff --git a/frontend/stores/agentConfigStore.ts b/frontend/stores/agentConfigStore.ts
index bdbf54cac..e1a1b9545 100644
--- a/frontend/stores/agentConfigStore.ts
+++ b/frontend/stores/agentConfigStore.ts
@@ -10,7 +10,13 @@
 
 import { create } from "zustand";
 
-import { Agent, Tool, AgentConfigUpdate, Skill } from "@/types/agentConfig";
+import {
+  Agent,
+  Tool,
+  AgentConfigUpdate,
+  Skill,
+  DEFAULT_AGENT_VERIFICATION_CONFIG,
+} from "@/types/agentConfig";
 import { getAgentGenerationCache } from "@/lib/agentGenerationCache";
 
 /**
@@ -38,9 +44,12 @@ export type EditableAgent = Pick<
   | "business_logic_model_id"
   | "prompt_template_id"
   | "prompt_template_name"
+  | "verification_config"
   | "sub_agent_id_list"
   | "group_ids"
   | "ingroup_permission"
+  | "greeting_message"
+  | "example_questions"
 > & {
   skills: Skill[];
   external_sub_agent_id_list?: number[];
@@ -168,9 +177,12 @@ function createEmptyEditableAgent(llmConfig?: { id: number | null; name: string;
     business_logic_model_id: llmConfig?.id || 0,
     prompt_template_id: 0,
     prompt_template_name: "system_default",
+    verification_config: { ...DEFAULT_AGENT_VERIFICATION_CONFIG },
     sub_agent_id_list: [],
     group_ids: [],
     ingroup_permission: "READ_ONLY",
+    greeting_message: "",
+    example_questions: [],
   };
 }
 
@@ -197,11 +209,14 @@ const toEditable = (agent: Agent | null): EditableAgent =>
         business_logic_model_id: agent.business_logic_model_id || 0,
         prompt_template_id: agent.prompt_template_id ?? 0,
         prompt_template_name: agent.prompt_template_name || "system_default",
+        verification_config: agent.verification_config || { ...DEFAULT_AGENT_VERIFICATION_CONFIG },
         sub_agent_id_list: agent.sub_agent_id_list || [],
         external_sub_agent_id_list: agent.external_sub_agent_id_list || [],
         group_ids: agent.group_ids || [],
         ingroup_permission: agent.ingroup_permission || "READ_ONLY",
         prompts_hidden: agent.prompts_hidden,
+        greeting_message: agent.greeting_message || "",
+        example_questions: agent.example_questions || [],
       }
     : { ...emptyEditableAgent };
 
@@ -312,12 +327,16 @@ const isDirty = (
       editedAgent.business_logic_model_id !== 0 ||
       (editedAgent.prompt_template_id ?? 0) !== 0 ||
       (editedAgent.prompt_template_name || "system_default") !== "system_default" ||
+      JSON.stringify(editedAgent.verification_config || DEFAULT_AGENT_VERIFICATION_CONFIG) !==
+        JSON.stringify(DEFAULT_AGENT_VERIFICATION_CONFIG) ||
       normalizeArray(editedAgent.group_ids || []).length > 0 ||
       normalizeArray(editedAgent.sub_agent_id_list || []).length > 0 ||
       normalizeArray(editedAgent.external_sub_agent_id_list || []).length > 0 ||
       editedAgent.tools.length > 0 ||
       editedAgent.skills.length > 0 ||
-      editedAgent.ingroup_permission !== "READ_ONLY"
+      editedAgent.ingroup_permission !== "READ_ONLY" ||
+      editedAgent.greeting_message !== "" ||
+      (editedAgent.example_questions || []).length > 0
     );
   }
 
@@ -338,6 +357,8 @@ const isDirty = (
     baselineAgent.business_logic_model_id !== editedAgent.business_logic_model_id ||
     (baselineAgent.prompt_template_id ?? 0) !== (editedAgent.prompt_template_id ?? 0) ||
     (baselineAgent.prompt_template_name || "system_default") !== (editedAgent.prompt_template_name || "system_default") ||
+    JSON.stringify(baselineAgent.verification_config || DEFAULT_AGENT_VERIFICATION_CONFIG) !==
+      JSON.stringify(editedAgent.verification_config || DEFAULT_AGENT_VERIFICATION_CONFIG) ||
     JSON.stringify(normalizeArray(baselineAgent.group_ids ?? [])) !==
       JSON.stringify(normalizeArray(editedAgent.group_ids ?? [])) ||
     JSON.stringify(normalizeArray(baselineAgent.sub_agent_id_list ?? [])) !==
@@ -346,7 +367,9 @@ const isDirty = (
       JSON.stringify(normalizeArray(editedAgent.external_sub_agent_id_list ?? [])) ||
     isToolsDirty(baselineAgent.tools, editedAgent.tools) ||
     isSkillsDirty(baselineAgent.skills, editedAgent.skills) ||
-    baselineAgent.ingroup_permission !== editedAgent.ingroup_permission
+    baselineAgent.ingroup_permission !== editedAgent.ingroup_permission ||
+    baselineAgent.greeting_message !== editedAgent.greeting_message ||
+    JSON.stringify(baselineAgent.example_questions ?? []) !== JSON.stringify(editedAgent.example_questions ?? [])
   );
 };
 
@@ -384,6 +407,12 @@ export const useAgentConfigStore = create<AgentConfigStoreState>((set, get) => (
         if (cached.dutyPrompt) cacheUpdates.duty_prompt = cached.dutyPrompt;
         if (cached.constraintPrompt) cacheUpdates.constraint_prompt = cached.constraintPrompt;
         if (cached.fewShotsPrompt) cacheUpdates.few_shots_prompt = cached.fewShotsPrompt;
+        if (cached.greetingMessage) cacheUpdates.greeting_message = cached.greetingMessage;
+        if (cached.exampleQuestions) {
+          cacheUpdates.example_questions = typeof cached.exampleQuestions === "string"
+            ? (() => { try { return JSON.parse(cached.exampleQuestions); } catch { return []; } })()
+            : cached.exampleQuestions;
+        }
         
         // Only restore agent metadata if not already set in baseline
         if (cached.agentName && !editedAgent.name) cacheUpdates.name = cached.agentName;
@@ -508,4 +537,3 @@ export const useAgentConfigStore = create<AgentConfigStoreState>((set, get) => (
     return get().baselineAgent;
   },
 }));
-
diff --git a/frontend/types/agentConfig.ts b/frontend/types/agentConfig.ts
index 0287fbff9..e717da7cd 100644
--- a/frontend/types/agentConfig.ts
+++ b/frontend/types/agentConfig.ts
@@ -24,10 +24,51 @@ export type AgentConfigUpdate = Partial<Pick<
   | "business_logic_model_name"
   | "prompt_template_id"
   | "prompt_template_name"
+  | "verification_config"
   | "group_ids"
   | "ingroup_permission"
+  | "greeting_message"
+  | "example_questions"
 >>;
 
+export interface AgentVerificationConfig {
+  enabled: boolean;
+  step_verification_enabled: boolean;
+  final_verification_enabled: boolean;
+  llm_verification_enabled?: boolean;
+  max_final_rounds: number;
+  strictness: "lenient" | "balanced" | "strict";
+  fail_policy: "repair_then_controlled_summary" | "warn";
+  pass_score?: number;
+  critical_events: Array<
+    | "tool_precheck"
+    | "tool_result"
+    | "retrieval"
+    | "code_execution"
+    | "handoff"
+    | "final_answer"
+  >;
+}
+
+export const DEFAULT_AGENT_VERIFICATION_CONFIG: AgentVerificationConfig = {
+  enabled: true,
+  step_verification_enabled: true,
+  final_verification_enabled: true,
+  llm_verification_enabled: true,
+  max_final_rounds: 2,
+  strictness: "balanced",
+  fail_policy: "repair_then_controlled_summary",
+  pass_score: 0.75,
+  critical_events: [
+    "tool_precheck",
+    "tool_result",
+    "retrieval",
+    "code_execution",
+    "handoff",
+    "final_answer",
+  ],
+};
+
 // ========== Core Interfaces ==========
 
 export interface Agent {
@@ -42,6 +83,7 @@ export interface Agent {
   max_step: number;
   provide_run_summary: boolean;
   enable_context_manager?: boolean;
+  verification_config?: AgentVerificationConfig;
   tools: Tool[];
   skills?: Skill[];  // Skills configured for this agent
   duty_prompt?: string;
@@ -67,6 +109,8 @@ export interface Agent {
   prompts_hidden?: boolean;
   current_version_no?: number;
   is_a2a_server?: boolean;
+  greeting_message?: string;
+  example_questions?: string[];
 }
 
 export interface Tool {
@@ -460,11 +504,14 @@ export interface GeneratePromptParams {
 export interface OptimizePromptSectionParams {
   agent_id: number;
   task_description: string;
-  model_id: string;
+  model_id: number;
   section_type: "duty" | "constraint" | "few_shots";
   section_title: string;
   current_content: string;
   feedback: string;
+  mode?: "general" | "insert" | "select";
+  start_pos?: number;
+  end_pos?: number;
   tool_ids?: number[];
   sub_agent_ids?: number[];
   knowledge_base_display_names?: string[];
@@ -477,6 +524,32 @@ export interface OptimizePromptSectionResponse {
   optimized_content: string;
 }
 
+export interface BadCaseItem {
+  question: string;
+  answer: string;
+  label?: string;
+  reason?: string;
+}
+
+export interface OptimizePromptBadCaseParams {
+  agent_id: number;
+  model_id: number;
+  current_content: string;
+  bad_cases: BadCaseItem[];
+  section_type: string;
+  section_title: string;
+  tool_ids?: number[];
+  sub_agent_ids?: number[];
+  knowledge_base_display_names?: string[];
+}
+
+export interface OptimizePromptBadCaseResponse {
+  section_type: string;
+  section_title: string;
+  original_content: string;
+  optimized_content: string;
+}
+
 /**
  * Stream Response Data Structure
  */
diff --git a/frontend/types/auth.ts b/frontend/types/auth.ts
index 69d0d436c..f7781e6eb 100644
--- a/frontend/types/auth.ts
+++ b/frontend/types/auth.ts
@@ -9,6 +9,7 @@ export interface User {
   role: UserRole;
   avatarUrl?: string;
   tenantId?: string;
+  authProvider?: "local" | "cas";
 }
 
 // Session type definition
diff --git a/frontend/types/chat.ts b/frontend/types/chat.ts
index dca79e3dc..60778e98c 100644
--- a/frontend/types/chat.ts
+++ b/frontend/types/chat.ts
@@ -36,11 +36,12 @@ export interface StepContent {
         typeof chatConfig.messageTypes.VIRTUAL |
         typeof chatConfig.messageTypes.MEMORY_SEARCH |
         typeof chatConfig.messageTypes.PREPROCESS |
+        typeof chatConfig.messageTypes.VERIFICATION |
         typeof chatConfig.messageTypes.MAX_STEPS_REACHED
   content: string
   expanded: boolean
   timestamp: number
-  subType?: "thinking" | "code" | "deep_thinking" | "progress" | "file_processed" | "truncation" | "complete" | "error"
+  subType?: "thinking" | "code" | "deep_thinking" | "progress" | "file_processed" | "truncation" | "complete" | "error" | "verification"
   isLoading?: boolean
   _preserve?: boolean
   _messageContainer?: {
@@ -74,7 +75,7 @@ metrics: TokenMetrics | null
 
 export interface ChatAgentSelectorProps {
   selectedAgentId: string | null;
-  onAgentSelect: (agentId: string | null) => void;
+  onAgentSelect: (agentId: string | null, greetingMessage?: string, exampleQuestions?: string[]) => void;
   disabled?: boolean;
   isInitialMode?: boolean;
 }
@@ -139,6 +140,7 @@ type LocalFilePreviewSource = {
 export type FilePreviewProps = {
   open: boolean;
   onClose: () => void;
+  previewContext?: 'knowledgeBase';
 } & (RemoteFilePreviewSource | LocalFilePreviewSource);
 
 // Main chat message type
@@ -204,9 +206,11 @@ export interface ChatStreamMainProps {
   currentConversationId?: number;
   shouldScrollToBottom?: boolean;
   selectedAgentId?: string | null;
-  onAgentSelect?: (agentId: string | null) => void;
+  onAgentSelect?: (agentId: string | null, greetingMessage?: string, exampleQuestions?: string[]) => void;
   onCitationHover?: () => void;
   onScroll?: () => void;
+  agentGreeting?: string | null;
+  agentExampleQuestions?: string[];
 }
 
 // Card item type for task window
diff --git a/frontend/types/knowledgeBase.ts b/frontend/types/knowledgeBase.ts
index 7caf4986c..ed32fad3d 100644
--- a/frontend/types/knowledgeBase.ts
+++ b/frontend/types/knowledgeBase.ts
@@ -37,6 +37,7 @@ export interface KnowledgeBase {
   tenant_id?: string;
   summaryFrequency?: string | null;
   lastSummaryTime?: string | null;
+  preserve_source_file?: boolean;
 }
 
 // Create knowledge base parameter type
@@ -49,6 +50,7 @@ export interface KnowledgeBaseCreateParams {
   ingroup_permission?: string;
   group_ids?: number[];
   is_multimodal?: boolean;
+  preserve_source_file?: boolean;
 }
 
 // Document type
diff --git a/k8s/helm/deploy.sh b/k8s/helm/deploy.sh
index 7a583307d..07522d22c 100755
--- a/k8s/helm/deploy.sh
+++ b/k8s/helm/deploy.sh
@@ -611,7 +611,7 @@ apply() {
                 sleep 5
                 for svc in $backend_services; do
                     echo "  Waiting for nexent-$svc..."
-                    if kubectl wait --for=condition=ready pod -l app=nexent-$svc -n $NAMESPACE --timeout=300s 2>/dev/null; then
+                    if kubectl rollout status "deployment/nexent-$svc" -n "$NAMESPACE" --timeout=300s >/dev/null 2>&1; then
                         echo "  nexent-$svc is ready."
                     else
                         echo "  Error: nexent-$svc did not become ready within timeout."
diff --git a/k8s/helm/nexent/charts/nexent-common/files/init.sql b/k8s/helm/nexent/charts/nexent-common/files/init.sql
index f27f2ad85..399c50917 100644
--- a/k8s/helm/nexent/charts/nexent-common/files/init.sql
+++ b/k8s/helm/nexent/charts/nexent-common/files/init.sql
@@ -337,9 +337,12 @@ CREATE TABLE IF NOT EXISTS nexent.ag_tenant_agent_t (
     is_new BOOLEAN DEFAULT FALSE,
     provide_run_summary BOOLEAN DEFAULT FALSE,
     enable_context_manager BOOLEAN DEFAULT FALSE,
+    verification_config JSONB,
     version_no INTEGER DEFAULT 0 NOT NULL,
     current_version_no INTEGER NULL,
     ingroup_permission VARCHAR(30),
+    greeting_message TEXT,
+    example_questions JSONB,
     create_time TIMESTAMP WITHOUT TIME ZONE DEFAULT CURRENT_TIMESTAMP,
     update_time TIMESTAMP WITHOUT TIME ZONE DEFAULT CURRENT_TIMESTAMP,
     created_by VARCHAR(100),
@@ -397,6 +400,9 @@ COMMENT ON COLUMN nexent.ag_tenant_agent_t.version_no IS 'Version number. 0 = dr
 COMMENT ON COLUMN nexent.ag_tenant_agent_t.current_version_no IS 'Current published version number. NULL means no version published yet';
 COMMENT ON COLUMN nexent.ag_tenant_agent_t.ingroup_permission IS 'In-group permission: EDIT, READ_ONLY, PRIVATE';
 COMMENT ON COLUMN nexent.ag_tenant_agent_t.enable_context_manager IS 'Whether to enable context management (compression) for this agent';
+COMMENT ON COLUMN nexent.ag_tenant_agent_t.verification_config IS 'Layered ReAct self-verification configuration';
+COMMENT ON COLUMN nexent.ag_tenant_agent_t.greeting_message IS 'Agent greeting message displayed on chat initial screen';
+COMMENT ON COLUMN nexent.ag_tenant_agent_t.example_questions IS 'List of example questions for starting a conversation with this agent';
 
 -- Create index for is_new queries
 CREATE INDEX IF NOT EXISTS idx_ag_tenant_agent_t_is_new
@@ -1862,3 +1868,238 @@ FOR EACH ROW
 EXECUTE FUNCTION update_mcp_community_record_update_time();
 
 COMMENT ON TRIGGER update_mcp_community_record_update_time_trigger ON nexent.mcp_community_record_t IS 'Trigger to maintain update_time';
+
+CREATE TABLE IF NOT EXISTS nexent.user_cas_session_t (
+    cas_session_id SERIAL PRIMARY KEY,
+    session_id VARCHAR(100) NOT NULL UNIQUE,
+    user_id VARCHAR(100) NOT NULL,
+    cas_user_id VARCHAR(200) NOT NULL,
+    cas_session_index VARCHAR(500),
+    status VARCHAR(30) NOT NULL DEFAULT 'active',
+    expires_at TIMESTAMP NOT NULL,
+    revoked_at TIMESTAMP,
+    create_time TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
+    update_time TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
+    created_by VARCHAR(100),
+    updated_by VARCHAR(100),
+    delete_flag VARCHAR(1) DEFAULT 'N'
+);
+
+CREATE INDEX IF NOT EXISTS ix_user_cas_session_session_id
+    ON nexent.user_cas_session_t (session_id);
+CREATE INDEX IF NOT EXISTS ix_user_cas_session_user_id
+    ON nexent.user_cas_session_t (user_id);
+CREATE INDEX IF NOT EXISTS ix_user_cas_session_cas_user_id
+    ON nexent.user_cas_session_t (cas_user_id);
+
+COMMENT ON TABLE nexent.user_cas_session_t IS 'Server-side session records for CAS SSO login and logout synchronization';
+COMMENT ON COLUMN nexent.user_cas_session_t.session_id IS 'JWT sid claim for revocation checks';
+COMMENT ON COLUMN nexent.user_cas_session_t.cas_user_id IS 'User identifier returned by CAS';
+COMMENT ON COLUMN nexent.user_cas_session_t.cas_session_index IS 'CAS SessionIndex or service ticket';
+
+-- Rename params -> config_values, add config_schemas to ag_skill_info_t
+-- Add tenant_id column for multi-tenancy support
+ALTER TABLE nexent.ag_skill_info_t ADD COLUMN IF NOT EXISTS tenant_id VARCHAR(100);
+
+-- Add config_values and config_schemas to ag_skill_info_t
+DO $$
+BEGIN
+    IF EXISTS (
+        SELECT 1 FROM information_schema.columns
+        WHERE table_schema = 'nexent'
+          AND table_name   = 'ag_skill_info_t'
+          AND column_name  = 'params'
+    ) THEN
+        ALTER TABLE nexent.ag_skill_info_t RENAME COLUMN params TO config_values;
+    END IF;
+END $$;
+ALTER TABLE nexent.ag_skill_info_t ADD COLUMN IF NOT EXISTS config_schemas JSON;
+
+-- Comments for ag_skill_info_t columns
+COMMENT ON COLUMN nexent.ag_skill_info_t.tenant_id IS 'Tenant ID for multi-tenancy. NULL for pre-existing skills.';
+COMMENT ON COLUMN nexent.ag_skill_info_t.config_values IS 'Runtime parameter values from config/config.yaml';
+COMMENT ON COLUMN nexent.ag_skill_info_t.config_schemas IS 'Parameter metadata list from config/schema.yaml';
+
+-- Add config_values and config_schemas to ag_skill_instance_t
+ALTER TABLE nexent.ag_skill_instance_t ADD COLUMN IF NOT EXISTS config_values JSON;
+ALTER TABLE nexent.ag_skill_instance_t ADD COLUMN IF NOT EXISTS config_schemas JSON;
+
+-- Comments for ag_skill_instance_t columns
+COMMENT ON COLUMN nexent.ag_skill_instance_t.config_values IS 'Per-agent runtime parameter values from config/config.yaml';
+COMMENT ON COLUMN nexent.ag_skill_instance_t.config_schemas IS 'Per-agent parameter schema overrides from config/schema.yaml';
+
+-- Migration: ASSET_OWNER role permissions and invitation type comment
+-- Date: 2026-05-29
+-- Description: Add ASSET_OWNER role permissions, SU asset-owner invite permissions,
+--              update invitation code_type comment, and ensure ag_skill_info_t.tenant_id exists
+-- Source: commit 15cece97692db2372a978cbdf21b5d5316e79f30 (init.sql)
+
+SET search_path TO nexent;
+
+BEGIN;
+
+COMMENT ON COLUMN nexent.tenant_invitation_code_t.code_type IS
+    'Invitation code type: ADMIN_INVITE, DEV_INVITE, USER_INVITE, ASSET_OWNER_INVITE';
+
+INSERT INTO nexent.role_permission_t
+    (role_permission_id, user_role, permission_category, permission_type, permission_subtype)
+VALUES
+    (188, 'SU', 'RESOURCE', 'INVITE.ASSET_OWNER', 'CREATE'),
+    (189, 'SU', 'RESOURCE', 'INVITE.ASSET_OWNER', 'READ'),
+    (190, 'SU', 'RESOURCE', 'INVITE.ASSET_OWNER', 'UPDATE'),
+    (191, 'SU', 'RESOURCE', 'INVITE.ASSET_OWNER', 'DELETE'),
+    (192, 'ASSET_OWNER', 'VISIBILITY', 'LEFT_NAV_MENU', '/'),
+    (193, 'ASSET_OWNER', 'VISIBILITY', 'LEFT_NAV_MENU', '/agents'),
+    (194, 'ASSET_OWNER', 'VISIBILITY', 'LEFT_NAV_MENU', '/knowledges'),
+    (195, 'ASSET_OWNER', 'VISIBILITY', 'LEFT_NAV_MENU', '/chat'),
+    (196, 'ASSET_OWNER', 'VISIBILITY', 'LEFT_NAV_MENU', '/space'),
+    (197, 'ASSET_OWNER', 'VISIBILITY', 'LEFT_NAV_MENU', '/market'),
+    (198, 'ASSET_OWNER', 'VISIBILITY', 'LEFT_NAV_MENU', '/models'),
+    (199, 'ASSET_OWNER', 'RESOURCE', 'AGENT', 'CREATE'),
+    (200, 'ASSET_OWNER', 'RESOURCE', 'AGENT', 'READ'),
+    (201, 'ASSET_OWNER', 'RESOURCE', 'AGENT', 'UPDATE'),
+    (202, 'ASSET_OWNER', 'RESOURCE', 'AGENT', 'DELETE'),
+    (203, 'ASSET_OWNER', 'RESOURCE', 'SKILL', 'CREATE'),
+    (204, 'ASSET_OWNER', 'RESOURCE', 'SKILL', 'READ'),
+    (205, 'ASSET_OWNER', 'RESOURCE', 'SKILL', 'UPDATE'),
+    (206, 'ASSET_OWNER', 'RESOURCE', 'SKILL', 'DELETE'),
+    (207, 'ASSET_OWNER', 'RESOURCE', 'KB', 'CREATE'),
+    (208, 'ASSET_OWNER', 'RESOURCE', 'KB', 'READ'),
+    (209, 'ASSET_OWNER', 'RESOURCE', 'KB', 'UPDATE'),
+    (210, 'ASSET_OWNER', 'RESOURCE', 'KB', 'DELETE'),
+    (211, 'ASSET_OWNER', 'RESOURCE', 'MCP', 'CREATE'),
+    (212, 'ASSET_OWNER', 'RESOURCE', 'MCP', 'READ'),
+    (213, 'ASSET_OWNER', 'RESOURCE', 'MCP', 'UPDATE'),
+    (214, 'ASSET_OWNER', 'RESOURCE', 'MCP', 'DELETE'),
+    (215, 'ASSET_OWNER', 'RESOURCE', 'MODEL', 'CREATE'),
+    (216, 'ASSET_OWNER', 'RESOURCE', 'MODEL', 'READ'),
+    (217, 'ASSET_OWNER', 'RESOURCE', 'MODEL', 'UPDATE'),
+    (218, 'ASSET_OWNER', 'RESOURCE', 'MODEL', 'DELETE'),
+    (219, 'ASSET_OWNER', 'RESOURCE', 'USER.ROLE', 'READ'),
+    (220, 'ASSET_OWNER', 'VISIBILITY', 'LEFT_NAV_MENU', '/users'),
+    (221, 'SU', 'VISIBILITY', 'LEFT_NAV_MENU', '/asset-owner-resources')
+ON CONFLICT (role_permission_id) DO NOTHING;
+
+COMMIT;
+
+-- Migration: Add preserve_source_file to knowledge_record_t table
+-- Date: 2026-06-01
+-- Description: Whether to preserve uploaded source documents after vectorization (default: true)
+
+ALTER TABLE nexent.knowledge_record_t
+ADD COLUMN IF NOT EXISTS preserve_source_file BOOLEAN NOT NULL DEFAULT true;
+
+COMMENT ON COLUMN nexent.knowledge_record_t.preserve_source_file IS 'Whether to preserve uploaded source documents after vectorization';
+
+-- Migration: Add ag_agent_repository_t table
+-- Date: 2026-06-05
+-- Description: Agent marketplace repository for frozen shareable agent snapshots.
+
+SET search_path TO nexent;
+
+BEGIN;
+
+CREATE SEQUENCE IF NOT EXISTS nexent.ag_agent_repository_t_agent_repository_id_seq;
+
+CREATE TABLE IF NOT EXISTS nexent.ag_agent_repository_t (
+    agent_repository_id BIGINT NOT NULL DEFAULT nextval('nexent.ag_agent_repository_t_agent_repository_id_seq'),
+    publisher_tenant_id VARCHAR(100) NOT NULL,
+    publisher_user_id VARCHAR(100) NOT NULL,
+    agent_id INTEGER NOT NULL,
+    source_version_no INTEGER NOT NULL,
+    name VARCHAR(100) NOT NULL,
+    display_name VARCHAR(100),
+    description TEXT,
+    author VARCHAR(100),
+    category_id INTEGER,
+    tags TEXT[],
+    tool_count INTEGER,
+    version_label VARCHAR(100),
+    agent_info_json JSONB NOT NULL,
+    status VARCHAR(30) DEFAULT 'NOT_SHARED',
+    create_time TIMESTAMP WITHOUT TIME ZONE DEFAULT CURRENT_TIMESTAMP,
+    update_time TIMESTAMP WITHOUT TIME ZONE DEFAULT CURRENT_TIMESTAMP,
+    created_by VARCHAR(100),
+    updated_by VARCHAR(100),
+    delete_flag VARCHAR(1) DEFAULT 'N',
+    CONSTRAINT ag_agent_repository_t_pkey PRIMARY KEY (agent_repository_id)
+);
+
+ALTER SEQUENCE nexent.ag_agent_repository_t_agent_repository_id_seq
+    OWNED BY nexent.ag_agent_repository_t.agent_repository_id;
+
+ALTER TABLE nexent.ag_agent_repository_t OWNER TO root;
+
+COMMENT ON TABLE nexent.ag_agent_repository_t IS 'Agent marketplace repository for frozen shareable agent snapshots';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.agent_repository_id IS 'Agent repository listing ID, unique primary key';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.publisher_tenant_id IS 'Publisher tenant ID';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.publisher_user_id IS 'Publisher user ID';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.agent_id IS 'Root agent ID from ag_tenant_agent_t; upsert key with publisher_tenant_id';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.source_version_no IS 'Published version number frozen at share time';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.name IS 'Root agent programmatic name for display and search';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.display_name IS 'Root agent display name';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.description IS 'Root agent description';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.author IS 'Agent author';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.category_id IS 'Optional marketplace category ID';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.tags IS 'Marketplace tags';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.tool_count IS 'Total tool count across all agents in the bundle (display only)';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.version_label IS 'Repository entry version label for display (e.g. v1.0)';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.agent_info_json IS 'Frozen ExportAndImportDataFormat snapshot with optional skills';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.status IS 'Listing status: NOT_SHARED (未共享) / PENDING_REVIEW (待审核) / REJECTED (审核驳回) / SHARED (已共享)';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.create_time IS 'Creation time';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.update_time IS 'Update time';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.created_by IS 'Creator ID';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.updated_by IS 'Updater ID';
+COMMENT ON COLUMN nexent.ag_agent_repository_t.delete_flag IS 'Soft delete flag: Y/N';
+
+CREATE UNIQUE INDEX IF NOT EXISTS uq_agent_repository_tenant_agent_active
+    ON nexent.ag_agent_repository_t (publisher_tenant_id, agent_id)
+    WHERE delete_flag = 'N';
+
+CREATE INDEX IF NOT EXISTS idx_agent_repository_publisher_delete
+    ON nexent.ag_agent_repository_t (publisher_tenant_id, delete_flag);
+
+CREATE INDEX IF NOT EXISTS idx_agent_repository_status_delete
+    ON nexent.ag_agent_repository_t (status, delete_flag);
+
+CREATE INDEX IF NOT EXISTS idx_agent_repository_name_delete
+    ON nexent.ag_agent_repository_t (name, delete_flag);
+
+CREATE INDEX IF NOT EXISTS idx_agent_repository_tags_gin
+    ON nexent.ag_agent_repository_t USING GIN (tags);
+
+CREATE OR REPLACE FUNCTION update_ag_agent_repository_update_time()
+RETURNS TRIGGER AS $$
+BEGIN
+    NEW.update_time = CURRENT_TIMESTAMP;
+    RETURN NEW;
+END;
+$$ LANGUAGE plpgsql;
+
+COMMENT ON FUNCTION update_ag_agent_repository_update_time() IS 'Auto-update update_time for ag_agent_repository_t';
+
+DROP TRIGGER IF EXISTS update_ag_agent_repository_update_time_trigger ON nexent.ag_agent_repository_t;
+CREATE TRIGGER update_ag_agent_repository_update_time_trigger
+BEFORE UPDATE ON nexent.ag_agent_repository_t
+FOR EACH ROW
+EXECUTE FUNCTION update_ag_agent_repository_update_time();
+
+COMMENT ON TRIGGER update_ag_agent_repository_update_time_trigger ON nexent.ag_agent_repository_t IS 'Trigger to maintain update_time';
+
+COMMIT;
+
+-- Migration: Add selected_agent_version_no to ag_agent_relation_t
+-- Date: 2026-06-09
+-- Description: Pin child agent version on parent-child relations at publish time.
+
+SET search_path TO nexent;
+
+BEGIN;
+
+ALTER TABLE nexent.ag_agent_relation_t
+    ADD COLUMN IF NOT EXISTS selected_agent_version_no INTEGER;
+
+COMMENT ON COLUMN nexent.ag_agent_relation_t.selected_agent_version_no IS
+    'Pinned version of selected_agent_id. NULL = use child current published version at runtime (legacy/draft).';
+
+COMMIT;
diff --git a/k8s/helm/nexent/charts/nexent-common/templates/configmap.yaml b/k8s/helm/nexent/charts/nexent-common/templates/configmap.yaml
index 1b473b633..0f1a4a5a3 100644
--- a/k8s/helm/nexent/charts/nexent-common/templates/configmap.yaml
+++ b/k8s/helm/nexent/charts/nexent-common/templates/configmap.yaml
@@ -166,3 +166,23 @@ data:
   OAUTH_SSL_VERIFY: {{ .Values.config.oauth.sslVerify | quote }}
   OAUTH_CA_BUNDLE: {{ .Values.config.oauth.caBundle | quote }}
   OAUTH_CALLBACK_BASE_URL: {{ .Values.config.oauth.callbackBaseUrl | quote }}
+
+  # ===== CAS SSO Configuration =====
+  CAS_ENABLED: {{ .Values.config.cas.enabled | quote }}
+  CAS_SERVER_URL: {{ .Values.config.cas.serverUrl | quote }}
+  CAS_VALIDATE_PATH: {{ .Values.config.cas.validatePath | quote }}
+  CAS_CALLBACK_BASE_URL: {{ .Values.config.cas.callbackBaseUrl | quote }}
+  CAS_LOGIN_MODE: {{ .Values.config.cas.loginMode | quote }}
+  CAS_USER_ATTRIBUTE: {{ .Values.config.cas.userAttribute | quote }}
+  CAS_EMAIL_ATTRIBUTE: {{ .Values.config.cas.emailAttribute | quote }}
+  CAS_ROLE_ATTRIBUTE: {{ .Values.config.cas.roleAttribute | quote }}
+  CAS_TENANT_ATTRIBUTE: {{ .Values.config.cas.tenantAttribute | quote }}
+  CAS_ROLE_MAP_JSON: {{ .Values.config.cas.roleMapJson | quote }}
+  CAS_SESSION_MAX_AGE_SECONDS: {{ .Values.config.cas.sessionMaxAgeSeconds | quote }}
+  LOCAL_SESSION_MAX_AGE_SECONDS: {{ .Values.config.cas.localSessionMaxAgeSeconds | quote }}
+  CAS_RENEW_BEFORE_SECONDS: {{ .Values.config.cas.renewBeforeSeconds | quote }}
+  CAS_RENEW_TIMEOUT_SECONDS: {{ .Values.config.cas.renewTimeoutSeconds | quote }}
+  CAS_SYNTHETIC_EMAIL_DOMAIN: {{ .Values.config.cas.syntheticEmailDomain | quote }}
+  CAS_LOGOUT_URL: {{ .Values.config.cas.logoutUrl | quote }}
+  CAS_SSL_VERIFY: {{ .Values.config.cas.sslVerify | quote }}
+  CAS_CA_BUNDLE: {{ .Values.config.cas.caBundle | quote }}
diff --git a/k8s/helm/nexent/charts/nexent-common/values.yaml b/k8s/helm/nexent/charts/nexent-common/values.yaml
index 788ae7290..7b27ba302 100644
--- a/k8s/helm/nexent/charts/nexent-common/values.yaml
+++ b/k8s/helm/nexent/charts/nexent-common/values.yaml
@@ -139,6 +139,29 @@ config:
     sslVerify: "true"
     caBundle: ""
     callbackBaseUrl: "http://localhost:30000"
+  cas:
+    enabled: "false"
+    serverUrl: ""
+    validatePath: "/p3/serviceValidate"
+    callbackBaseUrl: "http://localhost:30000"
+    # Supported values:
+    # - disabled: disable CAS login entry and automatic CAS redirects.
+    # - button: show CAS as an optional login entry.
+    # - force: automatically redirect unauthenticated users to CAS login.
+    loginMode: "disabled"
+    userAttribute: ""
+    emailAttribute: "email"
+    roleAttribute: "role"
+    tenantAttribute: "tenant_id"
+    roleMapJson: ""
+    sessionMaxAgeSeconds: "3600"
+    localSessionMaxAgeSeconds: "3600"
+    renewBeforeSeconds: "300"
+    renewTimeoutSeconds: "10"
+    syntheticEmailDomain: "cas.local"
+    logoutUrl: ""
+    sslVerify: "true"
+    caBundle: ""
 
 # Secrets used by common templates
 secrets:
diff --git a/k8s/helm/nexent/charts/nexent-data-process/values.yaml b/k8s/helm/nexent/charts/nexent-data-process/values.yaml
index 189292667..d6bb70a7f 100644
--- a/k8s/helm/nexent/charts/nexent-data-process/values.yaml
+++ b/k8s/helm/nexent/charts/nexent-data-process/values.yaml
@@ -12,7 +12,7 @@ resources:
       memory: 512Mi
       cpu: 0.5
     limits:
-      memory: 4Gi
+      memory: 64Gi
       cpu: 8
 
 config:
diff --git a/k8s/helm/nexent/values.yaml b/k8s/helm/nexent/values.yaml
index ce5bc454a..6224d0949 100644
--- a/k8s/helm/nexent/values.yaml
+++ b/k8s/helm/nexent/values.yaml
@@ -40,6 +40,33 @@ global:
 
 # Optional monitoring stack. Set provider to one of:
 # otlp, phoenix, langfuse, langsmith, grafana, zipkin.
+nexent-common:
+  # Shared ConfigMap values rendered into the Kubernetes nexent-config ConfigMap.
+  config:
+    cas:
+      enabled: "false"
+      serverUrl: ""
+      validatePath: "/p3/serviceValidate"
+      callbackBaseUrl: "http://localhost:30000"
+      # Supported values:
+      # - disabled: disable CAS login entry and automatic CAS redirects.
+      # - button: show CAS as an optional login entry.
+      # - force: automatically redirect unauthenticated users to CAS login.
+      loginMode: "disabled"
+      userAttribute: ""
+      emailAttribute: "email"
+      roleAttribute: "role"
+      tenantAttribute: "tenant_id"
+      roleMapJson: ""
+      sessionMaxAgeSeconds: "3600"
+      localSessionMaxAgeSeconds: "3600"
+      renewBeforeSeconds: "300"
+      renewTimeoutSeconds: "10"
+      syntheticEmailDomain: "cas.local"
+      logoutUrl: ""
+      sslVerify: "true"
+      caBundle: ""
+
 nexent-elasticsearch:
   enabled: true
 nexent-postgresql:
diff --git a/make/data_process/Dockerfile b/make/data_process/Dockerfile
index 8d9a8a723..998e2352a 100644
--- a/make/data_process/Dockerfile
+++ b/make/data_process/Dockerfile
@@ -1,4 +1,4 @@
-FROM python:3.10-slim
+FROM python:3.11-slim
 ARG MIRROR
 ARG APT_MIRROR
 LABEL authors="nexent"
@@ -45,11 +45,12 @@ RUN uv sync --no-cache-dir --extra data-process $(test -n "$MIRROR" && echo "-i
     uv cache clean
 # Layer 2: install sdk in link mode
 COPY sdk /opt/sdk
-RUN uv pip install --no-cache-dir /opt/sdk $(test -n "$MIRROR" && echo "-i $MIRROR") && \
+RUN uv pip install --no-cache-dir "/opt/sdk[performance]" $(test -n "$MIRROR" && echo "-i $MIRROR") && \
     uv cache clean
 
 # Pre-download tiktoken cl100k_base model to avoid network issues during runtime
 RUN uv run python -c "import tiktoken; enc = tiktoken.get_encoding('cl100k_base')"
+
 # Layer 3: copy backend code
 COPY backend /opt/backend
 
diff --git a/make/main/Dockerfile b/make/main/Dockerfile
index 0f4027619..0e32b04b7 100644
--- a/make/main/Dockerfile
+++ b/make/main/Dockerfile
@@ -1,4 +1,4 @@
-FROM python:3.10-slim
+FROM python:3.11-slim
 ARG MIRROR
 ARG APT_MIRROR
 LABEL authors="nexent"
diff --git a/make/mcp/Dockerfile b/make/mcp/Dockerfile
index 03cb3f1c3..e011bf5fe 100644
--- a/make/mcp/Dockerfile
+++ b/make/mcp/Dockerfile
@@ -1,4 +1,4 @@
-FROM python:3.10-slim
+FROM python:3.11-slim
 
 ARG MIRROR
 ARG APT_MIRROR
@@ -38,7 +38,7 @@ RUN if [ -n "$MCP_PROXY_VERSION" ]; then \
 
 # Install Node.js 20 from official binaries (pin exact version to avoid repo issues)
 ARG NODE_VERSION=20.17.0
-RUN set -euo pipefail && \
+RUN set -eu && \
     arch="$(dpkg --print-architecture)" && \
     case "${arch}" in \
         amd64) node_arch="x64" ;; \
diff --git a/scripts/deployment/common.sh b/scripts/deployment/common.sh
index 5855af1a0..006561553 100755
--- a/scripts/deployment/common.sh
+++ b/scripts/deployment/common.sh
@@ -319,11 +319,6 @@ deployment_validate() {
     deployment_error "Local config schemaVersion $DEPLOYMENT_LOADED_SCHEMA_VERSION is incompatible with $DEPLOYMENT_SCHEMA_VERSION. Re-run with --reconfigure."
     return 1
   fi
-  if [ -n "$DEPLOYMENT_LOADED_APP_VERSION" ] && [ -n "${APP_VERSION:-}" ] && [ -z "${DEPLOYMENT_APP_VERSION_EXPLICIT:-}" ] && [ "$DEPLOYMENT_LOADED_APP_VERSION" != "$APP_VERSION" ]; then
-    deployment_error "Local config appVersion $DEPLOYMENT_LOADED_APP_VERSION does not match current appVersion $APP_VERSION. Re-run with --reconfigure or pass --app-version."
-    return 1
-  fi
-
   local old_ifs="$IFS"
   local component
   IFS=','
diff --git a/scripts/offline/build_offline_package.sh b/scripts/offline/build_offline_package.sh
index f69eaea80..ff2141c83 100755
--- a/scripts/offline/build_offline_package.sh
+++ b/scripts/offline/build_offline_package.sh
@@ -4,7 +4,6 @@ set -e
 
 SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
 PROJECT_ROOT="$(cd "$SCRIPT_DIR/../.." && pwd)"
-DEPLOYMENT_COMMON="$PROJECT_ROOT/scripts/deployment/common.sh"
 
 DEFAULT_VERSION="latest"
 DEFAULT_PLATFORM="amd64"
@@ -15,16 +14,6 @@ VERSION=""
 PLATFORM=""
 OUTPUT_DIR=""
 INCLUDE_SOURCE=""
-DRY_RUN="false"
-COMMON_ARGS=()
-
-if [ -f "$DEPLOYMENT_COMMON" ]; then
-  # shellcheck source=/dev/null
-  source "$DEPLOYMENT_COMMON"
-else
-  echo "Error: shared deployment helper not found: $DEPLOYMENT_COMMON"
-  exit 1
-fi
 
 show_help() {
   echo "Usage: $0 [OPTIONS]"
@@ -40,10 +29,6 @@ show_help() {
   echo "                           Default: $DEFAULT_OUTPUT_DIR"
   echo "  --include-source BOOL   Include source code (true or false)"
   echo "                           Default: $DEFAULT_INCLUDE_SOURCE"
-  echo "  --components LIST       Deployment components for image selection"
-  echo "  --image-source SOURCE   general, mainland, or local-latest"
-  echo "  --registry-profile NAME Legacy alias for --image-source general|mainland"
-  echo "  --config FILE           Deployment config with components and image source"
   echo "  --dry-run               Show execution plan without actual operations"
   echo "  --help                  Show this help message"
   echo ""
@@ -75,15 +60,7 @@ parse_args() {
         shift 2
         ;;
       --dry-run)
-        DRY_RUN="true"
-        shift
-        ;;
-      --components|--image-source|--registry-profile|--app-version|--monitoring-provider|--port-policy|--config|--local-config)
-        COMMON_ARGS+=("$1" "$2")
-        shift 2
-        ;;
-      --use-local-config|--reconfigure)
-        COMMON_ARGS+=("$1")
+        dry_run=true
         shift
         ;;
       --help)
@@ -107,32 +84,13 @@ parse_args() {
     echo "Error: Platform must be 'amd64' or 'arm64'"
     exit 1
   fi
-}
 
-prepare_deployment_image_config() {
-  export APP_VERSION="$VERSION"
-  deployment_prepare_config "${COMMON_ARGS[@]}" --app-version "$VERSION" || exit 1
-
-  case "$DEPLOYMENT_REGISTRY_PROFILE" in
-    mainland)
-      [ -f "$PROJECT_ROOT/docker/.env.mainland" ] && source "$PROJECT_ROOT/docker/.env.mainland"
-      ;;
-    general|local-latest)
-      [ -f "$PROJECT_ROOT/docker/.env.general" ] && source "$PROJECT_ROOT/docker/.env.general"
-      ;;
-  esac
-
-  deployment_apply_image_source
-}
-
-show_dry_run_plan() {
+  if [[ "$dry_run" == "true" ]]; then
     echo "=== DRY RUN MODE ==="
     echo "Version: $VERSION"
     echo "Platform: $PLATFORM"
     echo "Output directory: $OUTPUT_DIR"
     echo "Include source: $INCLUDE_SOURCE"
-    echo "Components: $DEPLOYMENT_COMPONENTS"
-    echo "Image source: $DEPLOYMENT_IMAGE_SOURCE"
     echo ""
     echo "Images to pull:"
     get_nexent_images
@@ -140,49 +98,38 @@ show_dry_run_plan() {
     echo ""
     echo "No actual operations will be performed."
     exit 0
+  fi
 }
 
 get_nexent_images() {
-  deployment_csv_contains "$DEPLOYMENT_COMPONENTS" "application" && echo "$NEXENT_IMAGE"
-  deployment_csv_contains "$DEPLOYMENT_COMPONENTS" "application" && echo "$NEXENT_WEB_IMAGE"
-  deployment_csv_contains "$DEPLOYMENT_COMPONENTS" "application" && echo "$NEXENT_MCP_DOCKER_IMAGE"
-  deployment_csv_contains "$DEPLOYMENT_COMPONENTS" "data-process" && echo "$NEXENT_DATA_PROCESS_IMAGE"
-  deployment_csv_contains "$DEPLOYMENT_COMPONENTS" "terminal" && echo "$OPENSSH_SERVER_IMAGE"
-  true
+  local version_tag="$VERSION"
+
+  local nexent_images=(
+    "nexent/nexent:${version_tag}"
+    "nexent/nexent-web:${version_tag}"
+    "nexent/nexent-data-process:${version_tag}"
+    "nexent/nexent-mcp:${version_tag}"
+  )
+
+  for img in "${nexent_images[@]}"; do
+    echo "$img"
+  done
 }
 
 get_third_party_images() {
-  if deployment_csv_contains "$DEPLOYMENT_COMPONENTS" "infrastructure"; then
-    echo "$ELASTICSEARCH_IMAGE"
-    echo "$POSTGRESQL_IMAGE"
-    echo "$REDIS_IMAGE"
-    echo "$MINIO_IMAGE"
-  fi
-  if deployment_csv_contains "$DEPLOYMENT_COMPONENTS" "supabase"; then
-    echo "$SUPABASE_KONG"
-    echo "$SUPABASE_GOTRUE"
-    echo "$SUPABASE_DB"
-  fi
-  if deployment_csv_contains "$DEPLOYMENT_COMPONENTS" "monitoring"; then
-    echo "otel/opentelemetry-collector-contrib:0.151.0"
-    case "$DEPLOYMENT_MONITORING_PROVIDER" in
-      phoenix) echo "arizephoenix/phoenix:15" ;;
-      grafana)
-        echo "grafana/tempo:2.10.5"
-        echo "grafana/grafana:12.4"
-        ;;
-      zipkin) echo "openzipkin/zipkin:latest" ;;
-      langfuse)
-        echo "docker.io/langfuse/langfuse-worker:3"
-        echo "docker.io/langfuse/langfuse:3"
-        echo "docker.io/clickhouse/clickhouse-server:26.3-alpine"
-        echo "docker.io/minio/minio:RELEASE.2023-12-20T01-00-02Z"
-        echo "docker.io/redis:alpine"
-        echo "docker.io/postgres:15-alpine"
-        ;;
-    esac
-  fi
-  true
+  local third_party_images=(
+    "docker.elastic.co/elasticsearch/elasticsearch:8.17.4"
+    "docker.io/library/postgres:15-alpine"
+    "docker.io/library/redis:alpine"
+    "quay.io/minio/minio:RELEASE.2023-12-20T01-00-02Z"
+    "docker.io/library/kong:2.8.1"
+    "docker.io/supabase/gotrue:v2.170.0"
+    "docker.io/supabase/postgres:15.8.1.060"
+  )
+
+  for img in "${third_party_images[@]}"; do
+    echo "$img"
+  done
 }
 
 pull_with_retry() {
@@ -415,11 +362,6 @@ LOADSCRIPT
 
 main() {
   parse_args "$@"
-  prepare_deployment_image_config
-
-  if [[ "$DRY_RUN" == "true" ]]; then
-    show_dry_run_plan
-  fi
 
   echo ""
   echo "========================================"
@@ -429,8 +371,6 @@ main() {
   echo "Platform: $PLATFORM"
   echo "Output directory: $OUTPUT_DIR"
   echo "Include source: $INCLUDE_SOURCE"
-  echo "Components: $DEPLOYMENT_COMPONENTS"
-  echo "Image source: $DEPLOYMENT_IMAGE_SOURCE"
   echo "========================================"
 
   rm -rf "$OUTPUT_DIR"
diff --git a/sdk/nexent/__init__.py b/sdk/nexent/__init__.py
index 781fcf495..d0de150cb 100644
--- a/sdk/nexent/__init__.py
+++ b/sdk/nexent/__init__.py
@@ -3,8 +3,7 @@
 from .memory import *
 from .storage import *
 from .vector_database import *
-from .container import *
 from .skills import *
 
 
-__all__ = ["core", "memory", "storage", "vector_database", "container", "datamate", "skills"]
+__all__ = ["core", "memory", "storage", "vector_database", "datamate", "skills"]
diff --git a/sdk/nexent/container/docker_client.py b/sdk/nexent/container/docker_client.py
index 166d27b49..80aa6f8c3 100644
--- a/sdk/nexent/container/docker_client.py
+++ b/sdk/nexent/container/docker_client.py
@@ -11,12 +11,34 @@
 
 import docker
 from docker.errors import APIError, DockerException, NotFound
-from fastmcp import Client
-from fastmcp.client.transports import StreamableHttpTransport, SSETransport
 
 from .container_client_base import ContainerClient, ContainerConfig
 from .docker_config import DockerContainerConfig
 
+Client = None
+StreamableHttpTransport = None
+SSETransport = None
+
+
+def _ensure_fastmcp_imports() -> tuple[type, type, type]:
+    global Client, StreamableHttpTransport, SSETransport
+
+    if Client is None:
+        from fastmcp import Client as FastMCPClient
+
+        Client = FastMCPClient
+
+    if StreamableHttpTransport is None or SSETransport is None:
+        from fastmcp.client.transports import (
+            StreamableHttpTransport as FastMCPStreamableHttpTransport,
+            SSETransport as FastMCPSSETransport,
+        )
+
+        StreamableHttpTransport = FastMCPStreamableHttpTransport
+        SSETransport = FastMCPSSETransport
+
+    return Client, StreamableHttpTransport, SSETransport
+
 logger = logging.getLogger("nexent.container.docker")
 
 
@@ -35,7 +57,7 @@ class ContainerConnectionError(Exception):
 class DockerContainerClient(ContainerClient):
     """Docker container client implementation"""
 
-    DEFAULT_NETWORK_NAME = "nexent_nexent"
+    DEFAULT_NETWORK_NAME = "nexent_network"
 
     def __init__(self, config: DockerContainerConfig):
         """
@@ -381,6 +403,8 @@ async def _wait_for_service_ready(
         Raises:
             ContainerConnectionError: If service is not ready after max retries
         """
+        client_cls, streamable_http_transport_cls, sse_transport_cls = _ensure_fastmcp_imports()
+
         for i in range(max_retries):
             try:
                 # Select transport based on URL ending and set headers
@@ -388,23 +412,23 @@ async def _wait_for_service_ready(
                 headers = {"Authorization": authorization_token} if authorization_token else {}
 
                 if url_stripped.endswith("/sse"):
-                    transport = SSETransport(
+                    transport = sse_transport_cls(
                         url=url_stripped,
                         headers=headers
                     )
                 elif url_stripped.endswith("/mcp"):
-                    transport = StreamableHttpTransport(
+                    transport = streamable_http_transport_cls(
                         url=url_stripped,
                         headers=headers
                     )
                 else:
                     # Default to StreamableHttpTransport for unrecognized formats
-                    transport = StreamableHttpTransport(
+                    transport = streamable_http_transport_cls(
                         url=url_stripped,
                         headers=headers
                     )
 
-                client = Client(transport=transport)
+                client = client_cls(transport=transport)
                 async with client:
                     if client.is_connected():
                         logger.info(f"Service ready at {url}")
diff --git a/sdk/nexent/container/k8s_client.py b/sdk/nexent/container/k8s_client.py
index c1fa4db53..c2fb72741 100644
--- a/sdk/nexent/container/k8s_client.py
+++ b/sdk/nexent/container/k8s_client.py
@@ -8,6 +8,7 @@
 import asyncio
 import logging
 import socket
+import re
 import uuid
 
 import kubernetes
@@ -23,6 +24,47 @@
 
 logger = logging.getLogger("nexent.container.kubernetes")
 
+# Kubernetes naming constraints: lowercase alphanumeric or dash, cannot start/end with dash,
+# cannot have consecutive dashes, max 253 characters
+K8S_NAME_PATTERN = re.compile(r"[^a-z0-9-]+")
+K8S_CONSECUTIVE_DASHES = re.compile(r"-+")
+
+
+def _sanitize_k8s_name(name: str) -> str:
+    """Convert arbitrary string to valid Kubernetes resource name.
+
+    Rules:
+    - Convert to lowercase
+    - Replace invalid characters with dash
+    - Collapse consecutive dashes
+    - Remove leading/trailing dashes
+    - Must start with alphanumeric
+
+    Args:
+        name: Input string to sanitize
+
+    Returns:
+        Valid Kubernetes name (lowercase alphanumeric and dashes only)
+    """
+    if not name:
+        return "unknown"
+
+    # Lowercase and replace invalid chars with dash
+    sanitized = K8S_NAME_PATTERN.sub("-", name.lower())
+
+    # Collapse consecutive dashes
+    sanitized = K8S_CONSECUTIVE_DASHES.sub("-", sanitized)
+
+    # Remove leading/trailing dashes
+    sanitized = sanitized.strip("-")
+
+    # Ensure it starts with alphanumeric
+    if sanitized and not sanitized[0].isalnum():
+        sanitized = "x" + sanitized
+
+    # Fallback if empty
+    return sanitized if sanitized else "unknown"
+
 
 class ContainerError(Exception):
     """Raised when container operation fails"""
@@ -77,9 +119,9 @@ def __init__(self, config: KubernetesContainerConfig):
 
     def _generate_pod_name(self, service_name: str, tenant_id: str, user_id: str) -> str:
         """Generate unique pod name with service, tenant, and user segments."""
-        safe_name = "".join(c if c.isalnum() or c == "-" else "-" for c in service_name)
-        tenant_part = (tenant_id or "")[:8]
-        user_part = (user_id or "")[:8]
+        safe_name = _sanitize_k8s_name(service_name)
+        tenant_part = _sanitize_k8s_name(tenant_id)[:8]
+        user_part = _sanitize_k8s_name(user_id)[:8]
         uuid_part = uuid.uuid4().hex[:8]
         return f"mcp-{safe_name}-{tenant_part}-{user_part}-{uuid_part}"
 
@@ -486,7 +528,7 @@ def list_containers(
 
                 # Filter by service_name if provided
                 if service_name:
-                    safe_name = "".join(c if c.isalnum() or c == "-" else "-" for c in service_name)
+                    safe_name = _sanitize_k8s_name(service_name)
                     pod_component = labels.get(self.LABEL_COMPONENT, "")
                     if safe_name not in pod_component:
                         continue
diff --git a/sdk/nexent/core/agents/agent_model.py b/sdk/nexent/core/agents/agent_model.py
index 82fb81167..62e75cb59 100644
--- a/sdk/nexent/core/agents/agent_model.py
+++ b/sdk/nexent/core/agents/agent_model.py
@@ -75,6 +75,67 @@ class ToolConfig(BaseModel):
     usage: Optional[str] = Field(description="MCP server name", default=None)
     metadata: Optional[Dict[str, Any]] = Field(description="Metadata", default=None)
 
+
+VerificationEvent = Literal[
+    "tool_precheck",
+    "tool_result",
+    "retrieval",
+    "code_execution",
+    "handoff",
+    "final_answer",
+]
+VerificationStrictness = Literal["lenient", "balanced", "strict"]
+VerificationFailPolicy = Literal["repair_then_controlled_summary", "warn"]
+
+
+class AgentVerificationConfig(BaseModel):
+    """Configuration for layered ReAct self-verification."""
+
+    enabled: bool = Field(description="Whether self-verification is enabled", default=True)
+    step_verification_enabled: bool = Field(
+        description="Whether to verify critical ReAct step events",
+        default=True,
+    )
+    final_verification_enabled: bool = Field(
+        description="Whether to verify final answer candidates before returning them",
+        default=True,
+    )
+    llm_verification_enabled: bool = Field(
+        description="Whether to use the LLM as a final-answer verifier after deterministic checks",
+        default=True,
+    )
+    max_final_rounds: int = Field(
+        description="Maximum number of final-answer verification attempts",
+        default=2,
+        ge=1,
+        le=5,
+    )
+    strictness: VerificationStrictness = Field(
+        description="Verification strictness profile",
+        default="balanced",
+    )
+    fail_policy: VerificationFailPolicy = Field(
+        description="Policy when final verification still fails after repair attempts",
+        default="repair_then_controlled_summary",
+    )
+    pass_score: float = Field(
+        description="Minimum verifier score for final answers",
+        default=0.75,
+        ge=0.0,
+        le=1.0,
+    )
+    critical_events: List[VerificationEvent] = Field(
+        description="Critical ReAct events that should be verified",
+        default_factory=lambda: [
+            "tool_precheck",
+            "tool_result",
+            "retrieval",
+            "code_execution",
+            "handoff",
+            "final_answer",
+        ],
+    )
+
 class AgentConfig(BaseModel):
     name: str = Field(description="Agent name")
     description: str = Field(description="Agent description")
@@ -100,6 +161,10 @@ class AgentConfig(BaseModel):
         description="Pre-built context components for system prompt assembly",
         default=None
     )
+    verification_config: AgentVerificationConfig = Field(
+        description="Layered ReAct self-verification configuration",
+        default_factory=AgentVerificationConfig,
+    )
 
 
 class AgentHistory(BaseModel):
diff --git a/sdk/nexent/core/agents/core_agent.py b/sdk/nexent/core/agents/core_agent.py
index e029f012e..9397b2bfa 100644
--- a/sdk/nexent/core/agents/core_agent.py
+++ b/sdk/nexent/core/agents/core_agent.py
@@ -2,6 +2,7 @@
 import ast
 import time
 import threading
+from datetime import datetime
 from textwrap import dedent
 from typing import Any, Optional, List, Dict
 from collections.abc import Generator
@@ -27,6 +28,8 @@
     import PIL.Image
 
 from .agent_context import ContextManager
+from .agent_model import AgentVerificationConfig
+from .verification import VerificationController, VerificationResult
 from ..utils.token_estimation import msg_token_count
 
 def parse_code_blobs(text: str) -> str:
@@ -212,9 +215,24 @@ def _build_final_answer_messages(task: str, agent_prompt_templates: Dict[str, An
 
 
 class CoreAgent(CodeAgent):
-    def __init__(self, observer: MessageObserver, prompt_templates: Dict[str, Any] | None = None, *args, **kwargs):
+    def __init__(
+        self,
+        observer: MessageObserver,
+        prompt_templates: Dict[str, Any] | None = None,
+        verification_config: AgentVerificationConfig | None = None,
+        *args,
+        **kwargs
+    ):
         super().__init__(prompt_templates=prompt_templates, *args, **kwargs)
         self.observer = observer
+        self.verification_config = verification_config or AgentVerificationConfig(enabled=False)
+        self.verification_controller = VerificationController(
+            config=self.verification_config,
+            observer=observer,
+            agent_name=self.agent_name,
+            model=self.model,
+            logger=self.logger,
+        )
         self.stop_event = threading.Event()
         self._history_step_count = 0  # For ContextManager, record boundary for compression
         self.context_manager: ContextManager = None
@@ -226,6 +244,78 @@ def __init__(self, observer: MessageObserver, prompt_templates: Dict[str, Any] |
         # identifiers; omitting "python" and "py" ensures ```python blocks are not extracted.
         self.code_block_tags = ["", ""]
 
+    def _verification_tool_names(self) -> List[str]:
+        names = set()
+        for container in (getattr(self, "tools", {}) or {}, getattr(self, "managed_agents", {}) or {}):
+            try:
+                names.update(str(name) for name in container.keys())
+            except AttributeError:
+                continue
+        names.add("final_answer")
+        return sorted(names)
+
+    def _append_verification_feedback(self, action_step: ActionStep, result: VerificationResult) -> None:
+        feedback = self.verification_controller.build_feedback_observation(result)
+        if action_step.observations:
+            action_step.observations += feedback
+        else:
+            action_step.observations = feedback
+
+    def _build_verification_memory_summary(
+        self,
+        current_step: ActionStep | None = None,
+        max_chars: int = 8000,
+    ) -> str:
+        summaries = []
+        steps = list(self.memory.steps[-8:])
+        if current_step is not None:
+            steps.append(current_step)
+        for step in steps:
+            if isinstance(step, TaskStep):
+                summaries.append(f"Task: {truncate_content(str(step.task), max_length=1200)}")
+            elif isinstance(step, ActionStep):
+                code = truncate_content(str(getattr(step, "code_action", "") or ""), max_length=1200)
+                observations = truncate_content(str(getattr(step, "observations", "") or ""), max_length=1800)
+                output = truncate_content(str(getattr(step, "action_output", "") or ""), max_length=1200)
+                summaries.append(
+                    f"Step {getattr(step, 'step_number', '?')}:\n"
+                    f"Code: {code}\n"
+                    f"Observation: {observations}\n"
+                    f"Output: {output}"
+                )
+        return truncate_content("\n\n".join(summaries), max_length=max_chars)
+
+    def _finalize_failed_verification_candidate(
+        self,
+        action_step: ActionStep,
+        verification_result: VerificationResult,
+        verification_round: int,
+        max_rounds: int,
+        candidate_answer: Any,
+    ) -> tuple[bool, Any]:
+        if verification_round < max_rounds:
+            verification_result.phase = "repair"
+            self.verification_controller.emit(
+                verification_result,
+                verification_round,
+            )
+            self._append_verification_feedback(action_step, verification_result)
+            action_step.is_final_answer = False
+            return False, None
+
+        verification_result.phase = "final_fail"
+        self.verification_controller.emit(
+            verification_result,
+            verification_round,
+        )
+        controlled_answer = self.verification_controller.build_controlled_failure_answer(
+            candidate_answer,
+            verification_result,
+        )
+        action_step.is_final_answer = True
+        action_step.action_output = controlled_answer
+        return True, controlled_answer
+
     def _log_model_call_parameters(self, input_messages: List[ChatMessage], stop_sequences: List[str], additional_args: Dict[str, Any]) -> None:
         """
         Log model call parameters with content truncation for readability.
@@ -348,7 +438,22 @@ def _step_stream(self, memory_step: ActionStep) -> Generator[Any]:
             # Record parsing results
             self.observer.add_message(
                 self.agent_name, ProcessType.PARSE, code_action)
+            verification_controller = getattr(self, "verification_controller", None)
+            if verification_controller:
+                precheck = verification_controller.verify_before_tool_call(
+                    code_action=code_action,
+                    step_number=memory_step.step_number,
+                    available_tool_names=self._verification_tool_names(),
+                )
+                if not precheck.passed and precheck.severity == "blocking":
+                    self._append_verification_feedback(memory_step, precheck)
+                    raise AgentExecutionError(
+                        precheck.repair_instruction or precheck.user_visible_note or "Action failed verification.",
+                        self.logger,
+                    )
 
+        except AgentExecutionError:
+            raise
         except Exception:
             self.logger.log_markdown(
                 content=model_output, title="AGENT FINAL ANSWER", level=LogLevel.INFO)
@@ -414,7 +519,7 @@ def _step_stream(self, memory_step: ActionStep) -> Generator[Any]:
             error_msg = str(e)
             self.logger.log(
                 f"[Code Execution] step={memory_step.step_number} failed after {exec_duration_ms:.1f}ms: {error_msg}",
-                level=LogLevel.WARNING,
+                level=LogLevel.ERROR,
             )
             raise AgentExecutionError(error_msg, self.logger)
 
@@ -430,6 +535,23 @@ def _step_stream(self, memory_step: ActionStep) -> Generator[Any]:
             observation += "Last output from code snippet:\n" + truncated_output
         memory_step.observations = observation
 
+        verification_controller = getattr(self, "verification_controller", None)
+        if verification_controller:
+            postcheck = verification_controller.verify_after_tool_call(
+                code_action=code_action,
+                observation=memory_step.observations,
+                step_number=memory_step.step_number,
+                is_final_answer=bool(code_output.is_final_answer),
+            )
+            if not postcheck.passed and postcheck.severity == "blocking":
+                self._append_verification_feedback(memory_step, postcheck)
+                raise AgentExecutionError(
+                    postcheck.repair_instruction or postcheck.user_visible_note or "Action result failed verification.",
+                    self.logger,
+                )
+            if postcheck.severity == "warning":
+                self._append_verification_feedback(memory_step, postcheck)
+
         # Pre-truncate observations when ContextManager is enabled. Keeps the
         # head + tail of long outputs around a truncation marker so downstream
         # compression sees bounded-length step records and the model can still
@@ -478,7 +600,11 @@ def run(self, task: str, stream: bool = False, reset: bool = True, images: Optio
         ```
         """
         max_steps = max_steps or self.max_steps
-        self.task = task
+        # Prepend current time to the user task instead of baking it into the
+        # system prompt. This keeps the system prefix stable so prompt/KV caches
+        # can hit across requests; only the trailing user message varies.
+        time_str = datetime.now().strftime("%Y-%m-%d %H:%M:%S")
+        self.task = f"[Current time: {time_str}]\n\n{task}"
         if additional_args is not None:
             self.state.update(additional_args)
             self.task += f"""
@@ -597,6 +723,17 @@ def _run_stream(
         action_step = None
         self.step_number = 1
         returned_final_answer = False
+        final_verification_round = 0
+        verification_config = getattr(
+            self,
+            "verification_config",
+            AgentVerificationConfig(enabled=False),
+        )
+        max_final_verification_rounds = (
+            verification_config.max_final_rounds
+            if verification_config and verification_config.enabled
+            else 1
+        )
         while not returned_final_answer and self.step_number <= max_steps and not self.stop_event.is_set():
             step_start_time = time.time()
 
@@ -608,24 +745,73 @@ def _run_stream(
                     yield output
 
                 if isinstance(output, ActionOutput) and output.is_final_answer:
-                    final_answer = output.output
+                    candidate_answer = output.output
                     self.logger.log(
-                        Text(f"Final answer: {final_answer}", style=f"bold {YELLOW_HEX}"),
+                        Text(f"Final answer: {candidate_answer}", style=f"bold {YELLOW_HEX}"),
                         level=LogLevel.INFO,
                     )
 
-                    if self.final_answer_checks:
-                        self._validate_final_answer(final_answer)
-                    returned_final_answer = True
-                    action_step.is_final_answer = True
+                    if verification_config.enabled and verification_config.final_verification_enabled:
+                        final_verification_round += 1
+                        verification_result = self.verification_controller.verify_final_answer(
+                            task=task,
+                            candidate=candidate_answer,
+                            memory_summary=self._build_verification_memory_summary(action_step),
+                            round_number=final_verification_round,
+                        )
+                        if verification_result.passed:
+                            final_answer = candidate_answer
+                            if self.final_answer_checks:
+                                self._validate_final_answer(final_answer)
+                            returned_final_answer = True
+                            action_step.is_final_answer = True
+                        else:
+                            returned_final_answer, final_answer = self._finalize_failed_verification_candidate(
+                                action_step=action_step,
+                                verification_result=verification_result,
+                                verification_round=final_verification_round,
+                                max_rounds=max_final_verification_rounds,
+                                candidate_answer=candidate_answer,
+                            )
+                    else:
+                        final_answer = candidate_answer
+                        if self.final_answer_checks:
+                            self._validate_final_answer(final_answer)
+                        returned_final_answer = True
+                        action_step.is_final_answer = True
 
             except FinalAnswerError:
                 # When the model does not output code, directly treat the large model content as the final answer
-                final_answer = action_step.model_output
-                if isinstance(final_answer, str):
-                    final_answer = convert_code_format(final_answer)
-                returned_final_answer = True
-                action_step.is_final_answer = True
+                candidate_answer = action_step.model_output
+                if isinstance(candidate_answer, str):
+                    candidate_answer = convert_code_format(candidate_answer)
+
+                if verification_config.enabled and verification_config.final_verification_enabled:
+                    final_verification_round += 1
+                    verification_result = self.verification_controller.verify_final_answer(
+                        task=task,
+                        candidate=candidate_answer,
+                        memory_summary=self._build_verification_memory_summary(action_step),
+                        round_number=final_verification_round,
+                    )
+                    if verification_result.passed:
+                        final_answer = candidate_answer
+                        if self.final_answer_checks:
+                            self._validate_final_answer(final_answer)
+                        returned_final_answer = True
+                        action_step.is_final_answer = True
+                    else:
+                        returned_final_answer, final_answer = self._finalize_failed_verification_candidate(
+                            action_step=action_step,
+                            verification_result=verification_result,
+                            verification_round=final_verification_round,
+                            max_rounds=max_final_verification_rounds,
+                            candidate_answer=candidate_answer,
+                        )
+                else:
+                    final_answer = candidate_answer
+                    returned_final_answer = True
+                    action_step.is_final_answer = True
 
             except AgentError as e:
                 action_step.error = e
@@ -652,6 +838,19 @@ def _run_stream(
             # _handle_max_steps_reached already yields the final step internally
             # and sets action_step.error, so don't yield again to avoid duplicate error
             final_answer = self._handle_max_steps_reached(task)
+            if verification_config.enabled and verification_config.final_verification_enabled:
+                final_verification_round += 1
+                verification_result = self.verification_controller.verify_final_answer(
+                    task=task,
+                    candidate=final_answer,
+                    memory_summary=self._build_verification_memory_summary(),
+                    round_number=final_verification_round,
+                )
+                if not verification_result.passed:
+                    final_answer = self.verification_controller.build_controlled_failure_answer(
+                        final_answer,
+                        verification_result,
+                    )
         yield FinalAnswerStep(handle_agent_output_types(final_answer))
 
 
@@ -796,7 +995,7 @@ def _handle_max_steps_reached(self, task: str) -> Any:
         except Exception as e:
             # Fallback to error message if streaming fails
             model_output = f"Error in generating final LLM output: {e}"
-            self.logger.log(f"Error in final answer generation: {e}", level=LogLevel.WARNING)
+            self.logger.log(f"Error in final answer generation: {e}", level=LogLevel.ERROR)
 
         # Finalize the memory step
         final_memory_step.timing.end_time = time.time()
diff --git a/sdk/nexent/core/agents/nexent_agent.py b/sdk/nexent/core/agents/nexent_agent.py
index a5efcbe82..ed43b6691 100644
--- a/sdk/nexent/core/agents/nexent_agent.py
+++ b/sdk/nexent/core/agents/nexent_agent.py
@@ -46,10 +46,8 @@ def _tool_name(tool_obj: Any) -> str:
 
 def _is_retriever_tool(tool_obj: Any) -> bool:
     """Classify tools that should use RETRIEVER rather than TOOL semantics."""
-    return (
-        type(tool_obj).__name__ == "KnowledgeBaseSearchTool"
-        or _tool_name(tool_obj) == "knowledge_base_search"
-    )
+    name = type(tool_obj).__name__
+    return name in ("KnowledgeBaseSearchTool", "SearchMemoryTool")
 
 
 def _build_tool_input(callable_obj: Callable, args: tuple, kwargs: Dict[str, Any]) -> Dict[str, Any]:
@@ -200,11 +198,16 @@ def create_local_tool(self, tool_config: ToolConfig):
             raise ValueError(f"{class_name} not found in local")
         else:
             if class_name == "KnowledgeBaseSearchTool":
-                # Filter out conflicting parameters from params to avoid conflicts
-                # These parameters have exclude=True and cannot be passed to __init__
-                # due to smolagents.tools.Tool wrapper restrictions
+                # Filter out conflicting parameters from params to avoid conflicts.
+                # Parameters declared with exclude=True cannot be passed to __init__
+                # due to smolagents.tools.Tool wrapper restrictions; they are set as
+                # attributes on the instance after construction, sourced from metadata.
+                # `document_paths` is intentionally hidden from the LLM and only
+                # populated via tool_params from the northbound interface.
                 filtered_params = {k: v for k, v in params.items()
-                                   if k not in ["vdb_core", "embedding_model", "observer", "rerank_model", "display_name_to_index_map"]}
+                                   if k not in ["vdb_core", "embedding_model", "observer",
+                                                 "rerank_model", "display_name_to_index_map",
+                                                 "document_paths"]}
                 # Create instance with only non-excluded parameters
                 tools_obj = tool_class(**filtered_params)
                 # Set excluded parameters directly as attributes after instantiation
@@ -218,6 +221,13 @@ def create_local_tool(self, tool_config: ToolConfig):
                     "rerank_model", None) if tool_config.metadata else None
                 tools_obj.display_name_to_index_map = tool_config.metadata.get(
                     "display_name_to_index_map", {}) if tool_config.metadata else {}
+                # Internal access control: restrict results to documents whose
+                # path_or_url is in the allow list. Only the northbound interface
+                # may populate this; never the LLM.
+                tools_obj.set_document_paths(
+                    tool_config.metadata.get(
+                        "document_paths") if tool_config.metadata else None
+                )
             elif class_name in ["DifySearchTool", "DataMateSearchTool"]:
                 # These parameters have exclude=True and cannot be passed to __init__
                 filtered_params = {k: v for k, v in params.items()
@@ -253,6 +263,19 @@ def create_local_tool(self, tool_config: ToolConfig):
                                        storage_client=tool_config.metadata.get("storage_client", []),
                                        validate_url_access=validate_url_access,
                                        **params)
+            elif class_name in ["StoreMemoryTool", "SearchMemoryTool"]:
+                tools_obj = tool_class()
+                tools_obj.observer = self.observer
+                tools_obj.memory_config = tool_config.metadata.get(
+                    "memory_config", {}) if tool_config.metadata else {}
+                tools_obj.tenant_id = tool_config.metadata.get(
+                    "tenant_id", "") if tool_config.metadata else ""
+                tools_obj.user_id = tool_config.metadata.get(
+                    "user_id", "") if tool_config.metadata else ""
+                tools_obj.agent_id = tool_config.metadata.get(
+                    "agent_id", "") if tool_config.metadata else ""
+                tools_obj.memory_user_config = tool_config.metadata.get(
+                    "memory_user_config", None) if tool_config.metadata else None
             else:
                 tools_obj = tool_class(**params)
                 if hasattr(tools_obj, 'observer'):
@@ -411,6 +434,7 @@ def create_single_agent(self, agent_config: AgentConfig):
                 description=agent_config.description,
                 max_steps=agent_config.max_steps,
                 prompt_templates=prompt_templates,
+                verification_config=agent_config.verification_config,
                 provide_run_summary=agent_config.provide_run_summary,
                 managed_agents=managed_agents_list,
                 additional_authorized_imports=SAFE_PYTHON_INTERPRETER_IMPORTS,
diff --git a/sdk/nexent/core/agents/verification.py b/sdk/nexent/core/agents/verification.py
new file mode 100644
index 000000000..e75f41c42
--- /dev/null
+++ b/sdk/nexent/core/agents/verification.py
@@ -0,0 +1,732 @@
+from __future__ import annotations
+
+import ast
+import json
+import re
+from dataclasses import dataclass, field
+from typing import Any, Dict, List, Optional
+
+from smolagents.models import ChatMessage, MessageRole
+from smolagents.utils import truncate_content
+
+from ...monitor import get_monitoring_manager
+from ..utils.observer import MessageObserver, ProcessType
+from .agent_model import AgentVerificationConfig
+
+
+@dataclass
+class VerificationCheck:
+    name: str
+    passed: bool
+    reason: str = ""
+    fix_hint: str = ""
+
+
+@dataclass
+class VerificationResult:
+    passed: bool
+    severity: str
+    event: str
+    score: float = 1.0
+    phase: str = "pass"
+    failed_criteria: List[str] = field(default_factory=list)
+    repair_instruction: str = ""
+    user_visible_note: str = ""
+    checks: List[VerificationCheck] = field(default_factory=list)
+
+    def to_payload(self, round_number: int = 0, message: Optional[str] = None) -> Dict[str, Any]:
+        return {
+            "phase": self.phase,
+            "event": self.event,
+            "round": round_number,
+            "severity": self.severity,
+            "score": round(float(self.score), 3),
+            "failed_criteria": self.failed_criteria,
+            "repair_instruction": self.repair_instruction,
+            "user_visible_note": self.user_visible_note,
+            "message": message or self.user_visible_note or self.repair_instruction,
+            "passed": self.passed,
+        }
+
+
+class _SilentObserver:
+    """Observer shim used to prevent verifier LLM tokens from appearing in chat UI."""
+
+    current_mode = ProcessType.MODEL_OUTPUT_THINKING
+
+    def add_model_new_token(self, _new_token):
+        return None
+
+    def add_model_reasoning_content(self, _reasoning_content):
+        return None
+
+    def flush_remaining_tokens(self):
+        return None
+
+
+class VerificationController:
+    """Layered verification for critical ReAct events and final answers."""
+
+    _ERROR_RE = re.compile(
+        r"(traceback|exception|error:|failed|timeout|unauthorized|permission denied)",
+        re.IGNORECASE,
+    )
+    _EMPTY_RE = re.compile(r"^\s*(execution logs:\s*)?(last output from code snippet:\s*)?\s*$", re.IGNORECASE)
+    _RAW_TAG_RE = re.compile(r"</?(code|RUN)>|<DISPLAY:[^>]+>|</DISPLAY>", re.IGNORECASE)
+    _CITATION_RE = re.compile(r"\[\[[a-e]\d+\]\]")
+    _LIGHTWEIGHT_CONVERSATION_RE = re.compile(
+        r"^\s*(你好|您好|嗨|哈喽|hello|hi|hey|早上好|上午好|中午好|下午好|晚上好|"
+        r"在吗|你是谁|你会干什么|介绍一下你自己|谢谢|好的|好|可以|没事|再见|"
+        r"thanks|thank you|ok|bye)\s*[。！？!?.]*\s*$",
+        re.IGNORECASE,
+    )
+    _EVIDENCE_DEMAND_RE = re.compile(
+        r"(搜索|检索|查询|查找|分析|调研|根据|基于|引用|证据|来源|文档|文件|代码|项目|数据库|"
+        r"最新|今天|昨天|现在|当前|执行|运行|部署|修复|报错|日志|search|retrieve|cite|source|"
+        r"evidence|file|code|database|latest|today|run|execute|deploy|error|log)",
+        re.IGNORECASE,
+    )
+
+    def __init__(
+        self,
+        config: AgentVerificationConfig,
+        observer: MessageObserver,
+        agent_name: str,
+        model: Any,
+        logger: Any = None,
+    ) -> None:
+        self.config = config
+        self.observer = observer
+        self.agent_name = agent_name
+        self.model = model
+        self.logger = logger
+
+    def is_enabled(self) -> bool:
+        return bool(self.config and self.config.enabled)
+
+    def emit(self, result: VerificationResult, round_number: int = 0, message: Optional[str] = None) -> None:
+        if not self.is_enabled():
+            return
+        try:
+            display_message = message or self._build_display_message(result)
+            self.observer.add_message(
+                self.agent_name,
+                ProcessType.VERIFICATION,
+                json.dumps(result.to_payload(round_number, display_message), ensure_ascii=False),
+            )
+        except Exception:
+            if self.logger:
+                self.logger.log("Failed to emit verification event")
+
+    def _build_display_message(self, result: VerificationResult) -> str:
+        if result.passed and result.phase in {"pass", "final_pass"}:
+            prefix = "最终自检通过" if result.phase == "final_pass" else "基础自检通过"
+            summary = self._build_pass_summary(result)
+            return f"{prefix}：{summary}" if summary else prefix
+
+        if result.phase in {"warning", "blocked", "repair", "final_fail"}:
+            note = result.user_visible_note or result.repair_instruction
+            if note:
+                prefix = {
+                    "warning": "自检发现需关注项",
+                    "blocked": "自检已阻断",
+                    "repair": "自检未通过，正在修正",
+                    "final_fail": "最终自检未通过",
+                }.get(result.phase, "自检提示")
+                return f"{prefix}：{note}"
+
+        return result.user_visible_note or result.repair_instruction or ""
+
+    def _build_pass_summary(self, result: VerificationResult) -> str:
+        if result.event == "tool_precheck":
+            return "动作非空、语法正常，未发现越权风险"
+        if result.event == "retrieval":
+            return "检索返回可用内容，未发现错误信号"
+        if result.event == "handoff":
+            return "子任务返回可用结论，未发现错误信号"
+        if result.event in {"tool_result", "code_execution"}:
+            return "执行结果非空，未发现错误信号"
+
+        if result.event == "final_answer":
+            if "Lightweight conversational task" in (result.user_visible_note or ""):
+                return "轻量对话无需外部证据，答案非空且格式正常"
+
+            labels = self._passed_check_labels(result.checks)
+            if labels:
+                return "、".join(labels[:3])
+            if result.user_visible_note:
+                return result.user_visible_note
+            return "答案满足当前任务要求，未发现阻断问题"
+
+        labels = self._passed_check_labels(result.checks)
+        return "、".join(labels[:3])
+
+    def _passed_check_labels(self, checks: List[VerificationCheck]) -> List[str]:
+        label_map = {
+            "non_empty_code": "动作非空",
+            "python_syntax": "语法正常",
+            "action_scope": "未发现越权风险",
+            "tool_relevance_signal": "动作与任务相关",
+            "observation_present": "结果非空",
+            "tool_error_handled": "未发现未处理错误",
+            "retrieval_has_evidence": "检索证据可用",
+            "handoff_has_substance": "子任务结论可用",
+            "final_answer_non_empty": "答案非空",
+            "no_unresolved_raw_tags": "无内部标记",
+            "no_unresolved_placeholders": "无占位符",
+            "previous_errors_acknowledged": "未发现未处理错误",
+            "intent_coverage": "覆盖用户目标",
+            "evidence_grounding": "证据支撑充分",
+            "citation_integrity": "引用格式正常",
+            "format_safety": "格式安全",
+            "tool_error_handling": "工具错误已处理",
+        }
+        ordered_names = [
+            "intent_coverage",
+            "evidence_grounding",
+            "tool_error_handling",
+            "citation_integrity",
+            "format_safety",
+            "final_answer_non_empty",
+            "no_unresolved_raw_tags",
+            "no_unresolved_placeholders",
+            "previous_errors_acknowledged",
+            "observation_present",
+            "tool_error_handled",
+            "retrieval_has_evidence",
+            "handoff_has_substance",
+            "non_empty_code",
+            "python_syntax",
+            "action_scope",
+            "tool_relevance_signal",
+        ]
+        passed_names = {check.name for check in checks if check.passed}
+        return [label_map[name] for name in ordered_names if name in passed_names and name in label_map]
+
+    def verify_before_tool_call(
+        self,
+        code_action: str,
+        step_number: int,
+        available_tool_names: Optional[List[str]] = None,
+    ) -> VerificationResult:
+        if not self._should_verify_step("tool_precheck"):
+            return self._pass("tool_precheck")
+
+        checks: List[VerificationCheck] = []
+        code_text = code_action or ""
+
+        checks.append(VerificationCheck(
+            name="non_empty_code",
+            passed=bool(code_text.strip()),
+            reason="" if code_text.strip() else "The generated action code is empty.",
+            fix_hint="Generate a concrete tool call or a final answer.",
+        ))
+
+        syntax_ok = True
+        try:
+            ast.parse(code_text)
+        except SyntaxError as exc:
+            syntax_ok = False
+            checks.append(VerificationCheck(
+                name="python_syntax",
+                passed=False,
+                reason=f"Python syntax error: {exc}",
+                fix_hint="Rewrite the action as valid Python inside <code>...</code>.",
+            ))
+        if syntax_ok:
+            checks.append(VerificationCheck(name="python_syntax", passed=True))
+
+        dangerous_terms = [
+            "__import__",
+            "eval(",
+            "exec(",
+            "subprocess",
+            "os.system",
+            "shutil.rmtree",
+            "socket.",
+        ]
+        dangerous_hits = [term for term in dangerous_terms if term in code_text]
+        checks.append(VerificationCheck(
+            name="action_scope",
+            passed=not dangerous_hits,
+            reason=f"Potentially unsafe code terms: {', '.join(dangerous_hits)}" if dangerous_hits else "",
+            fix_hint="Use the platform-provided tools instead of direct system or network operations.",
+        ))
+
+        if "final_answer(" not in code_text and available_tool_names:
+            used_tools = [name for name in available_tool_names if re.search(rf"\b{re.escape(name)}\s*\(", code_text)]
+            checks.append(VerificationCheck(
+                name="tool_relevance_signal",
+                passed=bool(used_tools) or "print(" in code_text,
+                reason="" if used_tools or "print(" in code_text else "No known tool call or printed observation was detected.",
+                fix_hint="Call a relevant tool with keyword arguments, or print the evidence needed for the next step.",
+            ))
+
+        return self._result_from_checks(
+            event="tool_precheck",
+            checks=checks,
+            blocking_names={"non_empty_code", "python_syntax", "action_scope"},
+            step_number=step_number,
+        )
+
+    def verify_after_tool_call(
+        self,
+        code_action: str,
+        observation: str,
+        step_number: int,
+        is_final_answer: bool = False,
+    ) -> VerificationResult:
+        event = self._classify_step_event(code_action, is_final_answer)
+        if not self._should_verify_step(event):
+            return self._pass(event)
+
+        observation_text = observation or ""
+        checks = [
+            VerificationCheck(
+                name="observation_present",
+                passed=not self._EMPTY_RE.match(observation_text),
+                reason="" if observation_text.strip() else "The action produced no visible observation.",
+                fix_hint="Retry with better parameters, inspect tool errors, or explain that evidence is unavailable.",
+            ),
+            VerificationCheck(
+                name="tool_error_handled",
+                passed=not self._ERROR_RE.search(observation_text),
+                reason="The observation contains an error signal." if self._ERROR_RE.search(observation_text) else "",
+                fix_hint="Do not ignore this tool error. Diagnose it, retry safely, or state the limitation.",
+            ),
+        ]
+
+        if event == "retrieval":
+            checks.append(VerificationCheck(
+                name="retrieval_has_evidence",
+                passed=not self._looks_empty_retrieval(observation_text),
+                reason="Retrieval appears empty or has no usable evidence." if self._looks_empty_retrieval(observation_text) else "",
+                fix_hint="Search again with refined terms or say that supporting evidence was not found.",
+            ))
+
+        if event == "handoff":
+            checks.append(VerificationCheck(
+                name="handoff_has_substance",
+                passed=not self._looks_empty_handoff(observation_text),
+                reason="The delegated agent returned no useful result." if self._looks_empty_handoff(observation_text) else "",
+                fix_hint="Reassign a narrower task or proceed with clearly stated limitations.",
+            ))
+
+        return self._result_from_checks(
+            event=event,
+            checks=checks,
+            blocking_names=set(),
+            step_number=step_number,
+        )
+
+    def verify_before_final_answer(
+        self,
+        candidate: Any,
+        observation: str,
+        step_number: int,
+    ) -> VerificationResult:
+        if not self.is_enabled() or not self.config.final_verification_enabled:
+            return self._pass("final_answer")
+
+        answer = "" if candidate is None else str(candidate)
+        observation_text = observation or ""
+        recent_error_signal = self._has_recent_error_signal(observation_text)
+        checks = [
+            VerificationCheck(
+                name="final_answer_non_empty",
+                passed=bool(answer.strip()),
+                reason="" if answer.strip() else "The final answer candidate is empty.",
+                fix_hint="Produce a concise answer or an explicit inability summary.",
+            ),
+            VerificationCheck(
+                name="no_unresolved_raw_tags",
+                passed=not self._RAW_TAG_RE.search(answer),
+                reason="The final answer still contains internal execution/display tags." if self._RAW_TAG_RE.search(answer) else "",
+                fix_hint="Convert internal tags to user-facing Markdown before answering.",
+            ),
+            VerificationCheck(
+                name="no_unresolved_placeholders",
+                passed=not any(marker in answer for marker in ["{{", "}}", "<TODO>", "TODO:"]),
+                reason="The final answer contains unresolved placeholders." if any(marker in answer for marker in ["{{", "}}", "<TODO>", "TODO:"]) else "",
+                fix_hint="Replace placeholders with real content or remove them.",
+            ),
+            VerificationCheck(
+                name="previous_errors_acknowledged",
+                passed=not recent_error_signal or self._mentions_limitation(answer),
+                reason="A recent error signal is not acknowledged in the final answer." if recent_error_signal and not self._mentions_limitation(answer) else "",
+                fix_hint="Acknowledge the failed operation, retry, or state what could not be verified.",
+            ),
+        ]
+
+        return self._result_from_checks(
+            event="final_answer",
+            checks=checks,
+            blocking_names={"final_answer_non_empty", "no_unresolved_raw_tags", "no_unresolved_placeholders"},
+            step_number=step_number,
+        )
+
+    def verify_final_answer(
+        self,
+        task: str,
+        candidate: Any,
+        memory_summary: str,
+        round_number: int,
+    ) -> VerificationResult:
+        if not self.is_enabled() or not self.config.final_verification_enabled:
+            return self._pass("final_answer", phase="final_pass")
+
+        start = self._pass("final_answer", phase="start")
+        self.emit(start, round_number, "正在自检最终答案：检查答案完整性、格式和错误处理")
+
+        deterministic = self.verify_before_final_answer(
+            candidate=candidate,
+            observation=memory_summary,
+            step_number=round_number,
+        )
+        if not deterministic.passed:
+            deterministic.phase = "final_fail"
+            self.emit(deterministic, round_number)
+            return deterministic
+
+        if not self.config.llm_verification_enabled:
+            deterministic.phase = "final_pass"
+            self.emit(deterministic, round_number)
+            return deterministic
+
+        policy = self._build_final_verification_policy(task, memory_summary)
+        if policy["task_profile"] == "lightweight_conversation":
+            deterministic.phase = "final_pass"
+            deterministic.user_visible_note = "Lightweight conversational task; deterministic checks passed."
+            self.emit(deterministic, round_number)
+            return deterministic
+
+        llm_result = self._run_llm_verifier(task, candidate, memory_summary, round_number, policy)
+        self.emit(llm_result, round_number)
+        return llm_result
+
+    def build_feedback_observation(self, result: VerificationResult) -> str:
+        failed = ", ".join(result.failed_criteria) if result.failed_criteria else "verification"
+        instruction = result.repair_instruction or "Revise the next action based on the failed verification checks."
+        return (
+            "\nVerification feedback:\n"
+            f"- Event: {result.event}\n"
+            f"- Severity: {result.severity}\n"
+            f"- Failed criteria: {failed}\n"
+            f"- Repair instruction: {instruction}\n"
+        )
+
+    def build_controlled_failure_answer(self, candidate: Any, result: VerificationResult) -> str:
+        note = result.user_visible_note or "最终答案未能通过自验证。"
+        failed = "、".join(result.failed_criteria) if result.failed_criteria else "verification"
+        instruction = result.repair_instruction or "请补充更多信息或放宽任务约束后重试。"
+        if self.config.fail_policy == "warn" and candidate:
+            return f"{candidate}\n\n> 自验证提示：{note}"
+        return (
+            "我无法在当前步骤内给出已通过自验证的确定答案。\n\n"
+            f"- 未通过项：{failed}\n"
+            f"- 原因：{note}\n"
+            f"- 建议：{instruction}"
+        )
+
+    def _should_verify_step(self, event: str) -> bool:
+        return (
+            self.is_enabled()
+            and self.config.step_verification_enabled
+            and event in set(self.config.critical_events)
+        )
+
+    def _run_llm_verifier(
+        self,
+        task: str,
+        candidate: Any,
+        memory_summary: str,
+        round_number: int,
+        policy: Optional[Dict[str, Any]] = None,
+    ) -> VerificationResult:
+        policy = policy or self._build_final_verification_policy(task, memory_summary)
+        monitoring_manager = get_monitoring_manager()
+        attrs = {
+            "agent.verification.event": "final_answer",
+            "agent.verification.round": round_number,
+            "agent.verification.strictness": self.config.strictness,
+            "agent.verification.fail_policy": self.config.fail_policy,
+            "agent.verification.task_profile": policy["task_profile"],
+            "agent.verification.evidence_required": policy["evidence_required"],
+            "agent.verification.tool_error_check_required": policy["tool_error_check_required"],
+        }
+        with monitoring_manager.trace_agent_step(
+            "agent.verify.final_answer",
+            step_type="verification",
+            **attrs,
+        ):
+            messages = self._build_verifier_messages(task, candidate, memory_summary, policy)
+            saved_observer = getattr(self.model, "observer", None)
+            if saved_observer is not None:
+                try:
+                    self.model.observer = _SilentObserver()
+                except Exception:
+                    pass
+            try:
+                chat_message: ChatMessage = self.model(messages)
+                content = chat_message.content or ""
+                result = self._parse_llm_verifier_result(content, policy)
+                monitoring_manager.add_span_event(
+                    "agent.verification.result",
+                    {
+                        "agent.verification.status": result.phase,
+                        "agent.verification.score": result.score,
+                        "agent.verification.failed_criteria": json.dumps(result.failed_criteria, ensure_ascii=False),
+                    },
+                )
+                return result
+            except Exception as exc:
+                if self.logger:
+                    self.logger.log(f"LLM verifier unavailable: {exc}")
+                result = VerificationResult(
+                    passed=True,
+                    severity="warning",
+                    event="final_answer",
+                    phase="final_pass",
+                    score=0.75,
+                    failed_criteria=["verifier_unavailable"],
+                    user_visible_note="Verifier was unavailable; deterministic checks passed.",
+                )
+                monitoring_manager.add_span_event(
+                    "agent.verification.unavailable",
+                    {"error.type": type(exc).__name__, "error.message": str(exc)},
+                )
+                return result
+            finally:
+                if saved_observer is not None:
+                    try:
+                        self.model.observer = saved_observer
+                    except Exception:
+                        pass
+
+    def _build_verifier_messages(
+        self,
+        task: str,
+        candidate: Any,
+        memory_summary: str,
+        policy: Optional[Dict[str, Any]] = None,
+    ) -> List[ChatMessage]:
+        policy = policy or self._build_final_verification_policy(task, memory_summary)
+        clean_memory_summary = self._strip_internal_verification_feedback(memory_summary or "")
+        system_prompt = (
+            "You are a strict answer verifier for a ReAct agent. "
+            "Check only the evidence shown to you. Do not reveal chain-of-thought. "
+            "Return JSON only with keys: passed, score, status, failed_criteria, checks, "
+            "revision_instruction, user_visible_note. "
+            "Criteria: intent_coverage, evidence_grounding, tool_error_handling, citation_integrity, format_safety. "
+            "Apply criteria conditionally: for lightweight conversational tasks such as greetings or capability chat, "
+            "do not require external observations, citations, tool calls, or retrieval evidence. "
+            "Only fail evidence_grounding when evidence_required is true. "
+            "Only fail tool_error_handling when tool_error_check_required is true and the answer ignores an actual "
+            "tool/code execution error in the evidence summary."
+        )
+        user_prompt = json.dumps(
+            {
+                "task": truncate_content(str(task), max_length=4000),
+                "candidate_answer": truncate_content(str(candidate), max_length=4000),
+                "react_evidence_summary": truncate_content(clean_memory_summary, max_length=6000),
+                "task_profile": policy["task_profile"],
+                "evidence_required": policy["evidence_required"],
+                "tool_error_check_required": policy["tool_error_check_required"],
+                "pass_score": self.config.pass_score,
+                "strictness": self.config.strictness,
+            },
+            ensure_ascii=False,
+        )
+        return [
+            ChatMessage(role=MessageRole.SYSTEM, content=[{"type": "text", "text": system_prompt}]),
+            ChatMessage(role=MessageRole.USER, content=[{"type": "text", "text": user_prompt}]),
+        ]
+
+    def _parse_llm_verifier_result(
+        self,
+        content: str,
+        policy: Optional[Dict[str, Any]] = None,
+    ) -> VerificationResult:
+        policy = policy or {
+            "task_profile": "unknown",
+            "evidence_required": True,
+            "tool_error_check_required": True,
+        }
+        data = self._extract_json(content)
+        passed = bool(data.get("passed"))
+        score = float(data.get("score", 0.0))
+        status = str(data.get("status") or ("pass" if passed else "revise"))
+        failed_criteria = data.get("failed_criteria") or []
+        if not isinstance(failed_criteria, list):
+            failed_criteria = [str(failed_criteria)]
+        failed_criteria = [str(item) for item in failed_criteria]
+        ignored_criteria = set()
+        if not policy.get("evidence_required", True):
+            ignored_criteria.add("evidence_grounding")
+        if not policy.get("tool_error_check_required", True):
+            ignored_criteria.add("tool_error_handling")
+        effective_failed_criteria = [
+            criterion for criterion in failed_criteria if criterion not in ignored_criteria
+        ]
+
+        checks = []
+        for item in data.get("checks") or []:
+            if isinstance(item, dict):
+                name = str(item.get("name", "unknown"))
+                check_passed = bool(item.get("passed"))
+                if name in ignored_criteria:
+                    check_passed = True
+                checks.append(VerificationCheck(
+                    name=name,
+                    passed=check_passed,
+                    reason=str(item.get("reason", "")),
+                    fix_hint=str(item.get("fix_hint", "")),
+                ))
+
+        threshold_passed = score >= self.config.pass_score
+        if failed_criteria and not effective_failed_criteria:
+            passed = True
+            score = max(score, self.config.pass_score)
+            threshold_passed = True
+            status = "pass"
+        effective_passed = passed and threshold_passed
+        severity = "info" if effective_passed else "blocking"
+        return VerificationResult(
+            passed=effective_passed,
+            severity=severity,
+            event="final_answer",
+            phase="final_pass" if effective_passed else "final_fail",
+            score=score,
+            failed_criteria=effective_failed_criteria if effective_failed_criteria else ([] if effective_passed else ["llm_verifier"]),
+            repair_instruction=str(data.get("revision_instruction") or data.get("repair_instruction") or ""),
+            user_visible_note=str(data.get("user_visible_note") or ""),
+            checks=checks,
+        )
+
+    def _extract_json(self, content: str) -> Dict[str, Any]:
+        text = (content or "").strip()
+        if text.startswith("```"):
+            text = re.sub(r"^```(?:json)?\s*", "", text)
+            text = re.sub(r"\s*```$", "", text)
+        try:
+            return json.loads(text)
+        except json.JSONDecodeError:
+            start = text.find("{")
+            end = text.rfind("}")
+            if start >= 0 and end > start:
+                return json.loads(text[start:end + 1])
+            raise
+
+    def _result_from_checks(
+        self,
+        event: str,
+        checks: List[VerificationCheck],
+        blocking_names: set[str],
+        step_number: int,
+    ) -> VerificationResult:
+        failed = [check for check in checks if not check.passed]
+        blocking_failed = [check for check in failed if check.name in blocking_names]
+        should_block = bool(blocking_failed) or (self.config.strictness == "strict" and bool(failed))
+        passed = not should_block
+        severity = "info" if not failed else ("blocking" if should_block else "warning")
+        phase = "pass" if not failed else ("blocked" if should_block else "warning")
+        score = max(0.0, 1.0 - 0.15 * len(failed) - 0.35 * len(blocking_failed))
+        failed_names = [check.name for check in failed]
+        repair_instruction = " ".join(check.fix_hint for check in failed if check.fix_hint).strip()
+        user_visible_note = "；".join(check.reason for check in failed if check.reason).strip()
+        result = VerificationResult(
+            passed=passed,
+            severity=severity,
+            event=event,
+            score=score,
+            phase=phase,
+            failed_criteria=failed_names,
+            repair_instruction=repair_instruction,
+            user_visible_note=user_visible_note,
+            checks=checks,
+        )
+        monitoring_manager = get_monitoring_manager()
+        with monitoring_manager.trace_agent_step(
+            "agent.verify.step",
+            step_type="verification",
+            **{
+                "agent.verification.event": event,
+                "agent.verification.step_number": step_number,
+                "agent.verification.status": phase,
+                "agent.verification.severity": severity,
+                "agent.verification.score": score,
+                "agent.verification.failed_criteria": json.dumps(failed_names, ensure_ascii=False),
+            },
+        ):
+            monitoring_manager.add_span_event(
+                "agent.verification.result",
+                {
+                    "agent.verification.passed": passed,
+                    "agent.verification.failed_criteria": json.dumps(failed_names, ensure_ascii=False),
+                },
+            )
+        self.emit(result, step_number)
+        return result
+
+    def _build_final_verification_policy(self, task: str, memory_summary: str) -> Dict[str, Any]:
+        clean_memory_summary = self._strip_internal_verification_feedback(memory_summary or "")
+        lightweight = self._is_lightweight_conversation_task(task)
+        evidence_required = (not lightweight) and bool(self._EVIDENCE_DEMAND_RE.search(task or ""))
+        return {
+            "task_profile": "lightweight_conversation" if lightweight else "task_oriented",
+            "evidence_required": evidence_required,
+            "tool_error_check_required": self._has_recent_error_signal(clean_memory_summary),
+        }
+
+    def _is_lightweight_conversation_task(self, task: str) -> bool:
+        text = (task or "").strip()
+        if not text:
+            return False
+        if self._LIGHTWEIGHT_CONVERSATION_RE.match(text):
+            return True
+        return False
+
+    def _strip_internal_verification_feedback(self, text: str) -> str:
+        lines = (text or "").splitlines()
+        cleaned: List[str] = []
+        skipping = False
+        for line in lines:
+            if line.strip() == "Verification feedback:":
+                skipping = True
+                continue
+            if skipping:
+                if not line.strip() or line.lstrip().startswith("- "):
+                    continue
+                skipping = False
+            cleaned.append(line)
+        return "\n".join(cleaned)
+
+    def _has_recent_error_signal(self, text: str) -> bool:
+        clean_text = self._strip_internal_verification_feedback(text or "")
+        return bool(self._ERROR_RE.search(clean_text))
+
+    def _classify_step_event(self, code_action: str, is_final_answer: bool) -> str:
+        if is_final_answer:
+            return "final_answer"
+        code = code_action or ""
+        lowered = code.lower()
+        if "knowledge_base_search" in lowered or "search(" in lowered or "_search" in lowered:
+            return "retrieval"
+        if "task=" in code and re.search(r"\w+\s*\(\s*task\s*=", code):
+            return "handoff"
+        return "code_execution"
+
+    def _pass(self, event: str, phase: str = "pass") -> VerificationResult:
+        return VerificationResult(passed=True, severity="info", event=event, phase=phase)
+
+    def _looks_empty_retrieval(self, text: str) -> bool:
+        lowered = (text or "").lower()
+        return any(marker in lowered for marker in ["no result", "no results", "[]", "未找到", "无结果", "没有找到"])
+
+    def _looks_empty_handoff(self, text: str) -> bool:
+        lowered = (text or "").lower()
+        return any(marker in lowered for marker in ["cannot help", "unable", "no answer", "无法", "不能", "空"])
+
+    def _mentions_limitation(self, answer: str) -> bool:
+        lowered = (answer or "").lower()
+        return any(marker in lowered for marker in ["无法", "失败", "错误", "未能", "cannot", "unable", "failed", "error", "limitation"])
diff --git a/sdk/nexent/core/tools/__init__.py b/sdk/nexent/core/tools/__init__.py
index a640cb5ff..c35991f6e 100644
--- a/sdk/nexent/core/tools/__init__.py
+++ b/sdk/nexent/core/tools/__init__.py
@@ -24,6 +24,8 @@
 from .run_skill_script_tool import run_skill_script
 from .read_skill_md_tool import read_skill_md
 from .read_skill_config_tool import read_skill_config
+from .store_memory_tool import StoreMemoryTool
+from .search_memory_tool import SearchMemoryTool
 
 __all__ = [
     "MySqlTool",
@@ -53,5 +55,7 @@
     "AnalyzeVideoTool",
     "run_skill_script",
     "read_skill_md",
-    "read_skill_config"
+    "read_skill_config",
+    "StoreMemoryTool",
+    "SearchMemoryTool",
 ]
diff --git a/sdk/nexent/core/tools/knowledge_base_search_tool.py b/sdk/nexent/core/tools/knowledge_base_search_tool.py
index 3405be833..c0115a0ab 100644
--- a/sdk/nexent/core/tools/knowledge_base_search_tool.py
+++ b/sdk/nexent/core/tools/knowledge_base_search_tool.py
@@ -21,6 +21,21 @@
 logger = logging.getLogger("knowledge_base_search_tool")
 
 
+def _unwrap_field_info(value):
+    """Resolve a value that may be wrapped in a Pydantic FieldInfo.
+
+    Parameters declared with `Field(...)` and `exclude=True` are not expanded by
+    smolagents' Tool wrapper, so they arrive at `__init__` as raw FieldInfo
+    instances instead of their declared defaults. This helper extracts the
+    concrete value so callers can safely treat the result as plain data.
+    """
+    if isinstance(value, FieldInfo):
+        if value.default_factory is not None:
+            return value.default_factory()
+        return value.default
+    return value
+
+
 class KnowledgeBaseSearchTool(Tool):
     """Knowledge base search tool"""
 
@@ -48,6 +63,10 @@ class KnowledgeBaseSearchTool(Tool):
         },
     }
 
+    # Internal parameter: restricts search results to specified document paths only.
+    # Not exposed to LLM, only settable via tool_params from /chat/run.
+    _internal_document_paths: Optional[List[str]] = None
+
     init_param_descriptions = {
         "top_k": {
             "description": "Maximum number of search results",
@@ -96,6 +115,10 @@ def __init__(
         display_name_to_index_map: dict = Field(
             description="Mapping from display_name (knowledge_name) to index_name",
             default_factory=dict, exclude=True),
+        # Internal parameter: not exposed to LLM, only settable via tool_params from /chat/run.
+        document_paths: Optional[List[str]] = Field(
+            description="Internal: restrict results to documents with these path_or_urls", default=None, exclude=True
+        ),
     ):
         """Initialize the KBSearchTool.
 
@@ -121,11 +144,26 @@ def __init__(
         self.rerank_model = rerank_model
         self.data_process_service = os.getenv("DATA_PROCESS_SERVICE")
         self.display_name_to_index_map = display_name_to_index_map
+        # `document_paths` is declared with `exclude=True` so smolagents passes the
+        # raw FieldInfo default when no value is supplied. Unwrap it here so the
+        # internal filter is always a concrete list (or None), never a FieldInfo.
+        self._internal_document_paths = _unwrap_field_info(document_paths)
 
         self.record_ops = 1
         self.running_prompt_zh = "知识库检索中..."
         self.running_prompt_en = "Searching the knowledge base..."
 
+    def set_document_paths(self, document_paths: Optional[List[str]]) -> None:
+        """Set the internal document_paths filter for access control.
+
+        This method is intended for internal use only, called via tool_params
+        from the /chat/run endpoint. It is NOT exposed to the LLM.
+
+        Args:
+            document_paths: List of allowed document path_or_urls. If None, no filtering is applied.
+        """
+        self._internal_document_paths = _unwrap_field_info(document_paths)
+
     def _convert_to_index_names(self, names: List[str]) -> List[str]:
         """Convert display names (knowledge_name) to index names if necessary.
 
@@ -155,6 +193,36 @@ def _convert_to_index_names(self, names: List[str]) -> List[str]:
                 converted_names.append(name)
         return converted_names
 
+    def _filter_by_document_paths(self, results: List[dict]) -> List[dict]:
+        """Filter search results by allowed document paths for access control.
+
+        If _internal_document_paths is set, only results whose path_or_url is in the
+        allowed list are returned. Results with no path_or_url field are discarded
+        when the filter is active.
+
+        Args:
+            results: List of search result dicts from VDB search
+
+        Returns:
+            Filtered list containing only results with allowed document paths
+        """
+        allowed_paths = _unwrap_field_info(self._internal_document_paths)
+        if not allowed_paths:
+            return results
+
+        filtered = [
+            result for result in results
+            if result.get("path_or_url") in allowed_paths
+        ]
+
+        if filtered:
+            logger.info(
+                "Document paths filter applied: %d/%d results match allowed paths",
+                len(filtered),
+                len(results),
+            )
+        return filtered
+
     def forward(self, query: str, index_names: Optional[List[str]] = None) -> str:
         # Parse index_names from string (always required)
         search_index_names = index_names if index_names is not None else self.index_names
@@ -203,6 +271,9 @@ def forward(self, query: str, index_names: Optional[List[str]] = None) -> str:
         )
         kb_search_results = kb_search_data["results"]
 
+        # Apply document_paths access control: filter out results not in allowed list
+        kb_search_results = self._filter_by_document_paths(kb_search_results)
+
         if not kb_search_results:
             raise Exception("No results found! Try a less restrictive/shorter query.")
 
diff --git a/sdk/nexent/core/tools/search_memory_tool.py b/sdk/nexent/core/tools/search_memory_tool.py
new file mode 100644
index 000000000..4819a7625
--- /dev/null
+++ b/sdk/nexent/core/tools/search_memory_tool.py
@@ -0,0 +1,109 @@
+import asyncio
+import logging
+from typing import Any
+
+from smolagents.tools import Tool
+from pydantic import Field
+
+from ..utils.observer import MessageObserver, ProcessType
+from ..utils.tools_common_message import ToolSign, ToolCategory
+
+logger = logging.getLogger("search_memory_tool")
+
+
+class SearchMemoryTool(Tool):
+    name = "search_memory"
+    description = (
+        "Search long-term memory for relevant information from previous interactions. "
+        "Use this when you need context about the user's preferences, past decisions, "
+        "or previously discussed topics that aren't in the current conversation. "
+        "The system already provides some memory context automatically -- use this tool "
+        "when you need to search for specific information not already available."
+    )
+    description_zh = (
+        "搜索长期记忆中来自之前交互的相关信息。"
+        "当你需要了解用户的偏好、过去的决策或当前对话中未提及的之前讨论过的话题时使用此工具。"
+        "系统已自动提供一些记忆上下文 -- 仅在需要搜索尚未提供的特定信息时使用此工具。"
+    )
+
+    inputs = {
+        "query": {
+            "type": "string",
+            "description": "Natural language query describing what to search for",
+            "description_zh": "描述要搜索内容的自然语言查询"
+        },
+        "top_k": {
+            "type": "integer",
+            "description": "Maximum number of results to return",
+            "description_zh": "返回结果的最大数量",
+            "default": 5,
+            "nullable": True
+        }
+    }
+    output_type = "string"
+    category = ToolCategory.SEARCH.value
+    tool_sign = ToolSign.MEMORY_OPERATION.value
+
+    def __init__(
+        self,
+        memory_config: dict = Field(description="Mem0 configuration", exclude=True),
+        tenant_id: str = Field(description="Tenant ID", default="", exclude=True),
+        user_id: str = Field(description="User ID", default="", exclude=True),
+        agent_id: str = Field(description="Agent ID", default="", exclude=True),
+        memory_user_config: Any = Field(description="User memory preferences", default=None, exclude=True),
+        observer: MessageObserver = Field(description="Message observer", default=None, exclude=True),
+    ):
+        super().__init__()
+        self.memory_config = memory_config
+        self.tenant_id = tenant_id
+        self.user_id = user_id
+        self.agent_id = agent_id
+        self.memory_user_config = memory_user_config
+        self.observer = observer
+        self.running_prompt_en = "Searching memory..."
+        self.running_prompt_zh = "搜索记忆中..."
+
+    def forward(self, query: str, top_k: int = 5) -> str:
+        logger.info(f"[ACTIVE MEMORY] SearchMemoryTool invoked: query={query[:200]}, top_k={top_k}, user_id={self.user_id}, agent_id={self.agent_id}")
+        if self.observer:
+            running_prompt = self.running_prompt_zh if self.observer.lang == "zh" else self.running_prompt_en
+            self.observer.add_message("", ProcessType.TOOL, running_prompt)
+
+        memory_levels = ["tenant", "user", "agent", "user_agent"]
+        if self.memory_user_config.agent_share_option == "never":
+            memory_levels.remove("agent")
+        if self.agent_id in getattr(self.memory_user_config, "disable_agent_ids", []):
+            if "agent" in memory_levels:
+                memory_levels.remove("agent")
+        if self.agent_id in getattr(self.memory_user_config, "disable_user_agent_ids", []):
+            if "user_agent" in memory_levels:
+                memory_levels.remove("user_agent")
+
+        try:
+            from ...memory.memory_service import search_memory_in_levels
+            result = asyncio.run(search_memory_in_levels(
+                query_text=query,
+                memory_config=self.memory_config,
+                tenant_id=self.tenant_id,
+                user_id=self.user_id,
+                agent_id=self.agent_id,
+                top_k=top_k,
+                memory_levels=memory_levels,
+            ))
+
+            items = result.get("results", [])
+            logger.info(f"[ACTIVE MEMORY] SearchMemoryTool completed: found {len(items)} memories, levels={[item.get('memory_level', 'unknown') for item in items]}")
+            if not items:
+                return "No relevant memories found."
+
+            lines = [f"Found {len(items)} relevant memories:"]
+            for i, item in enumerate(items):
+                content = item.get("memory", "") or item.get("content", "")
+                score = item.get("score", 0.0)
+                level = item.get("memory_level", "unknown")
+                lines.append(f"[{i+1}] (score: {score:.2f}, level: {level}) {content}")
+            return "\n".join(lines)
+
+        except Exception as e:
+            logger.error(f"search_memory failed: {e}")
+            return f"Memory search failed: {str(e)}. Continuing without memory results."
diff --git a/sdk/nexent/core/tools/store_memory_tool.py b/sdk/nexent/core/tools/store_memory_tool.py
new file mode 100644
index 000000000..29dbc4a8f
--- /dev/null
+++ b/sdk/nexent/core/tools/store_memory_tool.py
@@ -0,0 +1,110 @@
+import asyncio
+import logging
+from typing import Any
+
+from smolagents.tools import Tool
+from pydantic import Field
+
+from ..utils.observer import MessageObserver, ProcessType
+from ..utils.tools_common_message import ToolSign, ToolCategory
+
+logger = logging.getLogger("store_memory_tool")
+
+
+class StoreMemoryTool(Tool):
+    name = "store_memory"
+    description = (
+        "Save important information to long-term memory for future recall. "
+        "Use this when the user shares personal preferences, facts about themselves, "
+        "project context, or instructions that should persist across conversations. "
+        "Do NOT store transient information like temporary calculations, information "
+        "already in the knowledge base, or data the user explicitly says to forget."
+    )
+    description_zh = (
+        "将重要信息保存到长期记忆中以便未来回忆。"
+        "当用户分享个人偏好、关于自己的事实、项目上下文或应跨对话保留的指令时使用此工具。"
+        "不要存储临时信息，如临时计算结果、知识库中已有的信息或用户明确要求遗忘的数据。"
+    )
+
+    inputs = {
+        "content": {
+            "type": "string",
+            "description": "The information to remember",
+            "description_zh": "需要记住的信息"
+        }
+    }
+    output_type = "string"
+    category = ToolCategory.DATABASE.value
+    tool_sign = ToolSign.MEMORY_OPERATION.value
+
+    def __init__(
+        self,
+        memory_config: dict = Field(description="Mem0 configuration", exclude=True),
+        tenant_id: str = Field(description="Tenant ID", default="", exclude=True),
+        user_id: str = Field(description="User ID", default="", exclude=True),
+        agent_id: str = Field(description="Agent ID", default="", exclude=True),
+        memory_user_config: Any = Field(description="User memory preferences", default=None, exclude=True),
+        observer: MessageObserver = Field(description="Message observer", default=None, exclude=True),
+    ):
+        super().__init__()
+        self.memory_config = memory_config
+        self.tenant_id = tenant_id
+        self.user_id = user_id
+        self.agent_id = agent_id
+        self.memory_user_config = memory_user_config
+        self.observer = observer
+        self.store_count = 0
+        self.max_stores_per_run = 3
+        self.running_prompt_en = "Saving to memory..."
+        self.running_prompt_zh = "保存到记忆中..."
+
+    def forward(self, content: str) -> str:
+        logger.info(f"[ACTIVE MEMORY] StoreMemoryTool invoked: content={content[:200]}, user_id={self.user_id}, agent_id={self.agent_id}, store_count={self.store_count}/{self.max_stores_per_run}")
+        if self.observer:
+            running_prompt = self.running_prompt_zh if self.observer.lang == "zh" else self.running_prompt_en
+            self.observer.add_message("", ProcessType.TOOL, running_prompt)
+
+        if self.store_count >= self.max_stores_per_run:
+            return "Memory storage limit reached for this conversation. Information will be saved automatically at the end."
+
+        levels = ["user_agent", "agent"]
+        if self.memory_user_config.agent_share_option == "never":
+            levels.remove("agent")
+        if self.agent_id in getattr(self.memory_user_config, "disable_user_agent_ids", []):
+            levels = [l for l in levels if l != "user_agent"]
+        if self.agent_id in getattr(self.memory_user_config, "disable_agent_ids", []):
+            levels = [l for l in levels if l != "agent"]
+        if not levels:
+            return "No memory levels available (all disabled by user preferences)."
+
+        try:
+            from ...memory.memory_service import add_memory_in_levels
+            result = asyncio.run(add_memory_in_levels(
+                messages=[{"role": "user", "content": content}],
+                memory_config=self.memory_config,
+                tenant_id=self.tenant_id,
+                user_id=self.user_id,
+                agent_id=self.agent_id,
+                memory_levels=levels,
+            ))
+            self.store_count += 1
+
+            items = result.get("results", [])
+            logger.info(f"[ACTIVE MEMORY] StoreMemoryTool completed: {len(items)} items processed, events={[item.get('event', 'NONE') for item in items]}")
+            if not items:
+                return "No new facts were extracted from the content."
+
+            stored_facts = []
+            for item in items:
+                event = item.get("event", "NONE")
+                text = item.get("memory", "")
+                if event in ("ADD", "UPDATE"):
+                    stored_facts.append(f"[{event}] {text}")
+
+            if not stored_facts:
+                return "The information was already present in memory (no changes needed)."
+            return "Stored successfully:\n" + "\n".join(stored_facts)
+
+        except Exception as e:
+            logger.error(f"store_memory failed: {e}")
+            return f"Failed to store memory: {str(e)}. Continuing without saving."
diff --git a/sdk/nexent/core/utils/observer.py b/sdk/nexent/core/utils/observer.py
index c123b5157..fc45b30aa 100644
--- a/sdk/nexent/core/utils/observer.py
+++ b/sdk/nexent/core/utils/observer.py
@@ -27,6 +27,7 @@ class ProcessType(Enum):
     TOOL = "tool"  # tool name
     MEMORY_SEARCH = "memory_search"  # memory search status
     MAX_STEPS_REACHED = "max_steps_reached"  # agent reached maximum steps limit
+    VERIFICATION = "verification"  # layered ReAct self-verification status
 
 
 # message transformer base class
@@ -159,7 +160,8 @@ def _init_message_transformers(self):
             ProcessType.CARD: default_transformer,
             ProcessType.TOOL: default_transformer,
             ProcessType.MEMORY_SEARCH: default_transformer,
-            ProcessType.MAX_STEPS_REACHED: default_transformer
+            ProcessType.MAX_STEPS_REACHED: default_transformer,
+            ProcessType.VERIFICATION: default_transformer
         }
 
     def add_model_new_token(self, new_token):
diff --git a/sdk/nexent/core/utils/tools_common_message.py b/sdk/nexent/core/utils/tools_common_message.py
index 1d27f6b6d..6b5f2e056 100644
--- a/sdk/nexent/core/utils/tools_common_message.py
+++ b/sdk/nexent/core/utils/tools_common_message.py
@@ -17,6 +17,7 @@ class ToolSign(Enum):
     TERMINAL_OPERATION = "t"  # Terminal operation tool identifier
     MULTIMODAL_OPERATION = "m"  # Multimodal operation tool identifier
     DATABASE_OPERATION = "z"  # Database operation tool identifier
+    MEMORY_OPERATION = "n"      # Memory operation tool identifier
 
 
 # Tool sign mapping for backward compatibility
@@ -33,6 +34,7 @@ class ToolSign(Enum):
     "terminal_operation": ToolSign.TERMINAL_OPERATION.value,
     "multimodal_operation": ToolSign.MULTIMODAL_OPERATION.value,
     "database_operation": ToolSign.DATABASE_OPERATION.value,
+    "memory_operation": ToolSign.MEMORY_OPERATION.value,
 }
 
 # Reverse mapping for lookup
diff --git a/sdk/nexent/memory/memory_core.py b/sdk/nexent/memory/memory_core.py
index 434bf2cb0..c5004c00e 100644
--- a/sdk/nexent/memory/memory_core.py
+++ b/sdk/nexent/memory/memory_core.py
@@ -102,7 +102,9 @@ async def get_memory_instance(memory_config: Dict[str, Any]) -> AsyncMemory:
     # Validate *before* computing hash so we fail fast with human-readable error
     _validate_config(memory_config)
 
-    cache_key = _hash_config(memory_config)
+    config_hash = _hash_config(memory_config)
+    loop = asyncio.get_event_loop()
+    cache_key = f"{config_hash}:{id(loop)}"
 
     async with _get_cache_lock():
         if cache_key in _MEMORY_CACHE:
diff --git a/sdk/nexent/skills/skill_manager.py b/sdk/nexent/skills/skill_manager.py
index 4c05b3c06..c2e50c790 100644
--- a/sdk/nexent/skills/skill_manager.py
+++ b/sdk/nexent/skills/skill_manager.py
@@ -7,6 +7,7 @@
 import shlex
 import shutil
 import subprocess
+import sys
 import tempfile
 import zipfile
 from typing import Any, Dict, List, Optional, Union
@@ -786,9 +787,13 @@ def _run_python_script(self, script_path: str, params: Optional[str]) -> str:
         """
         cmd_parts = shlex.split(params) if params else []
 
+        # Use sys.executable to ensure the script runs in the same Python environment
+        # as the current process, so all installed packages (e.g., python-docx) are available
+        python_executable = sys.executable
+
         try:
             result = subprocess.run(
-                ["python", script_path] + cmd_parts,
+                [python_executable, script_path] + cmd_parts,
                 capture_output=True,
                 text=True,
                 timeout=300,
diff --git a/sdk/pyproject.toml b/sdk/pyproject.toml
index cdb5459b9..e39bbbf5e 100644
--- a/sdk/pyproject.toml
+++ b/sdk/pyproject.toml
@@ -9,12 +9,12 @@ description = "Nexent Agent Framework"
 authors = [
     { name = "Nexent Dev Team" }
 ]
-requires-python = ">=3.10"
+requires-python = ">=3.11,<3.12"
 keywords = ["agent", "ai", "framework"]
 classifiers = [
     "Intended Audience :: Developers",
     "Programming Language :: Python :: 3",
-    "Programming Language :: Python :: 3.10",
+    "Programming Language :: Python :: 3.11",
 ]
 dependencies = [
     "aiofiles>=24.1.0",
@@ -38,8 +38,8 @@ dependencies = [
     "botocore>=1.37.34",
     "python-multipart>=0.0.20",
     "mcpadapt>=0.1.13",
-    "mcp>=1.19.0,<1.23",
-    "fastmcp==2.12.0",
+    "mcp>=1.24.0,<1.30",
+    "fastmcp>=2.14.2,<3.0",
     "docker>=7.0.0",
     "kubernetes>=29.0.0",
     "tiktoken>=0.5.0",
diff --git a/sonar-project.properties b/sonar-project.properties
new file mode 100644
index 000000000..7da5cc4c8
--- /dev/null
+++ b/sonar-project.properties
@@ -0,0 +1,5 @@
+sonar.projectKey=ModelEngine-Group_nexent
+sonar.organization=modelengine-group
+
+sonar.exclusions=**/init.sql
+sonar.cpd.exclusions=**/init.sql
\ No newline at end of file
diff --git a/test/backend/agents/test_create_agent_info.py b/test/backend/agents/test_create_agent_info.py
index f650de5d7..083886c1a 100644
--- a/test/backend/agents/test_create_agent_info.py
+++ b/test/backend/agents/test_create_agent_info.py
@@ -47,6 +47,21 @@ class ToolExecutionException(Exception):
 
 consts_model_module = types.ModuleType("consts.model")
 consts_model_module.HistoryItem = HistoryItem
+
+
+class MockAgentToolParamsRequest(BaseModel):
+    """Mock for AgentToolParamsRequest."""
+    tools: Dict[str, Dict[str, Any]] = {}
+
+
+class MockToolParamsRequest(BaseModel):
+    """Mock for ToolParamsRequest."""
+    agents: Dict[str, MockAgentToolParamsRequest] = {}
+
+
+consts_model_module.HistoryItem = HistoryItem
+consts_model_module.AgentToolParamsRequest = MockAgentToolParamsRequest
+consts_model_module.ToolParamsRequest = MockToolParamsRequest
 sys.modules["consts.model"] = consts_model_module
 
 # Mock consts.exceptions module with ValidationError
@@ -63,7 +78,7 @@ class ToolExecutionException(Exception):
     setattr(consts_module, "model", consts_model_module)
     setattr(consts_module, "exceptions", consts_exceptions_module)
 
-# Also add model to consts module attributes
+# Also add model to consts module attributes (with AgentToolParamsRequest and ToolParamsRequest)
 consts_module = sys.modules.get("consts")
 if consts_module:
     setattr(consts_module, "model", consts_model_module)
@@ -150,6 +165,11 @@ def __init__(self, **kwargs):
 
 # Mock external dependencies before imports
 mock_message_observer = MagicMock()
+class MockAgentVerificationConfig:
+    @classmethod
+    def model_validate(cls, value):
+        return value or {}
+
 sys.modules['nexent.core.utils.observer'] = MagicMock(MessageObserver=mock_message_observer)
 sys.modules['nexent.core.agents.agent_model'] = _create_stub_module(
     "nexent.core.agents.agent_model",
@@ -159,6 +179,7 @@ def __init__(self, **kwargs):
     ToolConfig=MagicMock(),
     ExternalA2AAgentConfig=MagicMock(),
     AgentRunInfo=MagicMock(),
+    AgentVerificationConfig=MockAgentVerificationConfig,
     MessageObserver=MagicMock(),
     ContextComponent=_create_stub_component_class("ContextComponent"),
     ToolsComponent=_create_stub_component_class("ToolsComponent"),
@@ -239,6 +260,7 @@ def __init__(self, **kwargs):
 sys.modules['nexent.core.agents.agent_model'].ModelConfig = mock_model_config
 sys.modules['nexent.core.agents.agent_model'].ToolConfig = mock_tool_config
 sys.modules['nexent.core.agents.agent_model'].AgentRunInfo = mock_agent_run_info
+sys.modules['nexent.core.agents.agent_model'].AgentVerificationConfig = MockAgentVerificationConfig
 sys.modules['nexent.core.utils.observer'].MessageObserver = mock_message_observer
 
 # Mock BASE_BUILTIN_MODULES
@@ -293,6 +315,9 @@ def __init__(self, **kwargs):
     _build_internal_s3_url,
     _format_minio_files_for_content,
     _convert_history_with_minio_files,
+    _normalize_tool_params_request,
+    _get_agent_tool_overrides,
+    _merge_tool_params,
 )
 
 # Import HistoryItem for testing (from mocked consts.model)
@@ -301,6 +326,9 @@ def __init__(self, **kwargs):
 # Import ValidationError for testing (from mocked consts.exceptions)
 ValidationError = sys.modules["consts.exceptions"].ValidationError
 
+# Import ToolParamsRequest for testing
+ToolParamsRequest = sys.modules["consts.model"].ToolParamsRequest
+
 # Import constants for testing
 from consts.const import MODEL_CONFIG_MAPPING
 
@@ -736,6 +764,11 @@ async def test_create_tool_config_list_knowledge_base_multimodal(self):
         """Ensure multimodal param is forwarded to embedding model selection."""
         mock_tool_instance = MagicMock()
         mock_tool_instance.class_name = "KnowledgeBaseSearchTool"
+        mock_tool_instance.params = {
+            "index_names": ["idx1", "idx2"],
+            "multimodal": True,
+            "rerank": False,
+        }
 
         with patch('backend.agents.create_agent_info.discover_langchain_tools', return_value=[]), \
                 patch('backend.agents.create_agent_info.search_tools_for_sub_agent') as mock_search_tools, \
@@ -744,7 +777,7 @@ async def test_create_tool_config_list_knowledge_base_multimodal(self):
                 patch('backend.agents.create_agent_info.get_rerank_model') as mock_rerank, \
                 patch('backend.agents.create_agent_info.get_knowledge_name_map_by_index_names') as mock_get_knowledge_map, \
                 patch('backend.agents.create_agent_info.ToolConfig') as mock_tool_config:
-            
+
             mock_tool_config.return_value = mock_tool_instance
 
             mock_search_tools.return_value = [
@@ -755,7 +788,7 @@ async def test_create_tool_config_list_knowledge_base_multimodal(self):
                     "inputs": "string",
                     "output_type": "string",
                     "params": [
-                        {"name": "index_names", "default": ["idx1", "idx2"]},  # 添加这个
+                        {"name": "index_names", "default": ["idx1", "idx2"]},
                         {"name": "multimodal", "default": True},
                         {"name": "rerank", "default": False},
                     ],
@@ -773,9 +806,6 @@ async def test_create_tool_config_list_knowledge_base_multimodal(self):
             assert len(result) == 1
             # Verify get_embedding_model_by_index_name was called with tenant_id and first index_name
             mock_embedding_by_index.assert_called_once_with("tenant_1", "idx1")
-            
-            # Verify that multimodal parameter was removed from params (popped)
-            assert "multimodal" not in result[0].params
 
     @pytest.mark.asyncio
     async def test_create_tool_config_list_with_analyze_image_tool(self):
@@ -897,11 +927,16 @@ async def test_create_tool_config_list_with_analyze_text_file_tool(self):
     @pytest.mark.asyncio
     async def test_create_tool_config_list_with_knowledge_base_tool_metadata(self):
         """
-        Test that KnowledgeBaseSearchTool metadata contains vdb_core, embedding_model, 
+        Test that KnowledgeBaseSearchTool metadata contains vdb_core, embedding_model,
         rerank_model, display_name_to_index_map, and index_name_to_display_map.
         """
         mock_tool_instance = MagicMock()
         mock_tool_instance.class_name = "KnowledgeBaseSearchTool"
+        mock_tool_instance.params = {
+            "index_names": ["idx_a"],
+            "rerank": True,
+            "rerank_model_name": "gte-rerank-v2",
+        }
 
         with patch('backend.agents.create_agent_info.discover_langchain_tools', return_value=[]), \
                 patch('backend.agents.create_agent_info.search_tools_for_sub_agent') as mock_search_tools, \
@@ -944,7 +979,7 @@ async def test_create_tool_config_list_with_knowledge_base_tool_metadata(self):
 
             # Verify correct functions were called with correct parameters
             mock_get_vector_db_core.assert_called_once()
-            # 修改：验证调用时使用 tenant_id 和 index_name
+            # Verify that call uses tenant_id and first index_name
             mock_embedding.assert_called_once_with("tenant_1", "idx_a")
             mock_rerank.assert_called_once_with(tenant_id="tenant_1", model_name="gte-rerank-v2")
             mock_get_knowledge_map.assert_called_once_with(["idx_a"])
@@ -1230,52 +1265,155 @@ async def test_create_tool_config_list_multiple_tools_same_type(self):
             assert mock_tool_2.metadata["display_name_to_index_map"] == {}
 
     @pytest.mark.asyncio
-    async def test_create_tool_config_list_with_dify_tool(self):
-        """Test that DifySearchTool gets correct metadata including rerank model."""
-        mock_tool_instance = MagicMock()
-        mock_tool_instance.class_name = "DifySearchTool"
+    async def test_create_tool_config_list_applies_request_overrides_for_multiple_tools(self):
+        """Request tool_params should override DB params for multiple tools in one agent."""
+        kb_tool = MagicMock()
+        kb_tool.class_name = "KnowledgeBaseSearchTool"
+        kb_tool.params = {
+            "index_names": ["idx_override"],
+            "rerank": True,
+            "rerank_model_name": "gte-rerank-v2",
+            "top_k": 10,
+        }
+        analyze_tool = MagicMock()
+        analyze_tool.class_name = "AnalyzeTextFileTool"
+        analyze_tool.params = {
+            "prompt": "override prompt",
+        }
 
         with patch('backend.agents.create_agent_info.ToolConfig') as mock_tool_config, \
                 patch('backend.agents.create_agent_info.discover_langchain_tools', return_value=[]), \
                 patch('backend.agents.create_agent_info.search_tools_for_sub_agent') as mock_search_tools, \
-                patch('backend.agents.create_agent_info.get_rerank_model') as mock_rerank:
+                patch('backend.agents.create_agent_info.get_vector_db_core') as mock_get_vector_db_core, \
+                patch('backend.agents.create_agent_info.get_embedding_model_by_index_name') as mock_embedding, \
+                patch('backend.agents.create_agent_info.get_rerank_model') as mock_rerank, \
+                patch('backend.agents.create_agent_info.get_knowledge_name_map_by_index_names', return_value={"idx_override": "Override KB"}), \
+                patch('backend.agents.create_agent_info.get_llm_model', return_value='llm-model'):
+            mock_tool_config.side_effect = [kb_tool, analyze_tool]
+            mock_get_vector_db_core.return_value = 'vdb-core'
+            mock_embedding.return_value = ('embedding-model', 1, {'status': 'ok'})
+            mock_rerank.return_value = 'rerank-model'
+            mock_search_tools.return_value = [
+                {
+                    'class_name': 'KnowledgeBaseSearchTool',
+                    'name': 'knowledge_base_search',
+                    'description': 'kb',
+                    'inputs': '{}',
+                    'output_type': 'string',
+                    'params': [
+                        {'name': 'index_names', 'default': ['idx_default']},
+                        {'name': 'rerank', 'default': False},
+                        {'name': 'rerank_model_name', 'default': ''},
+                        {'name': 'top_k', 'default': 5},
+                    ],
+                    'source': 'local',
+                    'usage': None,
+                },
+                {
+                    'class_name': 'AnalyzeTextFileTool',
+                    'name': 'analyze_text_file',
+                    'description': 'text',
+                    'inputs': '{}',
+                    'output_type': 'string',
+                    'params': [
+                        {'name': 'prompt', 'default': 'default prompt'},
+                    ],
+                    'source': 'local',
+                    'usage': None,
+                },
+            ]
 
+            result = await create_tool_config_list(
+                'agent_1',
+                'tenant_1',
+                'user_1',
+                tool_params={
+                    'agents': {
+                        'test_agent': {
+                            'tools': {
+                                'knowledge_base_search': {
+                                    'top_k': 10,
+                                    'rerank': True,
+                                    'rerank_model_name': 'gte-rerank-v2',
+                                    'index_names': ['idx_override'],
+                                },
+                                'analyze_text_file': {
+                                    'prompt': 'override prompt',
+                                },
+                            }
+                        }
+                    }
+                },
+            )
+
+        assert len(result) == 2
+        assert kb_tool.params['top_k'] == 10
+        assert kb_tool.params['rerank'] is True
+        assert kb_tool.params['rerank_model_name'] == 'gte-rerank-v2'
+        assert kb_tool.params['index_names'] == ['idx_override']
+        assert analyze_tool.params['prompt'] == 'override prompt'
+        mock_rerank.assert_called_once_with(tenant_id='tenant_1', model_name='gte-rerank-v2')
+        mock_embedding.assert_called_once_with('tenant_1', 'idx_override')
+
+    @pytest.mark.asyncio
+    async def test_create_tool_config_list_with_tool_params(self):
+        """Test create_tool_config_list with valid tool_params."""
+        mock_tool_instance = MagicMock()
+        mock_tool_instance.class_name = "AnalyzeTextFileTool"
+        mock_tool_instance.params = {
+            "prompt": "override prompt",
+        }
+
+        with patch('backend.agents.create_agent_info.ToolConfig') as mock_tool_config, \
+                patch('backend.agents.create_agent_info.discover_langchain_tools', return_value=[]), \
+                patch('backend.agents.create_agent_info.search_tools_for_sub_agent') as mock_search_tools, \
+                patch('backend.agents.create_agent_info.get_llm_model', return_value='llm-model'):
             mock_tool_config.return_value = mock_tool_instance
-            mock_rerank.return_value = "mock_rerank_model"
 
             mock_search_tools.return_value = [
                 {
-                    "class_name": "DifySearchTool",
-                    "name": "dify_search",
-                    "description": "Dify knowledge search",
-                    "inputs": "string",
-                    "output_type": "string",
-                    "params": [
-                        {"name": "rerank", "default": True},
-                        {"name": "rerank_model_name", "default": "gte-rerank-v2"},
+                    'class_name': 'AnalyzeTextFileTool',
+                    'name': 'analyze_text_file',
+                    'description': 'text',
+                    'inputs': '{}',
+                    'output_type': 'string',
+                    'params': [
+                        {'name': 'prompt', 'default': 'default prompt'},
                     ],
-                    "source": "local",
-                    "usage": None
+                    'source': 'local',
+                    'usage': None,
                 }
             ]
 
-            from backend.agents.create_agent_info import create_tool_config_list
-            result = await create_tool_config_list("agent_1", "tenant_1", "user_1")
-
-            # Verify rerank model was fetched
-            mock_rerank.assert_called_once_with(
-                tenant_id="tenant_1", model_name="gte-rerank-v2"
+            result = await create_tool_config_list(
+                'agent_1',
+                'tenant_1',
+                'user_1',
+                tool_params={
+                    'agents': {
+                        'test_agent': {
+                            'tools': {
+                                'analyze_text_file': {
+                                    'prompt': 'override prompt',
+                                }
+                            }
+                        }
+                    }
+                },
             )
 
-            # Verify metadata
             assert len(result) == 1
             assert result[0] is mock_tool_instance
 
     @pytest.mark.asyncio
-    async def test_create_tool_config_list_with_dify_tool_no_rerank(self):
-        """Test that DifySearchTool without rerank gets None metadata."""
+    async def test_create_tool_config_list_with_dify_tool(self):
+        """Test that DifySearchTool gets correct metadata including rerank model."""
         mock_tool_instance = MagicMock()
         mock_tool_instance.class_name = "DifySearchTool"
+        mock_tool_instance.params = {
+            "rerank": True,
+            "rerank_model_name": "gte-rerank-v2",
+        }
 
         with patch('backend.agents.create_agent_info.ToolConfig') as mock_tool_config, \
                 patch('backend.agents.create_agent_info.discover_langchain_tools', return_value=[]), \
@@ -1283,6 +1421,7 @@ async def test_create_tool_config_list_with_dify_tool_no_rerank(self):
                 patch('backend.agents.create_agent_info.get_rerank_model') as mock_rerank:
 
             mock_tool_config.return_value = mock_tool_instance
+            mock_rerank.return_value = "mock_rerank_model"
 
             mock_search_tools.return_value = [
                 {
@@ -1292,29 +1431,34 @@ async def test_create_tool_config_list_with_dify_tool_no_rerank(self):
                     "inputs": "string",
                     "output_type": "string",
                     "params": [
-                        {"name": "rerank", "default": False},
-                        {"name": "rerank_model_name", "default": ""},
+                        {"name": "rerank", "default": True},
+                        {"name": "rerank_model_name", "default": "gte-rerank-v2"},
                     ],
                     "source": "local",
                     "usage": None
                 }
             ]
 
-            from backend.agents.create_agent_info import create_tool_config_list
             result = await create_tool_config_list("agent_1", "tenant_1", "user_1")
 
-            # Verify rerank model was NOT fetched
-            mock_rerank.assert_not_called()
+            # Verify rerank model was fetched
+            mock_rerank.assert_called_once_with(
+                tenant_id="tenant_1", model_name="gte-rerank-v2"
+            )
 
             # Verify metadata
             assert len(result) == 1
             assert result[0] is mock_tool_instance
 
     @pytest.mark.asyncio
-    async def test_create_tool_config_list_with_datamate_tool(self):
-        """Test that DataMateSearchTool gets correct metadata including rerank model."""
+    async def test_create_tool_config_list_with_dify_tool_no_rerank(self):
+        """Test that DifySearchTool without rerank gets None metadata."""
         mock_tool_instance = MagicMock()
-        mock_tool_instance.class_name = "DataMateSearchTool"
+        mock_tool_instance.class_name = "DifySearchTool"
+        mock_tool_instance.params = {
+            "rerank": False,
+            "rerank_model_name": "",
+        }
 
         with patch('backend.agents.create_agent_info.ToolConfig') as mock_tool_config, \
                 patch('backend.agents.create_agent_info.discover_langchain_tools', return_value=[]), \
@@ -1322,31 +1466,27 @@ async def test_create_tool_config_list_with_datamate_tool(self):
                 patch('backend.agents.create_agent_info.get_rerank_model') as mock_rerank:
 
             mock_tool_config.return_value = mock_tool_instance
-            mock_rerank.return_value = "mock_datamate_rerank_model"
 
             mock_search_tools.return_value = [
                 {
-                    "class_name": "DataMateSearchTool",
-                    "name": "datamate_search",
-                    "description": "DataMate knowledge search",
+                    "class_name": "DifySearchTool",
+                    "name": "dify_search",
+                    "description": "Dify knowledge search",
                     "inputs": "string",
                     "output_type": "string",
                     "params": [
-                        {"name": "rerank", "default": True},
-                        {"name": "rerank_model_name", "default": "jina-rerank-v2"},
+                        {"name": "rerank", "default": False},
+                        {"name": "rerank_model_name", "default": ""},
                     ],
                     "source": "local",
                     "usage": None
                 }
             ]
 
-            from backend.agents.create_agent_info import create_tool_config_list
             result = await create_tool_config_list("agent_1", "tenant_1", "user_1")
 
-            # Verify rerank model was fetched
-            mock_rerank.assert_called_once_with(
-                tenant_id="tenant_1", model_name="jina-rerank-v2"
-            )
+            # Verify rerank model was NOT fetched
+            mock_rerank.assert_not_called()
 
             # Verify metadata
             assert len(result) == 1
@@ -1357,6 +1497,10 @@ async def test_create_tool_config_list_with_datamate_tool_no_rerank(self):
         """Test that DataMateSearchTool without rerank gets None metadata."""
         mock_tool_instance = MagicMock()
         mock_tool_instance.class_name = "DataMateSearchTool"
+        mock_tool_instance.params = {
+            "rerank": False,
+            "rerank_model_name": "",
+        }
 
         with patch('backend.agents.create_agent_info.ToolConfig') as mock_tool_config, \
                 patch('backend.agents.create_agent_info.discover_langchain_tools', return_value=[]), \
@@ -1381,13 +1525,12 @@ async def test_create_tool_config_list_with_datamate_tool_no_rerank(self):
                 }
             ]
 
-            from backend.agents.create_agent_info import create_tool_config_list
             result = await create_tool_config_list("agent_1", "tenant_1", "user_1")
 
             # Verify rerank model was NOT fetched
             mock_rerank.assert_not_called()
 
-            # Verify metadata
+            # Verify result
             assert len(result) == 1
             assert result[0] is mock_tool_instance
 
@@ -1487,7 +1630,7 @@ class TestCreateAgentConfig:
     async def test_create_agent_config_basic(self):
         """Test case for basic agent configuration creation"""
         with patch('backend.agents.create_agent_info.search_agent_info_by_agent_id') as mock_search_agent, \
-                patch('backend.agents.create_agent_info.query_sub_agents_id_list') as mock_query_sub, \
+                patch('backend.agents.create_agent_info.query_sub_agent_relations') as mock_query_sub, \
                 patch('backend.agents.create_agent_info.create_tool_config_list') as mock_create_tools, \
                 patch('backend.agents.create_agent_info.get_agent_prompt_template') as mock_get_template, \
                 patch('backend.agents.create_agent_info.tenant_config_manager') as mock_tenant_config, \
@@ -1538,14 +1681,15 @@ async def test_create_agent_config_basic(self):
                 managed_agents=[],
                 external_a2a_agents=[],
                 context_manager_config=ANY,
-                context_components=ANY
+                context_components=ANY,
+                verification_config=ANY
             )
 
     @pytest.mark.asyncio
     async def test_create_agent_config_with_sub_agents(self):
         """Test case for creating agent configuration with sub-agents"""
         with patch('backend.agents.create_agent_info.search_agent_info_by_agent_id') as mock_search_agent, \
-                patch('backend.agents.create_agent_info.query_sub_agents_id_list') as mock_query_sub, \
+                patch('backend.agents.create_agent_info.query_sub_agent_relations') as mock_query_sub, \
                 patch('backend.agents.create_agent_info.create_tool_config_list') as mock_create_tools, \
                 patch('backend.agents.create_agent_info.get_agent_prompt_template') as mock_get_template, \
                 patch('backend.agents.create_agent_info.tenant_config_manager') as mock_tenant_config, \
@@ -1566,7 +1710,9 @@ async def test_create_agent_config_with_sub_agents(self):
                 "model_id": 123,
                 "provide_run_summary": True
             }
-            mock_query_sub.return_value = ["sub_agent_1"]
+            mock_query_sub.return_value = [
+                {"selected_agent_id": "sub_agent_1", "selected_agent_version_no": None}
+            ]
             mock_create_tools.return_value = []
             mock_get_template.return_value = {
                 "system_prompt": "{{duty}} {{constraint}} {{few_shots}}"}
@@ -1607,14 +1753,74 @@ async def test_create_agent_config_with_sub_agents(self):
                     managed_agents=[mock_sub_agent_config],
                     external_a2a_agents=[],
                     context_manager_config=ANY,
-                    context_components=ANY
+                    context_components=ANY,
+                    verification_config=ANY
                 )
 
+    @pytest.mark.asyncio
+    async def test_create_agent_config_with_pinned_sub_agent_version(self):
+        """Test sub-agent config uses pinned selected_agent_version_no from relation"""
+        with patch('backend.agents.create_agent_info.search_agent_info_by_agent_id') as mock_search_agent, \
+                patch('backend.agents.create_agent_info.query_sub_agent_relations') as mock_query_sub, \
+                patch('backend.agents.create_agent_info.resolve_sub_agent_version_no', return_value=3) as mock_resolve, \
+                patch('backend.agents.create_agent_info.create_tool_config_list', new_callable=AsyncMock) as mock_create_tools, \
+                patch('backend.agents.create_agent_info.get_agent_prompt_template') as mock_get_template, \
+                patch('backend.agents.create_agent_info.tenant_config_manager') as mock_tenant_config, \
+                patch('backend.agents.create_agent_info.build_memory_context') as mock_build_memory, \
+                patch('backend.agents.create_agent_info.AgentConfig') as mock_agent_config, \
+                patch('backend.agents.create_agent_info.prepare_prompt_templates') as mock_prepare_templates, \
+                patch('backend.agents.create_agent_info.get_model_by_model_id') as mock_get_model_by_id:
+
+            mock_search_agent.return_value = {
+                "name": "test_agent",
+                "description": "test description",
+                "duty_prompt": "test duty",
+                "constraint_prompt": "test constraint",
+                "few_shots_prompt": "test few shots",
+                "max_steps": 5,
+                "model_id": 123,
+                "provide_run_summary": True,
+            }
+            mock_query_sub.return_value = [
+                {"selected_agent_id": 42, "selected_agent_version_no": 3}
+            ]
+            mock_create_tools.return_value = []
+            mock_get_template.return_value = {"system_prompt": "{{duty}}"}
+            mock_tenant_config.get_app_config.side_effect = ["TestApp", "Test Description"]
+            mock_build_memory.return_value = Mock(
+                user_config=Mock(memory_switch=False),
+                memory_config={},
+                tenant_id="tenant_1",
+                user_id="user_1",
+                agent_id="agent_1",
+            )
+            mock_prepare_templates.return_value = {"system_prompt": "populated_system_prompt"}
+            mock_get_model_by_id.return_value = {"display_name": "test_model"}
+
+            mock_sub_agent_config = Mock()
+            mock_sub_agent_config.name = "sub_agent"
+
+            with patch(
+                'backend.agents.create_agent_info.create_agent_config',
+                new_callable=AsyncMock,
+                return_value=mock_sub_agent_config,
+            ) as mock_recursive_create:
+                mock_agent_config.reset_mock()
+                await create_agent_config("agent_1", "tenant_1", "user_1", "zh", "test query", version_no=2)
+
+                mock_resolve.assert_called_once_with(
+                    selected_agent_id=42,
+                    selected_agent_version_no=3,
+                    tenant_id="tenant_1",
+                )
+                mock_recursive_create.assert_called_once()
+                assert mock_recursive_create.call_args.kwargs["version_no"] == 3
+
     @pytest.mark.asyncio
     async def test_create_agent_config_with_memory(self):
         """Test case for creating agent configuration with memory"""
         with patch('backend.agents.create_agent_info.search_agent_info_by_agent_id') as mock_search_agent, \
-                patch('backend.agents.create_agent_info.query_sub_agents_id_list') as mock_query_sub, \
+                patch('backend.agents.create_agent_info.query_sub_agent_relations') as mock_query_sub, \
                 patch('backend.agents.create_agent_info.create_tool_config_list') as mock_create_tools, \
                 patch('backend.agents.create_agent_info.get_agent_prompt_template') as mock_get_template, \
                 patch('backend.agents.create_agent_info.tenant_config_manager') as mock_tenant_config, \
@@ -1678,7 +1884,7 @@ async def test_create_agent_config_memory_disabled_no_search(self):
             "backend.agents.create_agent_info.search_agent_info_by_agent_id"
         ) as mock_search_agent, \
             patch(
-                "backend.agents.create_agent_info.query_sub_agents_id_list"
+                "backend.agents.create_agent_info.query_sub_agent_relations"
             ) as mock_query_sub, \
             patch(
                 "backend.agents.create_agent_info.create_tool_config_list"
@@ -1756,7 +1962,7 @@ async def test_create_agent_config_memory_disabled_no_search(self):
     async def test_create_agent_config_model_id_none(self):
         """Test case for creating agent configuration when model_id is None"""
         with patch('backend.agents.create_agent_info.search_agent_info_by_agent_id') as mock_search_agent, \
-                patch('backend.agents.create_agent_info.query_sub_agents_id_list') as mock_query_sub, \
+                patch('backend.agents.create_agent_info.query_sub_agent_relations') as mock_query_sub, \
                 patch('backend.agents.create_agent_info.create_tool_config_list') as mock_create_tools, \
                 patch('backend.agents.create_agent_info.get_agent_prompt_template') as mock_get_template, \
                 patch('backend.agents.create_agent_info.tenant_config_manager') as mock_tenant_config, \
@@ -1806,7 +2012,8 @@ async def test_create_agent_config_model_id_none(self):
                 managed_agents=[],
                 external_a2a_agents=[],
                 context_manager_config=ANY,
-                context_components=ANY
+                context_components=ANY,
+                verification_config=ANY
             )
 
     @pytest.mark.asyncio
@@ -1817,7 +2024,7 @@ async def test_create_agent_config_memory_exception(self):
                 "backend.agents.create_agent_info.search_agent_info_by_agent_id"
             ) as mock_search_agent,
             patch(
-                "backend.agents.create_agent_info.query_sub_agents_id_list"
+                "backend.agents.create_agent_info.query_sub_agent_relations"
             ) as mock_query_sub,
             patch(
                 "backend.agents.create_agent_info.create_tool_config_list"
@@ -1897,7 +2104,7 @@ async def test_create_agent_config_memory_levels_agent_share_never(self):
                 "backend.agents.create_agent_info.search_agent_info_by_agent_id"
             ) as mock_search_agent,
             patch(
-                "backend.agents.create_agent_info.query_sub_agents_id_list"
+                "backend.agents.create_agent_info.query_sub_agent_relations"
             ) as mock_query_sub,
             patch(
                 "backend.agents.create_agent_info.create_tool_config_list"
@@ -1992,7 +2199,7 @@ async def test_create_agent_config_memory_levels_disable_agent(self):
                 "backend.agents.create_agent_info.search_agent_info_by_agent_id"
             ) as mock_search_agent,
             patch(
-                "backend.agents.create_agent_info.query_sub_agents_id_list"
+                "backend.agents.create_agent_info.query_sub_agent_relations"
             ) as mock_query_sub,
             patch(
                 "backend.agents.create_agent_info.create_tool_config_list"
@@ -2087,7 +2294,7 @@ async def test_create_agent_config_memory_levels_disable_user_agent(self):
                 "backend.agents.create_agent_info.search_agent_info_by_agent_id"
             ) as mock_search_agent,
             patch(
-                "backend.agents.create_agent_info.query_sub_agents_id_list"
+                "backend.agents.create_agent_info.query_sub_agent_relations"
             ) as mock_query_sub,
             patch(
                 "backend.agents.create_agent_info.create_tool_config_list"
@@ -2181,7 +2388,7 @@ async def test_create_agent_config_with_knowledge_base_summary_filtering(self):
                 "backend.agents.create_agent_info.search_agent_info_by_agent_id"
             ) as mock_search_agent,
             patch(
-                "backend.agents.create_agent_info.query_sub_agents_id_list"
+                "backend.agents.create_agent_info.query_sub_agent_relations"
             ) as mock_query_sub,
             patch(
                 "backend.agents.create_agent_info.create_tool_config_list"
@@ -2302,7 +2509,7 @@ async def test_create_agent_config_uses_metadata_index_name_to_display_map(self)
                 "backend.agents.create_agent_info.search_agent_info_by_agent_id"
             ) as mock_search_agent,
             patch(
-                "backend.agents.create_agent_info.query_sub_agents_id_list"
+                "backend.agents.create_agent_info.query_sub_agent_relations"
             ) as mock_query_sub,
             patch(
                 "backend.agents.create_agent_info.create_tool_config_list"
@@ -2413,7 +2620,7 @@ async def test_create_agent_config_metadata_without_index_name_to_display_map(se
                 "backend.agents.create_agent_info.search_agent_info_by_agent_id"
             ) as mock_search_agent,
             patch(
-                "backend.agents.create_agent_info.query_sub_agents_id_list"
+                "backend.agents.create_agent_info.query_sub_agent_relations"
             ) as mock_query_sub,
             patch(
                 "backend.agents.create_agent_info.create_tool_config_list"
@@ -2513,7 +2720,7 @@ async def test_create_agent_config_knowledge_base_summary_no_indexes_message(
                 "backend.agents.create_agent_info.search_agent_info_by_agent_id"
             ) as mock_search_agent,
             patch(
-                "backend.agents.create_agent_info.query_sub_agents_id_list"
+                "backend.agents.create_agent_info.query_sub_agent_relations"
             ) as mock_query_sub,
             patch(
                 "backend.agents.create_agent_info.create_tool_config_list"
@@ -2578,7 +2785,7 @@ async def test_create_agent_config_knowledge_base_summary_no_indexes_message(
     async def test_create_agent_config_knowledge_base_summary_error(self):
         """Test case for error handling during knowledge base summary build"""
         with patch('backend.agents.create_agent_info.search_agent_info_by_agent_id') as mock_search_agent, \
-                patch('backend.agents.create_agent_info.query_sub_agents_id_list') as mock_query_sub, \
+                patch('backend.agents.create_agent_info.query_sub_agent_relations') as mock_query_sub, \
                 patch('backend.agents.create_agent_info.create_tool_config_list') as mock_create_tools, \
                 patch('backend.agents.create_agent_info.get_agent_prompt_template') as mock_get_template, \
                 patch('backend.agents.create_agent_info.tenant_config_manager') as mock_tenant_config, \
@@ -2952,6 +3159,7 @@ async def test_create_agent_run_info_success(self):
                 last_user_query="processed_query",
                 allow_memory_search=True,
                 version_no=1,
+                tool_params=None,
             )
             mock_get_mcp.assert_called_once_with(tenant_id="tenant_1", is_need_auth=True)
             mock_filter.assert_called_once_with("agent_config", {
@@ -3488,6 +3696,7 @@ async def test_create_agent_run_info_forwards_allow_memory_false(self):
                 last_user_query="processed_query",
                 allow_memory_search=False,
                 version_no=1,
+                tool_params=None,
             )
 
     @pytest.mark.asyncio
@@ -3534,6 +3743,7 @@ async def test_create_agent_run_info_is_debug_true(self):
                 last_user_query="processed_query",
                 allow_memory_search=True,
                 version_no=0,  # Debug mode uses draft version 0
+                tool_params=None,
             )
 
     @pytest.mark.asyncio
@@ -3586,6 +3796,7 @@ async def test_create_agent_run_info_no_published_version_fallback(self):
                 last_user_query="processed_query",
                 allow_memory_search=True,
                 version_no=0,  # Fallback to draft version 0
+                tool_params=None,
             )
             # Verify that get_remote_mcp_server_list was called with is_need_auth=True
             mock_get_mcp.assert_called_once_with(tenant_id="tenant_1", is_need_auth=True)
@@ -4250,6 +4461,10 @@ async def test_knowledge_base_with_display_name_to_index_map(self):
         """Test that KnowledgeBaseSearchTool gets correct display_name_to_index_map from index_names"""
         mock_tool_instance = MagicMock()
         mock_tool_instance.class_name = "KnowledgeBaseSearchTool"
+        mock_tool_instance.params = {
+            "index_names": ["idx1", "idx2"],
+            "rerank": False,
+        }
 
         with patch('backend.agents.create_agent_info.ToolConfig') as mock_tool_config, \
                 patch('backend.agents.create_agent_info.discover_langchain_tools', return_value=[]), \
@@ -4511,11 +4726,16 @@ async def test_knowledge_base_empty_index_names_raises_validation_error(self):
         """Test that ValidationError is raised when index_names is empty for KnowledgeBaseSearchTool."""
         mock_tool_instance = MagicMock()
         mock_tool_instance.class_name = "KnowledgeBaseSearchTool"
+        mock_tool_instance.params = {
+            "index_names": [],
+            "rerank": False,
+        }
 
         with patch('backend.agents.create_agent_info.ToolConfig') as mock_tool_config, \
                 patch('backend.agents.create_agent_info.discover_langchain_tools', return_value=[]), \
                 patch('backend.agents.create_agent_info.search_tools_for_sub_agent') as mock_search_tools, \
                 patch('backend.agents.create_agent_info.get_vector_db_core') as mock_get_vector_db_core, \
+                patch('backend.agents.create_agent_info.get_embedding_model_by_index_name') as mock_get_emb, \
                 patch('backend.agents.create_agent_info.get_rerank_model') as mock_rerank, \
                 patch('backend.agents.create_agent_info.get_knowledge_name_map_by_index_names') as mock_get_knowledge_map:
 
@@ -4538,6 +4758,7 @@ async def test_knowledge_base_empty_index_names_raises_validation_error(self):
                 }
             ]
             mock_get_vector_db_core.return_value = "vdb_core_instance"
+            mock_get_emb.return_value = None  # Will trigger ValidationError
             mock_rerank.return_value = None
             mock_get_knowledge_map.return_value = {}
 
@@ -4546,13 +4767,17 @@ async def test_knowledge_base_empty_index_names_raises_validation_error(self):
                 await create_tool_config_list("agent_1", "tenant_1", "user_1")
 
             # Verify error message
-            assert "Embedding model is required for knowledge_base_search but index_names is empty" in str(exc_info.value)
+            assert "index_names" in str(exc_info.value) and "not configured" in str(exc_info.value)
 
     @pytest.mark.asyncio
     async def test_knowledge_base_no_embedding_model_raises_validation_error(self):
         """Test that ValidationError is raised when get_embedding_model_by_index_name returns None."""
         mock_tool_instance = MagicMock()
         mock_tool_instance.class_name = "KnowledgeBaseSearchTool"
+        mock_tool_instance.params = {
+            "index_names": ["idx1"],
+            "rerank": False,
+        }
 
         with patch('backend.agents.create_agent_info.ToolConfig') as mock_tool_config, \
                 patch('backend.agents.create_agent_info.discover_langchain_tools', return_value=[]), \
@@ -4590,8 +4815,7 @@ async def test_knowledge_base_no_embedding_model_raises_validation_error(self):
             with pytest.raises(ValidationError) as exc_info:
                 await create_tool_config_list("agent_1", "tenant_1", "user_1")
 
-            # Verify error message contains index name and guidance
-            assert "No embedding model found for index 'idx1'" in str(exc_info.value)
+            # Verify error message contains guidance about configuring embedding model
             assert "Please configure an embedding model for this knowledge base" in str(exc_info.value)
 
     @pytest.mark.asyncio
@@ -4599,6 +4823,11 @@ async def test_knowledge_base_with_valid_embedding_model(self):
         """Test that KnowledgeBaseSearchTool correctly sets embedding_model when get_embedding_model_by_index_name succeeds."""
         mock_tool_instance = MagicMock()
         mock_tool_instance.class_name = "KnowledgeBaseSearchTool"
+        mock_tool_instance.params = {
+            "index_names": ["idx1", "idx2"],
+            "rerank": True,
+            "rerank_model_name": "gte-rerank-v2",
+        }
 
         with patch('backend.agents.create_agent_info.ToolConfig') as mock_tool_config, \
                 patch('backend.agents.create_agent_info.discover_langchain_tools', return_value=[]), \
@@ -4642,19 +4871,19 @@ async def test_knowledge_base_with_valid_embedding_model(self):
 
             # Verify the tool was created successfully
             assert len(result) == 1
-            
+
             # Verify get_embedding_model_by_index_name was called with correct parameters
             mock_get_emb_by_index.assert_called_once_with("tenant_1", "idx1")
-            
+
             # Verify metadata contains the embedding_model
             assert result[0].metadata["embedding_model"] == mock_embedding_model
-            
+
             # Verify metadata also contains other expected fields
             assert "vdb_core" in result[0].metadata
             assert "rerank_model" in result[0].metadata
             assert "display_name_to_index_map" in result[0].metadata
             assert "index_name_to_display_map" in result[0].metadata
-            
+
             # Verify mappings are correct
             assert result[0].metadata["display_name_to_index_map"] == {
                 "Knowledge Base 1": "idx1",
@@ -4670,6 +4899,10 @@ async def test_knowledge_base_with_single_index_and_embedding_model(self):
         """Test KnowledgeBaseSearchTool with single index_name and valid embedding model."""
         mock_tool_instance = MagicMock()
         mock_tool_instance.class_name = "KnowledgeBaseSearchTool"
+        mock_tool_instance.params = {
+            "index_names": ["single_index"],
+            "rerank": False,
+        }
 
         with patch('backend.agents.create_agent_info.ToolConfig') as mock_tool_config, \
                 patch('backend.agents.create_agent_info.discover_langchain_tools', return_value=[]), \
@@ -4710,13 +4943,13 @@ async def test_knowledge_base_with_single_index_and_embedding_model(self):
 
             # Verify the tool was created successfully
             assert len(result) == 1
-            
+
             # Verify get_embedding_model_by_index_name was called
             mock_get_emb_by_index.assert_called_once_with("tenant_1", "single_index")
-            
+
             # Verify embedding_model is set correctly
             assert result[0].metadata["embedding_model"] == mock_embedding_model
-            
+
             # Verify mappings for single index
             assert result[0].metadata["display_name_to_index_map"] == {
                 "My Knowledge Base": "single_index"
@@ -4759,12 +4992,12 @@ async def test_knowledge_base_embedding_model_error_metadata(self):
             mock_get_vector_db_core.return_value = "vdb_core"
             mock_rerank.return_value = None
             mock_get_knowledge_map.return_value = {"test_idx": "Test KB"}
-            
+
             # Return valid embedding model with error metadata
             mock_embedding_model = MagicMock()
             mock_get_emb_by_index.return_value = (
-                mock_embedding_model, 
-                789, 
+                mock_embedding_model,
+                789,
                 {"status": "error", "message": "Some error but model exists"}
             )
 
@@ -5189,3 +5422,157 @@ def test_convert_history_with_minio_files_all_items_have_minio_files(self):
 
 if __name__ == "__main__":
     pytest.main([__file__])
+
+
+# ============================================================================
+# Additional tests for improved coverage
+# ============================================================================
+
+
+class TestNormalizeToolParamsRequest:
+    """Tests for _normalize_tool_params_request function."""
+
+    def test_normalize_with_none(self):
+        """Test that None returns empty ToolParamsRequest."""
+        result = _normalize_tool_params_request(None)
+        assert isinstance(result, ToolParamsRequest)
+        assert result.agents == {}
+
+    def test_normalize_with_tool_params_request(self):
+        """Test that ToolParamsRequest is returned as-is."""
+        req = ToolParamsRequest(agents={"agent1": MockAgentToolParamsRequest(tools={"tool1": {"param1": "value1"}})})
+        result = _normalize_tool_params_request(req)
+        assert result is req
+
+    def test_normalize_with_valid_dict(self):
+        """Test that valid dict is validated into ToolParamsRequest."""
+        input_dict = {"agents": {"agent1": {"tools": {"tool1": {"param1": "value1"}}}}}
+        result = _normalize_tool_params_request(input_dict)
+        assert isinstance(result, ToolParamsRequest)
+        assert "agent1" in result.agents
+
+    def test_normalize_with_invalid_type_raises_validation_error(self):
+        """Test that non-dict, non-ToolParamsRequest raises ValidationError."""
+        with pytest.raises(ValidationError, match="tool_params must be an object"):
+            _normalize_tool_params_request("invalid_string")
+
+    def test_normalize_with_invalid_dict_returns_empty(self):
+        """Test that invalid dict returns empty ToolParamsRequest (mock behavior)."""
+        # The mock ToolParamsRequest doesn't validate, so it just returns empty
+        result = _normalize_tool_params_request({"invalid_key": 123})
+        assert isinstance(result, ToolParamsRequest)
+
+
+class TestGetAgentToolOverrides:
+    """Tests for _get_agent_tool_overrides function."""
+
+    def test_get_overrides_with_none_tool_params(self):
+        """Test that None tool_params returns empty dict."""
+        result = _get_agent_tool_overrides(None, "agent1")
+        assert result == {}
+
+    def test_get_overrides_with_none_agent_name(self):
+        """Test that None agent_name returns empty dict."""
+        tool_params = ToolParamsRequest(agents={"agent1": MockAgentToolParamsRequest(tools={"tool1": {"param1": "value1"}})})
+        result = _get_agent_tool_overrides(tool_params, None)
+        assert result == {}
+
+    def test_get_overrides_with_empty_agent_name(self):
+        """Test that empty agent_name returns empty dict."""
+        tool_params = ToolParamsRequest(agents={"agent1": MockAgentToolParamsRequest(tools={"tool1": {"param1": "value1"}})})
+        result = _get_agent_tool_overrides(tool_params, "")
+        assert result == {}
+
+    def test_get_overrides_with_unknown_agent(self):
+        """Test that unknown agent returns empty dict."""
+        tool_params = ToolParamsRequest(agents={"agent1": MockAgentToolParamsRequest(tools={"tool1": {"param1": "value1"}})})
+        result = _get_agent_tool_overrides(tool_params, "unknown_agent")
+        assert result == {}
+
+    def test_get_overrides_with_existing_agent(self):
+        """Test that existing agent returns its tool overrides."""
+        tool_params = ToolParamsRequest(agents={"agent1": MockAgentToolParamsRequest(tools={"tool1": {"param1": "value1"}, "tool2": {"param2": "value2"}})})
+        result = _get_agent_tool_overrides(tool_params, "agent1")
+        assert result == {"tool1": {"param1": "value1"}, "tool2": {"param2": "value2"}}
+
+
+class TestBuildInternalS3Url:
+    """Tests for _build_internal_s3_url function."""
+
+    def test_build_with_non_dict(self):
+        """Test that non-dict input returns empty string."""
+        assert _build_internal_s3_url("not a dict") == ""
+        assert _build_internal_s3_url(None) == ""
+        assert _build_internal_s3_url(123) == ""
+
+    def test_build_with_empty_dict(self):
+        """Test that empty dict returns empty string."""
+        assert _build_internal_s3_url({}) == ""
+
+    def test_build_with_object_name(self):
+        """Test URL building with object_name."""
+        result = _build_internal_s3_url({"object_name": "path/to/file.txt"})
+        # Bucket name depends on test environment mock (MINIO_DEFAULT_BUCKET = "test-bucket")
+        assert result.startswith("s3://")
+        assert "path/to/file.txt" in result
+
+    def test_build_with_object_name_leading_slash(self):
+        """Test URL building with leading slash in object_name."""
+        result = _build_internal_s3_url({"object_name": "/path/to/file.txt"})
+        # Bucket name depends on test environment mock
+        assert result.startswith("s3://")
+        assert "path/to/file.txt" in result
+
+    def test_build_with_s3_url_input(self):
+        """Test that s3:// URL is returned as-is."""
+        result = _build_internal_s3_url({"url": "s3://bucket/path/file.txt"})
+        assert result == "s3://bucket/path/file.txt"
+
+    def test_build_with_s3_single_slash(self):
+        """Test URL building with s3:/ prefix."""
+        result = _build_internal_s3_url({"url": "s3:/bucket/file.txt"})
+        assert result == "s3://bucket/file.txt"
+
+    def test_build_with_blob_url(self):
+        """Test that blob: URL returns empty string."""
+        assert _build_internal_s3_url({"url": "blob:http://example.com/file"}) == ""
+
+    def test_build_with_s3_blob_url(self):
+        """Test that s3:/blob: URL returns empty string."""
+        assert _build_internal_s3_url({"url": "s3:/blob:http://example.com/file"}) == ""
+
+    def test_build_with_http_url(self):
+        """Test that non-s3 URL returns s3:/ prefixed version."""
+        result = _build_internal_s3_url({"url": "https://example.com/file.txt"})
+        assert result == "s3:/https://example.com/file.txt"
+
+
+class TestMergeToolParams:
+    """Tests for _merge_tool_params function."""
+
+    def test_merge_with_override_params(self):
+        """Test that override params update merged params."""
+        tool_record = {"params": [{"name": "param1", "default": "default1"}, {"name": "param2", "default": "default2"}]}
+        override_params = {"param1": "override1"}
+        result = _merge_tool_params(tool_record, override_params)
+        assert result == {"param1": "override1", "param2": "default2"}
+
+    def test_merge_with_extra_params(self):
+        """Test that extra params take precedence."""
+        tool_record = {"params": [{"name": "param1", "default": "default1"}]}
+        override_params = {"param1": "override1"}
+        extra_params = {"param1": "extra1", "internal_param": "secret"}
+        result = _merge_tool_params(tool_record, override_params, extra_params)
+        assert result == {"param1": "extra1", "internal_param": "secret"}
+
+    def test_merge_with_no_params_in_tool_record(self):
+        """Test merge when tool_record has no params."""
+        tool_record = {}
+        result = _merge_tool_params(tool_record, {"override": "value"})
+        assert result == {"override": "value"}
+
+    def test_merge_with_empty_override_params(self):
+        """Test merge with empty override params."""
+        tool_record = {"params": [{"name": "param1", "default": "default1"}]}
+        result = _merge_tool_params(tool_record, {})
+        assert result == {"param1": "default1"}
diff --git a/test/backend/app/test_agent_app.py b/test/backend/app/test_agent_app.py
index f1f0ca6a4..f65083217 100644
--- a/test/backend/app/test_agent_app.py
+++ b/test/backend/app/test_agent_app.py
@@ -720,7 +720,7 @@ def test_export_agent_api_success(mocker, mock_auth_header):
     """Test export_agent_api success case returning JSON."""
     mock_export_agent = mocker.patch(
         "apps.agent_app.export_agent_with_skills_impl", new_callable=AsyncMock)
-    mock_export_agent.return_value = '{"agent_id": 123, "name": "Test Agent"}'
+    mock_export_agent.return_value = {"agent_id": 123, "name": "Test Agent"}
 
     response = config_client.post(
         "/agent/export",
diff --git a/test/backend/app/test_agent_repository_app.py b/test/backend/app/test_agent_repository_app.py
new file mode 100644
index 000000000..b9b0d573a
--- /dev/null
+++ b/test/backend/app/test_agent_repository_app.py
@@ -0,0 +1,161 @@
+"""Unit tests for backend.apps.agent_repository_app module."""
+
+import os
+import sys
+from unittest.mock import AsyncMock, MagicMock
+
+import pytest
+from fastapi import FastAPI
+from fastapi.testclient import TestClient
+
+current_dir = os.path.dirname(os.path.abspath(__file__))
+backend_dir = os.path.abspath(os.path.join(current_dir, "../../../backend"))
+sys.path.insert(0, backend_dir)
+
+sys.modules.setdefault("services.agent_repository_service", MagicMock())
+sys.modules.setdefault("utils.auth_utils", MagicMock())
+
+from apps.agent_repository_app import agent_repository_router
+
+app = FastAPI()
+app.include_router(agent_repository_router)
+client = TestClient(app)
+
+
+@pytest.fixture
+def mock_auth_header():
+    return {"Authorization": "Bearer test_token"}
+
+
+def test_create_agent_repository_listing_api_success(mocker, mock_auth_header):
+    """Test create_agent_repository_listing_api success case."""
+    mock_get_user_id = mocker.patch(
+        "apps.agent_repository_app.get_current_user_id"
+    )
+    mock_create_listing = mocker.patch(
+        "apps.agent_repository_app.create_agent_repository_listing_impl",
+        new_callable=AsyncMock,
+    )
+
+    mock_get_user_id.return_value = ("test_user_id", "test_tenant_id")
+    mock_create_listing.return_value = {
+        "agent_repository_id": 42,
+        "agent_id": 123,
+        "source_version_no": 1,
+        "is_updated": False,
+    }
+
+    response = client.post(
+        "/repository/agent/123/versions/1",
+        headers=mock_auth_header,
+    )
+
+    assert response.status_code == 200
+    mock_get_user_id.assert_called_once_with(mock_auth_header["Authorization"])
+    mock_create_listing.assert_awaited_once_with(
+        agent_id=123,
+        tenant_id="test_tenant_id",
+        user_id="test_user_id",
+        version_no=1,
+    )
+    assert response.json()["agent_repository_id"] == 42
+    assert response.json()["is_updated"] is False
+
+
+def test_create_agent_repository_listing_api_draft_version(mocker, mock_auth_header):
+    """Test create_agent_repository_listing_api with draft version (version_no=0)."""
+    mock_get_user_id = mocker.patch(
+        "apps.agent_repository_app.get_current_user_id"
+    )
+    mock_create_listing = mocker.patch(
+        "apps.agent_repository_app.create_agent_repository_listing_impl",
+        new_callable=AsyncMock,
+    )
+
+    mock_get_user_id.return_value = ("test_user_id", "test_tenant_id")
+    mock_create_listing.return_value = {
+        "agent_repository_id": 42,
+        "agent_id": 123,
+        "source_version_no": 0,
+        "is_updated": True,
+    }
+
+    response = client.post(
+        "/repository/agent/123/versions/0",
+        headers=mock_auth_header,
+    )
+
+    assert response.status_code == 200
+    mock_create_listing.assert_awaited_once_with(
+        agent_id=123,
+        tenant_id="test_tenant_id",
+        user_id="test_user_id",
+        version_no=0,
+    )
+    assert response.json()["source_version_no"] == 0
+
+
+def test_create_agent_repository_listing_api_bad_request(mocker, mock_auth_header):
+    """Test create_agent_repository_listing_api with ValueError."""
+    mock_get_user_id = mocker.patch(
+        "apps.agent_repository_app.get_current_user_id"
+    )
+    mock_create_listing = mocker.patch(
+        "apps.agent_repository_app.create_agent_repository_listing_impl",
+        new_callable=AsyncMock,
+    )
+
+    mock_get_user_id.return_value = ("test_user_id", "test_tenant_id")
+    mock_create_listing.side_effect = ValueError("version_no must be >= 0")
+
+    response = client.post(
+        "/repository/agent/123/versions/-1",
+        headers=mock_auth_header,
+    )
+
+    assert response.status_code == 400
+    assert response.json()["detail"] == "version_no must be >= 0"
+
+
+def test_create_agent_repository_listing_api_rejects_asset_owner(mocker, mock_auth_header):
+    """Test create_agent_repository_listing_api rejects ASSET_OWNER agents with 400."""
+    mock_get_user_id = mocker.patch(
+        "apps.agent_repository_app.get_current_user_id"
+    )
+    mock_create_listing = mocker.patch(
+        "apps.agent_repository_app.create_agent_repository_listing_impl",
+        new_callable=AsyncMock,
+    )
+
+    mock_get_user_id.return_value = ("test_user_id", "test_tenant_id")
+    mock_create_listing.side_effect = ValueError("租户管理员智能体无法共享")
+
+    response = client.post(
+        "/repository/agent/123/versions/1",
+        headers=mock_auth_header,
+    )
+
+    assert response.status_code == 400
+    assert response.json()["detail"] == "租户管理员智能体无法共享"
+
+
+def test_create_agent_repository_listing_api_exception(mocker, mock_auth_header):
+    """Test create_agent_repository_listing_api with general exception."""
+    mock_get_user_id = mocker.patch(
+        "apps.agent_repository_app.get_current_user_id"
+    )
+    mock_create_listing = mocker.patch(
+        "apps.agent_repository_app.create_agent_repository_listing_impl",
+        new_callable=AsyncMock,
+    )
+
+    mock_get_user_id.return_value = ("test_user_id", "test_tenant_id")
+    mock_create_listing.side_effect = Exception("Database error")
+
+    response = client.post(
+        "/repository/agent/123/versions/1",
+        headers=mock_auth_header,
+    )
+
+    assert response.status_code == 500
+    assert "Create agent repository listing error." in response.json()["detail"]
diff --git a/test/backend/app/test_cas_app.py b/test/backend/app/test_cas_app.py
new file mode 100644
index 000000000..97536c2db
--- /dev/null
+++ b/test/backend/app/test_cas_app.py
@@ -0,0 +1,184 @@
+import os
+import sys
+import unittest
+from http import HTTPStatus
+from unittest.mock import AsyncMock, MagicMock
+
+from fastapi import FastAPI
+from fastapi.testclient import TestClient
+
+test_dir = os.path.dirname(__file__)
+backend_dir = os.path.abspath(os.path.join(test_dir, "../../../backend"))
+sys.path.insert(0, backend_dir)
+
+
+class _CasAuthenticationError(Exception):
+    pass
+
+
+_MODULES_TO_RESTORE = ["services.cas_service"]
+_ORIGINAL_MODULES = {name: sys.modules.get(name) for name in _MODULES_TO_RESTORE}
+
+cas_service_mock = MagicMock()
+cas_service_mock.CAS_SERVER_URL = "https://cas.example.com"
+cas_service_mock.CasAuthenticationError = _CasAuthenticationError
+cas_service_mock.get_cas_config = MagicMock(
+    return_value={
+        "enabled": True,
+        "login_mode": "button",
+        "renew_before_seconds": 300,
+        "renew_timeout_seconds": 10,
+        "display_name": "CAS",
+    }
+)
+cas_service_mock.build_login_url = MagicMock(return_value="https://cas.example.com/login?service=x")
+cas_service_mock.build_renew_url = MagicMock(return_value="https://cas.example.com/login?gateway=true")
+cas_service_mock.login_with_ticket = AsyncMock(
+    return_value={
+        "user": {"id": "user-1", "email": "u@example.com", "role": "USER"},
+        "session": {"access_token": "jwt", "expires_at": 1779780000, "expires_in_seconds": 3600},
+        "redirect_url": "/chat",
+    }
+)
+cas_service_mock.renew_with_ticket = AsyncMock(
+    return_value={
+        "user": {"id": "user-1", "email": "u@example.com", "role": "USER"},
+        "session": {"access_token": "jwt2", "expires_at": 1779780300, "expires_in_seconds": 3600},
+        "redirect_url": "/",
+        "renew": True,
+    }
+)
+cas_service_mock.revoke_from_logout_request = MagicMock(
+    return_value={"revoked": 1, "cas_user_id": "cas-user-1", "session_index": "ST-1"}
+)
+sys.modules["services.cas_service"] = cas_service_mock
+
+from apps.cas_app import router  # noqa: E402
+
+for _name, _module in _ORIGINAL_MODULES.items():
+    if _module is None:
+        sys.modules.pop(_name, None)
+    else:
+        sys.modules[_name] = _module
+
+app = FastAPI()
+app.include_router(router)
+client = TestClient(app)
+
+
+class TestCasApp(unittest.TestCase):
+    def tearDown(self):
+        cas_service_mock.build_login_url.side_effect = None
+        cas_service_mock.build_login_url.return_value = "https://cas.example.com/login?service=x"
+        cas_service_mock.build_renew_url.side_effect = None
+        cas_service_mock.build_renew_url.return_value = "https://cas.example.com/login?gateway=true"
+        cas_service_mock.login_with_ticket.side_effect = None
+        cas_service_mock.revoke_from_logout_request.reset_mock()
+
+    def test_config_returns_public_cas_settings(self):
+        response = client.get("/user/cas/config")
+
+        self.assertEqual(response.status_code, HTTPStatus.OK)
+        data = response.json()
+        self.assertEqual(data["message"], "success")
+        self.assertTrue(data["data"]["enabled"])
+        self.assertEqual(data["data"]["login_mode"], "button")
+
+    def test_login_redirects_to_cas_server(self):
+        response = client.get("/user/cas/login?redirect=/chat", follow_redirects=False)
+
+        self.assertEqual(response.status_code, HTTPStatus.FOUND)
+        self.assertEqual(response.headers["location"], "https://cas.example.com/login?service=x")
+        cas_service_mock.build_login_url.assert_called_with("/chat")
+
+    def test_login_returns_400_when_cas_not_configured(self):
+        cas_service_mock.build_login_url.side_effect = _CasAuthenticationError("CAS is not configured")
+
+        response = client.get("/user/cas/login")
+
+        self.assertEqual(response.status_code, HTTPStatus.BAD_REQUEST)
+        self.assertEqual(response.json()["detail"], "CAS login is not available")
+        self.assertNotIn("CAS is not configured", response.text)
+
+    def test_login_rejects_redirect_url_outside_configured_cas_server(self):
+        cas_service_mock.build_login_url.return_value = "https://evil.example.com/login?service=x"
+
+        response = client.get("/user/cas/login?redirect=/chat", follow_redirects=False)
+
+        self.assertEqual(response.status_code, HTTPStatus.BAD_REQUEST)
+        self.assertEqual(response.json()["detail"], "CAS login is not available")
+
+    def test_callback_returns_session_payload(self):
+        response = client.get("/user/cas/callback?ticket=ST-1&redirect=/chat")
+
+        self.assertEqual(response.status_code, HTTPStatus.OK)
+        data = response.json()
+        self.assertEqual(data["message"], "CAS login successful")
+        self.assertEqual(data["data"]["session"]["access_token"], "jwt")
+        cas_service_mock.login_with_ticket.assert_awaited()
+
+    def test_callback_returns_401_for_invalid_ticket(self):
+        cas_service_mock.login_with_ticket.side_effect = _CasAuthenticationError("bad ticket")
+
+        response = client.get("/user/cas/callback?ticket=bad")
+
+        self.assertEqual(response.status_code, HTTPStatus.UNAUTHORIZED)
+        self.assertEqual(response.json()["detail"], "CAS authentication failed")
+        self.assertNotIn("bad ticket", response.text)
+
+    def test_renew_does_not_expose_cas_configuration_exception(self):
+        cas_service_mock.build_renew_url.side_effect = _CasAuthenticationError("internal CAS config path")
+
+        response = client.get("/user/cas/renew")
+
+        self.assertEqual(response.status_code, HTTPStatus.OK)
+        self.assertIn("cas-renew-failed", response.text)
+        self.assertIn("CAS renew failed", response.text)
+        self.assertNotIn("internal CAS config path", response.text)
+
+    def test_renew_callback_without_ticket_posts_failure_to_iframe_parent(self):
+        response = client.get("/user/cas/renew_callback")
+
+        self.assertEqual(response.status_code, HTTPStatus.OK)
+        self.assertIn("text/html", response.headers["content-type"])
+        self.assertIn("cas-renew-failed", response.text)
+
+    def test_logout_callback_accepts_cas_form_body(self):
+        xml = """
+        <samlp:LogoutRequest xmlns:samlp="urn:oasis:names:tc:SAML:2.0:protocol"
+          xmlns:saml="urn:oasis:names:tc:SAML:2.0:assertion">
+          <saml:NameID>cas-user-1</saml:NameID>
+          <samlp:SessionIndex>ST-1</samlp:SessionIndex>
+        </samlp:LogoutRequest>
+        """
+
+        response = client.post(
+            "/user/cas/logout_callback",
+            data={"logoutRequest": xml},
+        )
+
+        self.assertEqual(response.status_code, HTTPStatus.OK)
+        self.assertEqual(response.json()["data"]["revoked"], 1)
+        cas_service_mock.revoke_from_logout_request.assert_called_once_with(xml)
+
+    def test_callback_post_accepts_cas_single_logout_request(self):
+        xml = """
+        <samlp:LogoutRequest xmlns:samlp="urn:oasis:names:tc:SAML:2.0:protocol"
+          xmlns:saml="urn:oasis:names:tc:SAML:2.0:assertion">
+          <saml:NameID>cas-user-1</saml:NameID>
+          <samlp:SessionIndex>ST-1</samlp:SessionIndex>
+        </samlp:LogoutRequest>
+        """
+
+        response = client.post(
+            "/user/cas/callback",
+            data={"logoutRequest": xml},
+        )
+
+        self.assertEqual(response.status_code, HTTPStatus.OK)
+        self.assertEqual(response.json()["data"]["revoked"], 1)
+        cas_service_mock.revoke_from_logout_request.assert_called_once_with(xml)
+
+
+if __name__ == "__main__":
+    unittest.main()
diff --git a/test/backend/app/test_idata_app.py b/test/backend/app/test_idata_app.py
index 66b213f96..4f7774ccd 100644
--- a/test/backend/app/test_idata_app.py
+++ b/test/backend/app/test_idata_app.py
@@ -5,6 +5,7 @@
 """
 import sys
 import os
+import types
 from unittest.mock import patch, MagicMock
 
 import pytest
@@ -19,6 +20,57 @@
 if backend_dir not in sys.path:
     sys.path.insert(0, backend_dir)
 
+# Stub the SDK modules used during import so tests do not load nexent.__init__ and
+# its optional runtime dependencies.
+nexent_module = types.ModuleType("nexent")
+nexent_module.__path__ = []
+nexent_storage_module = types.ModuleType("nexent.storage")
+nexent_storage_module.__path__ = []
+nexent_storage_factory_module = types.ModuleType("nexent.storage.storage_client_factory")
+nexent_minio_config_module = types.ModuleType("nexent.storage.minio_config")
+nexent_utils_module = types.ModuleType("nexent.utils")
+nexent_utils_module.__path__ = []
+nexent_http_client_manager_module = types.ModuleType("nexent.utils.http_client_manager")
+
+
+class MockMinIOStorageConfig:
+    def __init__(self, *args, **kwargs):
+        self.default_bucket = kwargs.get("default_bucket")
+
+    def validate(self):
+        return None
+
+
+nexent_storage_factory_module.create_storage_client_from_config = MagicMock()
+nexent_storage_factory_module.MinIOStorageConfig = MockMinIOStorageConfig
+nexent_minio_config_module.MinIOStorageConfig = MockMinIOStorageConfig
+nexent_http_client_manager_module.http_client_manager = MagicMock()
+nexent_module.storage = nexent_storage_module
+nexent_module.utils = nexent_utils_module
+nexent_storage_module.storage_client_factory = nexent_storage_factory_module
+nexent_storage_module.minio_config = nexent_minio_config_module
+nexent_utils_module.http_client_manager = nexent_http_client_manager_module
+
+sys.modules["nexent"] = nexent_module
+sys.modules["nexent.storage"] = nexent_storage_module
+sys.modules["nexent.storage.storage_client_factory"] = nexent_storage_factory_module
+sys.modules["nexent.storage.minio_config"] = nexent_minio_config_module
+sys.modules["nexent.utils"] = nexent_utils_module
+sys.modules["nexent.utils.http_client_manager"] = nexent_http_client_manager_module
+
+backend_module = sys.modules.get("backend") or types.ModuleType("backend")
+backend_module.__path__ = [backend_dir]
+backend_database_module = types.ModuleType("backend.database")
+backend_database_module.__path__ = [os.path.join(backend_dir, "database")]
+backend_database_client_module = types.ModuleType("backend.database.client")
+backend_database_client_module.MinioClient = MagicMock()
+backend_module.database = backend_database_module
+backend_database_module.client = backend_database_client_module
+
+sys.modules["backend"] = backend_module
+sys.modules["backend.database"] = backend_database_module
+sys.modules["backend.database.client"] = backend_database_client_module
+
 # Mock the storage client factory BEFORE importing any backend modules that depend on it.
 # This prevents MinIO connection attempts during module import.
 
@@ -517,29 +569,17 @@ def test_router_prefix(self):
     def test_routes_registered(self):
         """Test that all routes are registered."""
         app = _build_app()
-        routes = [route.path for route in app.routes]
+        paths = app.openapi()["paths"]
 
-        assert "/idata/knowledge-space" in routes
-        assert "/idata/datasets" in routes
+        assert "/idata/knowledge-space" in paths
+        assert "/idata/datasets" in paths
 
     def test_router_methods(self):
         """Test that routes have correct HTTP methods."""
         app = _build_app()
+        paths = app.openapi()["paths"]
 
-        # Find routes by path
-        knowledge_space_route = None
-        datasets_route = None
-
-        for route in app.routes:
-            if hasattr(route, 'path'):
-                if route.path == "/idata/knowledge-space":
-                    knowledge_space_route = route
-                elif route.path == "/idata/datasets":
-                    datasets_route = route
-
-        assert knowledge_space_route is not None
-        assert datasets_route is not None
-
-        # Check HTTP methods
-        assert "GET" in [method for method in knowledge_space_route.methods]
-        assert "GET" in [method for method in datasets_route.methods]
+        assert "/idata/knowledge-space" in paths
+        assert "/idata/datasets" in paths
+        assert "get" in paths["/idata/knowledge-space"]
+        assert "get" in paths["/idata/datasets"]
diff --git a/test/backend/app/test_knowledge_summary_app.py b/test/backend/app/test_knowledge_summary_app.py
index 6201cf381..fcbad52db 100644
--- a/test/backend/app/test_knowledge_summary_app.py
+++ b/test/backend/app/test_knowledge_summary_app.py
@@ -12,6 +12,7 @@
 from unittest.mock import patch, MagicMock, AsyncMock
 
 import pytest
+from pydantic import BaseModel
 
 # Apply patches that need to be active before imports
 from unittest.mock import patch as mock_patch
@@ -39,7 +40,16 @@ class MockToolConfig:
     pass
 
 
+class MockAgentVerificationConfig:
+    @classmethod
+    def model_validate(cls, value):
+        mock_config = MagicMock()
+        mock_config.model_dump.return_value = value
+        return mock_config
+
+
 nexent_core_agents_agent_model.ToolConfig = MockToolConfig
+nexent_core_agents_agent_model.AgentVerificationConfig = MockAgentVerificationConfig
 sys.modules['nexent.core.agents.agent_model'] = nexent_core_agents_agent_model
 nexent_nexent_vector_database = types.ModuleType('nexent.vector_database')
 sys.modules['nexent.vector_database'] = nexent_nexent_vector_database
@@ -73,6 +83,18 @@ def mock_get_vector_db_core():
 sys.modules['services.redis_service'] = types.ModuleType('services.redis_service')
 sys.modules['services.group_service'] = types.ModuleType('services.group_service')
 
+# knowledge_summary_app only needs this request model from consts.model. Keeping
+# it local avoids importing unrelated EmailStr models and optional validators.
+consts_model_mock = types.ModuleType('consts.model')
+
+
+class ChangeSummaryRequest(BaseModel):
+    summary_result: str
+
+
+consts_model_mock.ChangeSummaryRequest = ChangeSummaryRequest
+sys.modules['consts.model'] = consts_model_mock
+
 # Mock utils modules used by knowledge_summary_app to avoid deep DB/storage import chains
 utils_auth_utils_mock = types.ModuleType('utils.auth_utils')
 utils_auth_utils_mock.get_current_user_id = MagicMock(return_value=("test_user_id", "test_tenant_id"))
@@ -90,7 +112,6 @@ def mock_get_vector_db_core():
 # Import the modules we need
 from fastapi.testclient import TestClient
 from fastapi import FastAPI
-from pydantic import BaseModel
 from apps.knowledge_summary_app import router
 
 # Create a test app and client
diff --git a/test/backend/app/test_northbound_app.py b/test/backend/app/test_northbound_app.py
index 2bfb25a76..827e04e4d 100644
--- a/test/backend/app/test_northbound_app.py
+++ b/test/backend/app/test_northbound_app.py
@@ -1,53 +1,22 @@
-import os
+"""Unit tests for backend.apps.northbound_app module."""
 import sys
-from unittest.mock import MagicMock, AsyncMock
+import os
+
+# The conftest.py sets up all mocks
+
+from unittest.mock import AsyncMock, MagicMock, patch
 import pytest
-from fastapi import FastAPI, HTTPException
-from fastapi.responses import StreamingResponse
+from fastapi import FastAPI
 from fastapi.testclient import TestClient
-import types
-import sys as _sys
-
-# Dynamically determine the backend path
-current_dir = os.path.dirname(os.path.abspath(__file__))
-backend_dir = os.path.abspath(os.path.join(current_dir, "../../../backend"))
-sys.path.append(backend_dir)
-
-
-# Pre-mock heavy dependencies before importing router
-sys.modules['consts'] = MagicMock()
-sys.modules['consts.model'] = MagicMock()
-
-consts_exceptions_mod = types.ModuleType("consts.exceptions")
-
-class LimitExceededError(Exception):
-    pass
-class UnauthorizedError(Exception):
-    pass
-class SignatureValidationError(Exception):
-    pass
-
-consts_exceptions_mod.LimitExceededError = LimitExceededError
-consts_exceptions_mod.UnauthorizedError = UnauthorizedError
-consts_exceptions_mod.SignatureValidationError = SignatureValidationError
-
-# Ensure the parent 'consts' is a module
-if 'consts' not in _sys.modules or not isinstance(_sys.modules['consts'], types.ModuleType):
-    consts_root = types.ModuleType("consts")
-    consts_root.__path__ = []
-    _sys.modules['consts'] = consts_root
-else:
-    consts_root = _sys.modules['consts']
-
-consts_root.exceptions = consts_exceptions_mod
-_sys.modules['consts.exceptions'] = consts_exceptions_mod
-sys.modules['services'] = MagicMock()
-sys.modules['services.northbound_service'] = MagicMock()
-sys.modules['utils'] = MagicMock()
-sys.modules['utils.auth_utils'] = MagicMock()
-
-# Import router after setting mocks
+from io import BytesIO
+
+# Import from conftest (which sets up mocks automatically)
 from apps.northbound_app import router
+from consts.exceptions import (
+    LimitExceededError,
+    UnauthorizedError,
+    SignatureValidationError,
+)
 
 
 app = FastAPI()
@@ -56,6 +25,7 @@ class SignatureValidationError(Exception):
 
 
 def _build_headers(auth="Bearer test_jwt", request_id="req-123", aksk=True):
+    """Build request headers for testing."""
     headers = {
         "Authorization": auth,
         "X-Request-Id": request_id,
@@ -69,8 +39,12 @@ def _build_headers(auth="Bearer test_jwt", request_id="req-123", aksk=True):
     return headers
 
 
-@pytest.mark.asyncio
-async def test_health_check():
+# =============================================================================
+# Health Check Tests
+# =============================================================================
+
+def test_health_check():
+    """Test health check endpoint returns healthy status."""
     resp = client.get("/nb/v1/health")
     assert resp.status_code == 200
     data = resp.json()
@@ -78,544 +52,783 @@ async def test_health_check():
     assert data["service"] == "northbound-api"
 
 
-def test_run_chat_calls_service(monkeypatch):
-    # Mock Bearer token validation to return valid token
-    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
-    # Mock user/tenant lookup to return user and tenant
-    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
-        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
-    })
-    async def _gen():
-        yield b"data: hello\n\n"
-    start_mock = AsyncMock(return_value=StreamingResponse(_gen(), media_type="text/event-stream"))
-    monkeypatch.setattr("apps.northbound_app.start_streaming_chat", start_mock)
+# =============================================================================
+# Upload Chat Attachments Tests
+# =============================================================================
 
-    # Use integer conversation_id as the endpoint expects Optional[int]
-    payload = {"conversation_id": 1, "agent_name": "agent-a", "query": "hi"}
-    headers = {**_build_headers(), "Idempotency-Key": "idem-1"}
-    resp = client.post("/nb/v1/chat/run", json=payload, headers=headers)
+def test_upload_chat_attachments_success():
+    """Test successful chat attachment upload."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.upload_files_for_northbound', new_callable=AsyncMock) as mock_upload:
 
-    assert resp.status_code == 200
-    assert "text/event-stream" in resp.headers["content-type"]
-    # Validate call into service
-    assert start_mock.await_count == 1
-    args, kwargs = start_mock.call_args
-    assert kwargs["conversation_id"] == 1
-    assert kwargs["agent_name"] == "agent-a"
-    assert kwargs["query"] == "hi"
-    assert kwargs["idempotency_key"] == "idem-1"
-
-
-def test_stop_chat_calls_service(monkeypatch):
-    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
-    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
-        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
-    })
-    stop_mock = AsyncMock(return_value={"message": "success"})
-    monkeypatch.setattr("apps.northbound_app.stop_chat", stop_mock)
-
-    # Use integer conversation_id in URL path
-    resp = client.get("/nb/v1/chat/stop/123", headers=_build_headers())
-    assert resp.status_code == 200
-    assert stop_mock.await_count == 1
+        mock_ctx.return_value = MagicMock()
+        mock_upload.return_value = {
+            "message": "Processed 1 files",
+            "requestId": "req-123",
+            "results": [{"filename": "test.pdf", "status": "success"}],
+        }
 
+        # Create a fake file upload
+        file_content = b"test file content"
+        files = {"files": ("test.pdf", BytesIO(file_content), "application/pdf")}
 
-def test_get_history_calls_service(monkeypatch):
-    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
-    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
-        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
-    })
-    hist_mock = AsyncMock(return_value={"message": "success"})
-    monkeypatch.setattr("apps.northbound_app.get_conversation_history", hist_mock)
+        resp = client.post(
+            "/nb/v1/chat/attachments/upload",
+            files=files,
+            headers=_build_headers(),
+        )
 
-    # Use integer conversation_id in URL path
-    resp = client.get("/nb/v1/conversations/123", headers=_build_headers())
-    assert resp.status_code == 200
-    assert hist_mock.await_count == 1
+        assert resp.status_code == 200
+        data = resp.json()
+        assert data["message"] == "Processed 1 files"
 
 
-def test_list_agents_calls_service(monkeypatch):
-    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
-    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
-        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
-    })
-    agents_mock = AsyncMock(return_value={"message": "success", "data": []})
-    monkeypatch.setattr("apps.northbound_app.get_agent_info_list", agents_mock)
+def test_upload_chat_attachments_limit_exceeded():
+    """Test upload returns 429 when limit exceeded."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.upload_files_for_northbound', new_callable=AsyncMock) as mock_upload:
 
-    resp = client.get("/nb/v1/agents", headers=_build_headers())
-    assert resp.status_code == 200
-    assert agents_mock.await_count == 1
+        mock_ctx.return_value = MagicMock()
+        mock_upload.side_effect = LimitExceededError("Upload limit exceeded")
 
+        file_content = b"test file content"
+        files = {"files": ("test.pdf", BytesIO(file_content), "application/pdf")}
 
-def test_list_conversations_calls_service(monkeypatch):
-    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
-    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
-        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
-    })
-    list_mock = AsyncMock(return_value={"message": "success", "data": []})
-    monkeypatch.setattr("apps.northbound_app.list_conversations", list_mock)
+        resp = client.post(
+            "/nb/v1/chat/attachments/upload",
+            files=files,
+            headers=_build_headers(),
+        )
 
-    resp = client.get("/nb/v1/conversations", headers=_build_headers())
-    assert resp.status_code == 200
-    assert list_mock.await_count == 1
-
-
-def test_update_title_sets_headers(monkeypatch):
-    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
-    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
-        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
-    })
-    # Ensure NorthboundContext yields plain string fields (avoid MagicMock in headers)
-    class _NCtx:
-        def __init__(self, request_id: str, tenant_id: str, user_id: str, authorization: str, token_id: int = 0):
-            self.request_id = request_id
-            self.tenant_id = tenant_id
-            self.user_id = user_id
-            self.authorization = authorization
-            self.token_id = token_id
-    monkeypatch.setattr("apps.northbound_app.NorthboundContext", _NCtx)
-    update_mock = AsyncMock(return_value={"message": "success", "data": "nb-4", "idempotency_key": "ide-xyz"})
-    monkeypatch.setattr("apps.northbound_app.update_conversation_title", update_mock)
-
-    headers = {**_build_headers(request_id="req-999"), "Idempotency-Key": "ide-xyz"}
-    resp = client.put("/nb/v1/conversations/123/title", params={"title": "New Title"}, headers=headers)
-    assert resp.status_code == 200
-    # Router wraps JSONResponse and should echo idempotency and request id
-    assert resp.headers.get("Idempotency-Key") == "ide-xyz"
-    assert resp.headers.get("X-Request-Id") == "req-999"
-    assert update_mock.await_count == 1
+        assert resp.status_code == 429
 
 
-def _std_headers(auth="Bearer test_jwt"):
-    return {
-        **_build_headers(auth=auth),
-        "Idempotency-Key": "idem-xyz",
-    }
+def test_upload_chat_attachments_internal_error():
+    """Test upload returns 500 when internal error occurs."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.upload_files_for_northbound', new_callable=AsyncMock) as mock_upload:
 
+        mock_ctx.return_value = MagicMock()
+        mock_upload.side_effect = Exception("Unknown error")
 
-@pytest.mark.parametrize("exc_cls, status", [
-    (UnauthorizedError, 401),
-    (LimitExceededError, 429),
-    (SignatureValidationError, 401),
-])
-def test_run_chat_auth_exceptions_are_mapped(monkeypatch, exc_cls, status):
-    # Force Bearer token validation to raise domain exceptions
-    def _raise(*_, **__):
-        raise exc_cls("boom")
-
-    monkeypatch.setattr(
-        "apps.northbound_app.validate_bearer_token", _raise)
-    # Even if provided, auth should not be parsed because token validation fails first
-    resp = client.post(
-        "/nb/v1/chat/run",
-        json={"conversation_id": 1, "agent_name": "a", "query": "hi"},
-        headers=_std_headers(),
-    )
-    assert resp.status_code == status
-
-
-def test_run_chat_missing_authorization_header_returns_401(monkeypatch):
-    # When no Authorization header, validate_bearer_token returns (False, None)
-    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (False, None))
-    # No Authorization header
-    headers = {k: v for k, v in _std_headers().items() if k.lower()
-               != "authorization"}
-    resp = client.post(
-        "/nb/v1/chat/run",
-        json={"conversation_id": 1, "agent_name": "a", "query": "hi"},
-        headers=headers,
-    )
-    assert resp.status_code == 401
-    assert "bearer token" in resp.json()["detail"].lower()
+        file_content = b"test file content"
+        files = {"files": ("test.pdf", BytesIO(file_content), "application/pdf")}
 
+        resp = client.post(
+            "/nb/v1/chat/attachments/upload",
+            files=files,
+            headers=_build_headers(),
+        )
 
-def test_run_chat_jwt_parse_exception_returns_401(monkeypatch):
-    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
+        assert resp.status_code == 500
 
-    def _raise_user_lookup(_access_key):
-        raise Exception("user lookup error")
-    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", _raise_user_lookup)
 
-    resp = client.post(
-        "/nb/v1/chat/run",
-        json={"conversation_id": 1, "agent_name": "a", "query": "hi"},
-        headers=_std_headers(),
-    )
-    # When user lookup fails due to an invalid API key, return 401
-    assert resp.status_code == 401
-    assert "invalid api key" in resp.json()["detail"].lower()
+# =============================================================================
+# Run Chat Tests
+# =============================================================================
 
+def test_run_chat_success():
+    """Test successful chat run initiation."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.start_streaming_chat', new_callable=AsyncMock) as mock_run:
 
-def test_run_chat_jwt_missing_user_id_returns_400(monkeypatch):
-    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
-    monkeypatch.setattr(
-        "apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
-            "user_id": None, "tenant_id": "t1", "token_id": "t1"
-        })
+        mock_ctx.return_value = MagicMock()
+        mock_run.return_value = {
+            "message": "Chat run initiated",
+            "request_id": "req-789",
+            "status": "initiated",
+        }
 
-    resp = client.post(
-        "/nb/v1/chat/run",
-        json={"conversation_id": 1, "agent_name": "a", "query": "hi"},
-        headers=_std_headers(),
-    )
-    assert resp.status_code == 400
-    assert "user" in resp.json()["detail"].lower()
+        resp = client.post(
+            "/nb/v1/chat/run",
+            json={
+                "agent_name": "general-assistant",
+                "query": "Hello, agent",
+            },
+            headers=_build_headers(),
+        )
 
+        assert resp.status_code == 200
 
-def test_run_chat_jwt_missing_tenant_id_returns_400(monkeypatch):
-    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
-    monkeypatch.setattr(
-        "apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
-            "user_id": "u1", "tenant_id": None, "token_id": "t1"
-        })
 
-    resp = client.post(
-        "/nb/v1/chat/run",
-        json={"conversation_id": 1, "agent_name": "a", "query": "hi"},
-        headers=_std_headers(),
-    )
-    assert resp.status_code == 400
-    assert "tenant" in resp.json()["detail"].lower()
+def test_run_chat_limit_exceeded():
+    """Test run chat returns 429 when limit exceeded."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.start_streaming_chat', new_callable=AsyncMock) as mock_run:
+
+        mock_ctx.return_value = MagicMock()
+        mock_run.side_effect = LimitExceededError("Rate limit exceeded")
+
+        resp = client.post(
+            "/nb/v1/chat/run",
+            json={
+                "agent_name": "general-assistant",
+                "query": "Hello",
+            },
+            headers=_build_headers(),
+        )
 
+        assert resp.status_code == 429
 
-def test_run_chat_internal_error_when_parsing_context_returns_401(monkeypatch):
-    def _raise(*_, **__):
-        raise Exception("unexpected")
-    monkeypatch.setattr(
-        "apps.northbound_app.validate_bearer_token", _raise)
 
-    resp = client.post(
-        "/nb/v1/chat/run",
-        json={"conversation_id": 1, "agent_name": "a", "query": "hi"},
-        headers=_std_headers(),
-    )
-    # Any exception during validation returns 401
-    assert resp.status_code == 401
-
-
-def test_run_chat_unexpected_service_error_maps_500(monkeypatch):
-    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
-    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
-        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
-    })
-    start_mock = AsyncMock(side_effect=Exception("boom"))
-    monkeypatch.setattr("apps.northbound_app.start_streaming_chat", start_mock)
-
-    resp = client.post(
-        "/nb/v1/chat/run",
-        json={"conversation_id": 1, "agent_name": "a", "query": "hi"},
-        headers=_std_headers(),
-    )
-    assert resp.status_code == 500
-
-
-@pytest.mark.parametrize("path", [
-    "/nb/v1/chat/stop/123",
-    "/nb/v1/conversations/123",
-    "/nb/v1/agents",
-    "/nb/v1/conversations",
-])
-@pytest.mark.parametrize("exc_cls, status", [
-    (UnauthorizedError, 401),
-    (LimitExceededError, 429),
-    (SignatureValidationError, 401),
-])
-def test_other_endpoints_auth_exceptions_are_mapped(monkeypatch, path, exc_cls, status):
-    def _raise(*_, **__):
-        raise exc_cls("boom")
-    monkeypatch.setattr(
-        "apps.northbound_app.validate_bearer_token", _raise)
-
-    resp = client.get(path, headers=_build_headers())
-    assert resp.status_code == status
-
-
-@pytest.mark.parametrize(
-    "path, target",
-    [
-        ("/nb/v1/chat/stop/123", "apps.northbound_app.stop_chat"),
-        ("/nb/v1/conversations/123", "apps.northbound_app.get_conversation_history"),
-        ("/nb/v1/agents", "apps.northbound_app.get_agent_info_list"),
-        ("/nb/v1/conversations", "apps.northbound_app.list_conversations"),
-    ],
-)
-def test_other_endpoints_unexpected_service_error_maps_500(monkeypatch, path, target):
-    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
-    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
-        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
-    })
-    monkeypatch.setattr(target, AsyncMock(side_effect=Exception("boom")))
-
-    resp = client.get(path, headers=_build_headers())
-    assert resp.status_code == 500
-
-
-def test_update_title_unexpected_service_error_maps_500(monkeypatch):
-    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
-    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
-        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
-    })
-    monkeypatch.setattr("apps.northbound_app.update_conversation_title", AsyncMock(
-        side_effect=Exception("boom")))
-
-    resp = client.put(
-        "/nb/v1/conversations/123/title",
-        params={"title": "x"},
+def test_run_chat_unauthorized():
+    """Test run chat returns 500 on unauthorized (broad exception handling)."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx:
+        mock_ctx.side_effect = UnauthorizedError("Invalid token")
+
+        resp = client.post(
+            "/nb/v1/chat/run",
+            json={
+                "agent_name": "general-assistant",
+                "query": "Hello",
+            },
+            headers=_build_headers(),
+        )
+
+        # The run_chat endpoint has broad exception handling, so unauthorized returns 500
+        assert resp.status_code == 500
+
+
+# =============================================================================
+# Stop Chat Tests
+# =============================================================================
+
+def test_stop_chat_success():
+    """Test successful chat stop."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.stop_chat', new_callable=AsyncMock) as mock_stop:
+
+        mock_ctx.return_value = MagicMock()
+        mock_stop.return_value = True
+
+        resp = client.get(
+            "/nb/v1/chat/stop/123",
+            headers=_build_headers(),
+        )
+
+        assert resp.status_code == 200
+
+
+# =============================================================================
+# Get Conversation Tests
+# =============================================================================
+
+def test_get_conversation_success():
+    """Test successful retrieval of conversation."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.get_conversation_history', new_callable=AsyncMock) as mock_get:
+
+        mock_ctx.return_value = MagicMock()
+        mock_get.return_value = {
+            "conversation_id": 123,
+            "history": [
+                {"role": "user", "content": "Hello"},
+                {"role": "assistant", "content": "Hi there!"},
+            ]
+        }
+
+        resp = client.get(
+            "/nb/v1/conversations/123",
+            headers=_build_headers(),
+        )
+
+        assert resp.status_code == 200
+        data = resp.json()
+        assert data["conversation_id"] == 123
+        assert len(data["history"]) == 2
+
+
+# =============================================================================
+# List Agents Tests
+# =============================================================================
+
+def test_list_agents_success():
+    """Test successful retrieval of agent list."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.get_agent_info_list', new_callable=AsyncMock) as mock_get:
+
+        mock_ctx.return_value = MagicMock()
+        mock_get.return_value = {
+            "agents": [
+                {"name": "agent1", "description": "First agent"},
+                {"name": "agent2", "description": "Second agent"},
+            ]
+        }
+
+        resp = client.get(
+            "/nb/v1/agents",
+            headers=_build_headers(),
+        )
+
+        assert resp.status_code == 200
+        data = resp.json()
+        assert len(data["agents"]) == 2
+
+
+# =============================================================================
+# List Conversations Tests
+# =============================================================================
+
+def test_list_conversations_success():
+    """Test successful retrieval of conversation list."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.list_conversations', new_callable=AsyncMock) as mock_list:
+
+        mock_ctx.return_value = MagicMock()
+        mock_list.return_value = {
+            "conversations": [
+                {"id": 1, "title": "Conversation 1"},
+                {"id": 2, "title": "Conversation 2"},
+            ]
+        }
+
+        resp = client.get(
+            "/nb/v1/conversations",
+            headers=_build_headers(),
+        )
+
+        assert resp.status_code == 200
+        data = resp.json()
+        assert len(data["conversations"]) == 2
+
+
+# =============================================================================
+# Update Conversation Title Tests
+# =============================================================================
+
+def test_update_conversation_title_success():
+    """Test successful update of conversation title."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.update_conversation_title', new_callable=AsyncMock) as mock_update:
+
+        mock_ctx.return_value = MagicMock()
+        mock_ctx.return_value.request_id = "req-123"
+        mock_update.return_value = {"idempotency_key": "idem-key", "conversation_id": 123, "title": "New Title"}
+
+        resp = client.put(
+            "/nb/v1/conversations/123/title?title=New%20Title",
+            headers=_build_headers(),
+        )
+
+        assert resp.status_code == 200
+
+
+# =============================================================================
+# File Fetch Tests
+# =============================================================================
+
+def test_file_fetch_missing_url():
+    """Test file fetch returns 422 when URL is missing."""
+    resp = client.get(
+        "/nb/v1/file/fetch",
         headers=_build_headers(),
     )
-    assert resp.status_code == 500
-
-
-def test_run_chat_sets_headers_from_service_response(monkeypatch):
-    # Mock Bearer token and user lookup
-    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
-    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
-        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
-    })
-
-    # Ensure NorthboundContext yields plain string fields (avoid MagicMock in headers)
-    class _NCtx:
-        def __init__(self, request_id: str, tenant_id: str, user_id: str, authorization: str, token_id: int = 0):
-            self.request_id = request_id
-            self.tenant_id = tenant_id
-            self.user_id = user_id
-            self.authorization = authorization
-            self.token_id = token_id
-
-    monkeypatch.setattr("apps.northbound_app.NorthboundContext", _NCtx)
-
-    async def _gen():
-        yield b"data: ok\n\n"
-
-    async def _start(ctx, conversation_id, agent_name, query, meta_data=None, idempotency_key=None):
-        resp = StreamingResponse(_gen(), media_type="text/event-stream")
-        # Service attaches headers in latest logic; emulate here
-        resp.headers["X-Request-Id"] = ctx.request_id
-        resp.headers["conversation_id"] = str(conversation_id)
-        return resp
-
-    monkeypatch.setattr("apps.northbound_app.start_streaming_chat", _start)
-
-    headers = {**_std_headers(), "X-Request-Id": "rid-123"}
-    resp = client.post(
-        "/nb/v1/chat/run",
-        json={"conversation_id": 1,
-              "agent_name": "agent-a", "query": "hello"},
-        headers=headers,
-    )
 
-    assert resp.status_code == 200
-    assert resp.headers.get("X-Request-Id") == "rid-123"
-    assert resp.headers.get("conversation_id") == "1"
+    # Missing required parameter returns 422
+    assert resp.status_code == 422
 
 
-def test_run_chat_service_error_maps_500(monkeypatch):
-    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
-    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
-        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
-    })
+# =============================================================================
+# Error Handling Tests
+# =============================================================================
+
+def test_invalid_request_body():
+    """Test that invalid request body returns 422."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx:
+        mock_ctx.return_value = MagicMock()
+
+        resp = client.post(
+            "/nb/v1/chat/run",
+            json={},  # Missing required fields
+            headers=_build_headers(),
+        )
+
+        # FastAPI returns 422 for validation errors
+        assert resp.status_code == 422
+
+
+def test_run_chat_with_conversation_id():
+    """Test run chat with existing conversation ID."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.start_streaming_chat', new_callable=AsyncMock) as mock_run:
+
+        mock_ctx.return_value = MagicMock()
+        mock_run.return_value = {
+            "message": "Chat run continued",
+            "request_id": "req-456",
+            "status": "continued",
+        }
+
+        resp = client.post(
+            "/nb/v1/chat/run",
+            json={
+                "agent_name": "general-assistant",
+                "query": "Hello again",
+                "conversation_id": 123,
+            },
+            headers=_build_headers(),
+        )
+
+        assert resp.status_code == 200
+
+
+def test_run_chat_with_attachments():
+    """Test run chat with file attachments."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.start_streaming_chat', new_callable=AsyncMock) as mock_run:
+
+        mock_ctx.return_value = MagicMock()
+        mock_run.return_value = {
+            "message": "Chat run with attachments",
+            "request_id": "req-789",
+            "status": "initiated",
+        }
+
+        resp = client.post(
+            "/nb/v1/chat/run",
+            json={
+                "agent_name": "general-assistant",
+                "query": "Summarize the attached report",
+                "attachments": ["s3://nexent/attachments/file.pdf"],
+            },
+            headers=_build_headers(),
+        )
+
+        assert resp.status_code == 200
+
+
+def test_run_chat_with_tool_params():
+    """Test run chat with tool parameter overrides."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.start_streaming_chat', new_callable=AsyncMock) as mock_run:
+
+        mock_ctx.return_value = MagicMock()
+        mock_run.return_value = {
+            "message": "Chat run with tool params",
+            "request_id": "req-101",
+            "status": "initiated",
+        }
+
+        resp = client.post(
+            "/nb/v1/chat/run",
+            json={
+                "agent_name": "general-assistant",
+                "query": "Search the knowledge base",
+                "tool_params": {
+                    "agents": {
+                        "general-assistant": {
+                            "tools": {
+                                "knowledge_base_search": {
+                                    "top_k": 5,
+                                }
+                            }
+                        }
+                    }
+                },
+            },
+            headers=_build_headers(),
+        )
+
+        assert resp.status_code == 200
+
+
+def test_run_chat_permission_error():
+    """Test run chat returns 403 when permission denied."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.start_streaming_chat', new_callable=AsyncMock) as mock_run:
+
+        mock_ctx.return_value = MagicMock()
+        mock_run.side_effect = PermissionError("Access denied")
+
+        resp = client.post(
+            "/nb/v1/chat/run",
+            json={
+                "agent_name": "general-assistant",
+                "query": "Hello",
+            },
+            headers=_build_headers(),
+        )
+
+        assert resp.status_code == 403
+
+
+def test_run_chat_internal_error():
+    """Test run chat returns 500 on internal error."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.start_streaming_chat', new_callable=AsyncMock) as mock_run:
+
+        mock_ctx.return_value = MagicMock()
+        mock_run.side_effect = Exception("Unexpected error")
+
+        resp = client.post(
+            "/nb/v1/chat/run",
+            json={
+                "agent_name": "general-assistant",
+                "query": "Hello",
+            },
+            headers=_build_headers(),
+        )
 
-    async def _raise(*args, **kwargs):
-        raise Exception("Failed to persist user message: boom")
+        assert resp.status_code == 500
 
-    monkeypatch.setattr("apps.northbound_app.start_streaming_chat", _raise)
 
-    resp = client.post(
-        "/nb/v1/chat/run",
-        json={"conversation_id": 1,
-              "agent_name": "agent-a", "query": "hello"},
-        headers=_std_headers(),
-    )
+def test_run_chat_value_error():
+    """Test run chat returns 400 on value error."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.start_streaming_chat', new_callable=AsyncMock) as mock_run:
+
+        mock_ctx.return_value = MagicMock()
+        mock_run.side_effect = ValueError("Invalid agent name")
+
+        resp = client.post(
+            "/nb/v1/chat/run",
+            json={
+                "agent_name": "general-assistant",
+                "query": "Hello",
+            },
+            headers=_build_headers(),
+        )
 
-    assert resp.status_code == 500
+        assert resp.status_code == 400
 
 
-# --- Tests for /file/fetch endpoint ---
+# =============================================================================
+# Stop Chat Error Tests
+# =============================================================================
 
-def test_fetch_file_missing_presigned_url():
-    """Missing presigned_url parameter returns 422 (FastAPI validation)."""
-    resp = client.get("/nb/v1/file/fetch")
-    assert resp.status_code == 422
+def test_stop_chat_limit_exceeded():
+    """Test stop chat returns 429 when limit exceeded."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.stop_chat', new_callable=AsyncMock) as mock_stop:
 
+        mock_ctx.return_value = MagicMock()
+        mock_stop.side_effect = LimitExceededError("Rate limit exceeded")
 
-def test_fetch_file_invalid_url_scheme(monkeypatch):
-    """URL scheme other than http/https returns 400."""
-    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
-    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
-        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
-    })
+        resp = client.get(
+            "/nb/v1/chat/stop/123",
+            headers=_build_headers(),
+        )
 
-    resp = client.get(
-        "/nb/v1/file/fetch",
-        params={"presigned_url": "ftp://example.com/file"},
-        headers=_build_headers(),
-    )
-    assert resp.status_code == 400
-    assert "Invalid URL scheme" in resp.json()["detail"]
-
-
-def test_fetch_file_success(monkeypatch):
-    """Valid presigned_url: proxies file content as StreamingResponse."""
-    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
-    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
-        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
-    })
-
-    import httpx
-    mock_response = MagicMock()
-    mock_response.status_code = 200
-    mock_response.headers = {
-        "Content-Type": "application/pdf",
-        "Content-Disposition": 'attachment; filename="report.pdf"',
-    }
-    mock_response.aiter_bytes = MagicMock(return_value=iter([b"PDF content here"]))
+        assert resp.status_code == 429
 
-    mock_client = MagicMock()
-    mock_client.get = AsyncMock(return_value=mock_response)
-    mock_client.__aenter__ = AsyncMock(return_value=mock_client)
-    mock_client.__aexit__ = AsyncMock(return_value=None)
 
-    monkeypatch.setattr("httpx.AsyncClient", lambda **kwargs: mock_client)
+def test_stop_chat_internal_error():
+    """Test stop chat returns 500 on internal error."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.stop_chat', new_callable=AsyncMock) as mock_stop:
 
-    resp = client.get(
-        "/nb/v1/file/fetch",
-        params={"presigned_url": "http://minio:9000/bucket/file.pdf"},
-        headers=_build_headers(),
-    )
+        mock_ctx.return_value = MagicMock()
+        mock_stop.side_effect = Exception("Unexpected error")
 
-    assert resp.status_code == 200
-    assert resp.headers["content-type"] == "application/pdf"
-    assert "report.pdf" in resp.headers["content-disposition"]
+        resp = client.get(
+            "/nb/v1/chat/stop/123",
+            headers=_build_headers(),
+        )
 
+        assert resp.status_code == 500
 
-def test_fetch_file_non_200_returns_502(monkeypatch):
-    """MinIO returns non-200: maps to 502 Bad Gateway."""
-    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
-    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
-        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
-    })
 
-    mock_response = MagicMock()
-    mock_response.status_code = 403
-    mock_response.headers = {}
+# =============================================================================
+# Get Conversation Error Tests
+# =============================================================================
 
-    mock_client = MagicMock()
-    mock_client.get = AsyncMock(return_value=mock_response)
-    mock_client.__aenter__ = AsyncMock(return_value=mock_client)
-    mock_client.__aexit__ = AsyncMock(return_value=None)
+def test_get_conversation_limit_exceeded():
+    """Test get conversation returns 429 when limit exceeded."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.get_conversation_history', new_callable=AsyncMock) as mock_get:
 
-    monkeypatch.setattr("httpx.AsyncClient", lambda **kwargs: mock_client)
+        mock_ctx.return_value = MagicMock()
+        mock_get.side_effect = LimitExceededError("Rate limit exceeded")
 
-    resp = client.get(
-        "/nb/v1/file/fetch",
-        params={"presigned_url": "http://minio:9000/bucket/file.pdf"},
-        headers=_build_headers(),
-    )
+        resp = client.get(
+            "/nb/v1/conversations/123",
+            headers=_build_headers(),
+        )
 
-    assert resp.status_code == 502
-    assert "Failed to fetch file from storage" in resp.json()["detail"]
+        assert resp.status_code == 429
 
 
-def test_fetch_file_timeout_returns_504(monkeypatch):
-    """httpx.TimeoutException: maps to 504 Gateway Timeout."""
-    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
-    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
-        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
-    })
+def test_get_conversation_internal_error():
+    """Test get conversation returns 500 on internal error."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.get_conversation_history', new_callable=AsyncMock) as mock_get:
 
-    import httpx
-    mock_client = MagicMock()
-    mock_client.get = AsyncMock(side_effect=httpx.TimeoutException("Connection timed out"))
-    mock_client.__aenter__ = AsyncMock(return_value=mock_client)
-    mock_client.__aexit__ = AsyncMock(return_value=None)
+        mock_ctx.return_value = MagicMock()
+        mock_get.side_effect = Exception("Unexpected error")
 
-    monkeypatch.setattr("httpx.AsyncClient", lambda **kwargs: mock_client)
+        resp = client.get(
+            "/nb/v1/conversations/123",
+            headers=_build_headers(),
+        )
 
-    resp = client.get(
-        "/nb/v1/file/fetch",
-        params={"presigned_url": "http://minio:9000/bucket/file.pdf"},
-        headers=_build_headers(),
-    )
+        assert resp.status_code == 500
 
-    assert resp.status_code == 504
-    assert "Timeout" in resp.json()["detail"]
 
+# =============================================================================
+# List Agents Error Tests
+# =============================================================================
 
-def test_fetch_file_request_error_returns_502(monkeypatch):
-    """httpx.RequestError: maps to 502 Bad Gateway."""
-    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
-    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
-        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
-    })
+def test_list_agents_limit_exceeded():
+    """Test list agents returns 429 when limit exceeded."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.get_agent_info_list', new_callable=AsyncMock) as mock_get:
 
-    import httpx
-    mock_client = MagicMock()
-    mock_client.get = AsyncMock(side_effect=httpx.RequestError("Connection refused", request=MagicMock()))
-    mock_client.__aenter__ = AsyncMock(return_value=mock_client)
-    mock_client.__aexit__ = AsyncMock(return_value=None)
+        mock_ctx.return_value = MagicMock()
+        mock_get.side_effect = LimitExceededError("Rate limit exceeded")
 
-    monkeypatch.setattr("httpx.AsyncClient", lambda **kwargs: mock_client)
+        resp = client.get(
+            "/nb/v1/agents",
+            headers=_build_headers(),
+        )
 
-    resp = client.get(
-        "/nb/v1/file/fetch",
-        params={"presigned_url": "http://minio:9000/bucket/file.pdf"},
-        headers=_build_headers(),
-    )
+        assert resp.status_code == 429
 
-    assert resp.status_code == 502
-    assert "Failed to fetch file from storage" in resp.json()["detail"]
 
+def test_list_agents_internal_error():
+    """Test list agents returns 500 on internal error."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.get_agent_info_list', new_callable=AsyncMock) as mock_get:
 
-def test_fetch_file_unexpected_error_returns_500(monkeypatch):
-    """Unexpected exception: maps to 500 Internal Server Error."""
-    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
-    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
-        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
-    })
+        mock_ctx.return_value = MagicMock()
+        mock_get.side_effect = Exception("Unexpected error")
 
-    mock_client = MagicMock()
-    mock_client.get = AsyncMock(side_effect=RuntimeError("unexpected failure"))
-    mock_client.__aenter__ = AsyncMock(return_value=mock_client)
-    mock_client.__aexit__ = AsyncMock(return_value=None)
+        resp = client.get(
+            "/nb/v1/agents",
+            headers=_build_headers(),
+        )
 
-    monkeypatch.setattr("httpx.AsyncClient", lambda **kwargs: mock_client)
+        assert resp.status_code == 500
 
-    resp = client.get(
-        "/nb/v1/file/fetch",
-        params={"presigned_url": "http://minio:9000/bucket/file.pdf"},
-        headers=_build_headers(),
+
+# =============================================================================
+# List Conversations Error Tests
+# =============================================================================
+
+def test_list_conversations_limit_exceeded():
+    """Test list conversations returns 429 when limit exceeded."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.list_conversations', new_callable=AsyncMock) as mock_list:
+
+        mock_ctx.return_value = MagicMock()
+        mock_list.side_effect = LimitExceededError("Rate limit exceeded")
+
+        resp = client.get(
+            "/nb/v1/conversations",
+            headers=_build_headers(),
+        )
+
+        assert resp.status_code == 429
+
+
+def test_list_conversations_internal_error():
+    """Test list conversations returns 500 on internal error."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.list_conversations', new_callable=AsyncMock) as mock_list:
+
+        mock_ctx.return_value = MagicMock()
+        mock_list.side_effect = Exception("Unexpected error")
+
+        resp = client.get(
+            "/nb/v1/conversations",
+            headers=_build_headers(),
+        )
+
+        assert resp.status_code == 500
+
+
+# =============================================================================
+# Update Conversation Title Error Tests
+# =============================================================================
+
+def test_update_conversation_title_limit_exceeded():
+    """Test update conversation title returns 429 when limit exceeded."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.update_conversation_title', new_callable=AsyncMock) as mock_update:
+
+        mock_ctx.return_value = MagicMock()
+        mock_ctx.return_value.request_id = "req-123"
+        mock_update.side_effect = LimitExceededError("Rate limit exceeded")
+
+        resp = client.put(
+            "/nb/v1/conversations/123/title?title=New%20Title",
+            headers=_build_headers(),
+        )
+
+        assert resp.status_code == 429
+
+
+def test_update_conversation_title_not_found():
+    """Test update conversation title returns 404 when conversation not found."""
+    from consts.exceptions import ConversationNotFoundError
+
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.update_conversation_title', new_callable=AsyncMock) as mock_update:
+
+        mock_ctx.return_value = MagicMock()
+        mock_ctx.return_value.request_id = "req-123"
+        mock_update.side_effect = ConversationNotFoundError("Conversation not found")
+
+        resp = client.put(
+            "/nb/v1/conversations/999/title?title=New%20Title",
+            headers=_build_headers(),
+        )
+
+        assert resp.status_code == 404
+
+
+def test_update_conversation_title_internal_error():
+    """Test update conversation title returns 500 on internal error."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.update_conversation_title', new_callable=AsyncMock) as mock_update:
+
+        mock_ctx.return_value = MagicMock()
+        mock_ctx.return_value.request_id = "req-123"
+        mock_update.side_effect = Exception("Unexpected error")
+
+        resp = client.put(
+            "/nb/v1/conversations/123/title?title=New%20Title",
+            headers=_build_headers(),
+        )
+
+        assert resp.status_code == 500
+
+
+def test_update_conversation_title_with_meta_data():
+    """Test update conversation title with metadata."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.update_conversation_title', new_callable=AsyncMock) as mock_update:
+
+        mock_ctx.return_value = MagicMock()
+        mock_ctx.return_value.request_id = "req-123"
+        mock_update.return_value = {"idempotency_key": "idem-key", "conversation_id": 123}
+
+        resp = client.put(
+            "/nb/v1/conversations/123/title?title=New%20Title&meta_data=%7B%22source%22%3A%22test%22%7D",
+            headers=_build_headers(),
+        )
+
+        assert resp.status_code == 200
+
+
+def test_update_conversation_title_with_idempotency_key():
+    """Test update conversation title with idempotency key."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.update_conversation_title', new_callable=AsyncMock) as mock_update:
+
+        mock_ctx.return_value = MagicMock()
+        mock_ctx.return_value.request_id = "req-123"
+        mock_update.return_value = {"idempotency_key": "my-key", "conversation_id": 123}
+
+        resp = client.put(
+            "/nb/v1/conversations/123/title?title=New%20Title",
+            headers={**_build_headers(), "Idempotency-Key": "my-key"},
+        )
+
+        assert resp.status_code == 200
+
+
+# =============================================================================
+# Upload Attachments Error Tests
+# =============================================================================
+
+def test_upload_chat_attachments_value_error():
+    """Test upload returns 400 on value error."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.upload_files_for_northbound', new_callable=AsyncMock) as mock_upload:
+
+        mock_ctx.return_value = MagicMock()
+        mock_upload.side_effect = ValueError("Invalid file")
+
+        file_content = b"test file content"
+        files = {"files": ("test.pdf", BytesIO(file_content), "application/pdf")}
+
+        resp = client.post(
+            "/nb/v1/chat/attachments/upload",
+            files=files,
+            headers=_build_headers(),
+        )
+
+        assert resp.status_code == 400
+
+
+def test_upload_chat_attachments_permission_error():
+    """Test upload returns 403 on permission error."""
+    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
+            patch('apps.northbound_app.upload_files_for_northbound', new_callable=AsyncMock) as mock_upload:
+
+        mock_ctx.return_value = MagicMock()
+        mock_upload.side_effect = PermissionError("Access denied")
+
+        file_content = b"test file content"
+        files = {"files": ("test.pdf", BytesIO(file_content), "application/pdf")}
+
+        resp = client.post(
+            "/nb/v1/chat/attachments/upload",
+            files=files,
+            headers=_build_headers(),
+        )
+
+        assert resp.status_code == 403
+
+
+if __name__ == "__main__":
+    pytest.main([__file__, "-v"])
+
+
+# =============================================================================
+# Helper Function Tests
+# =============================================================================
+
+def test_resolve_proxy_download_filename_with_rfc598_filename():
+    """Test filename resolution with RFC 598 filename."""
+    from apps.northbound_app import _resolve_proxy_download_filename
+
+    result = _resolve_proxy_download_filename(
+        "https://example.com/path/file.pdf",
+        'filename="report.pdf"'
     )
+    assert result == "report.pdf"
 
-    assert resp.status_code == 500
-    assert "Internal server error" in resp.json()["detail"]
 
+def test_resolve_proxy_download_filename_with_rfc598_star_filename():
+    """Test filename resolution with RFC 598 star filename."""
+    from apps.northbound_app import _resolve_proxy_download_filename
 
-def test_fetch_file_no_auth_required(monkeypatch):
-    """Endpoint requires no authentication (NOTE: No authentication required)."""
-    auth_called = []
+    result = _resolve_proxy_download_filename(
+        "https://example.com/path/file.pdf",
+        "filename*=UTF-8''report%20final.pdf"
+    )
+    assert result == "report final.pdf"
 
-    def _track_auth(auth):
-        auth_called.append(auth)
-        return (True, {"token_id": "t1"})
 
-    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", _track_auth)
+def test_resolve_proxy_download_filename_from_url():
+    """Test filename resolution from URL when no content-disposition."""
+    from apps.northbound_app import _resolve_proxy_download_filename
 
-    mock_response = MagicMock()
-    mock_response.status_code = 200
-    mock_response.headers = {"Content-Type": "text/plain"}
-    mock_response.aiter_bytes = MagicMock(return_value=iter([b"hello"]))
+    result = _resolve_proxy_download_filename(
+        "https://example.com/path/to/document.pdf",
+        ""
+    )
+    assert result == "document.pdf"
 
-    mock_client = MagicMock()
-    mock_client.get = AsyncMock(return_value=mock_response)
-    mock_client.__aenter__ = AsyncMock(return_value=mock_client)
-    mock_client.__aexit__ = AsyncMock(return_value=None)
 
-    monkeypatch.setattr("httpx.AsyncClient", lambda **kwargs: mock_client)
+def test_resolve_proxy_download_filename_no_filename_in_url():
+    """Test filename resolution returns 'download' when no filename in URL."""
+    from apps.northbound_app import _resolve_proxy_download_filename
 
-    # No headers at all - should still work because auth is not checked
-    resp = client.get(
-        "/nb/v1/file/fetch",
-        params={"presigned_url": "http://minio:9000/bucket/file.pdf"},
+    result = _resolve_proxy_download_filename(
+        "https://example.com/path/",
+        ""
     )
+    assert result == "download"
 
-    assert resp.status_code == 200
+
+def test_resolve_proxy_download_filename_empty_content_disposition():
+    """Test filename resolution with empty content-disposition."""
+    from apps.northbound_app import _resolve_proxy_download_filename
+
+    result = _resolve_proxy_download_filename(
+        "https://example.com/path/file.pdf",
+        None
+    )
+    assert result == "file.pdf"
diff --git a/test/backend/app/test_northbound_base_app.py b/test/backend/app/test_northbound_base_app.py
index 4f58b3062..9ab9a3d11 100644
--- a/test/backend/app/test_northbound_base_app.py
+++ b/test/backend/app/test_northbound_base_app.py
@@ -274,17 +274,17 @@ def test_cors_middleware_configuration(self):
 
     def test_router_inclusion(self):
         """The main northbound router should be included."""
-        routes = [route.path for route in app.routes]
-        self.assertIn("/dummy", routes)
+        paths = app.openapi()["paths"]
+        self.assertIn("/dummy", paths)
 
     def test_a2a_router_inclusion(self):
         """A2A router should be registered under /nb/a2a."""
-        routes = [route.path for route in app.routes]
-        self.assertIn("/nb/a2a/{endpoint_id}/.well-known/agent-card.json", routes)
-        self.assertIn("/nb/a2a/{endpoint_id}/v1", routes)
-        self.assertIn("/nb/a2a/{endpoint_id}/message:send", routes)
-        self.assertIn("/nb/a2a/{endpoint_id}/message:stream", routes)
-        self.assertIn("/nb/a2a/{endpoint_id}/tasks/{task_id}", routes)
+        paths = app.openapi()["paths"]
+        self.assertIn("/nb/a2a/{endpoint_id}/.well-known/agent-card.json", paths)
+        self.assertIn("/nb/a2a/{endpoint_id}/v1", paths)
+        self.assertIn("/nb/a2a/{endpoint_id}/message:send", paths)
+        self.assertIn("/nb/a2a/{endpoint_id}/message:stream", paths)
+        self.assertIn("/nb/a2a/{endpoint_id}/tasks/{task_id}", paths)
 
     # -------------------------------------------------------------------
     # Exception handlers - delegated to app_factory which calls register_exception_handlers
diff --git a/test/backend/app/test_northbound_knowledge_app.py b/test/backend/app/test_northbound_knowledge_app.py
index 54d11b4c5..e39abdf19 100644
--- a/test/backend/app/test_northbound_knowledge_app.py
+++ b/test/backend/app/test_northbound_knowledge_app.py
@@ -57,6 +57,15 @@ class _ElasticSearchServiceStub:
     def list_indices(*args, **kwargs):
         return {"indices": ["kb1"]}
 
+    @staticmethod
+    async def delete_document_by_scope(index_name, path_or_url, scope, vdb_core):
+        return {
+            "status": "success",
+            "message": "Documents deleted successfully",
+            "scope": scope,
+            "deleted_es_count": 1,
+        }
+
     @staticmethod
     def delete_documents(index_name, path_or_url, vdb_core):
         return {"message": "Documents deleted successfully", "deleted": 1}
@@ -238,7 +247,10 @@ def test_redis_cleanup_failure_still_returns_200(self, client, mock_northbound_c
 
         response = client.delete(
             "/nb/v1/knowledge/indices/kb1/documents",
-            params={"path_or_url": "minio://path/doc.pdf"},
+            params={
+                "path_or_url": "minio://path/doc.pdf",
+                "scope": "full",
+            },
         )
 
         assert response.status_code == 200
diff --git a/test/backend/app/test_prompt_app.py b/test/backend/app/test_prompt_app.py
index 40d88e0e2..722b0f4d2 100644
--- a/test/backend/app/test_prompt_app.py
+++ b/test/backend/app/test_prompt_app.py
@@ -8,6 +8,19 @@
 backend_dir = os.path.abspath(os.path.join(os.path.dirname(__file__), "../../../backend"))
 sys.path.insert(0, backend_dir)
 
+prompt_service_stub = type(sys)("services.prompt_service")
+prompt_service_stub.gen_system_prompt_streamable = MagicMock()
+prompt_service_stub.OptimizeRequest = type("OptimizeRequest", (), {"__init__": lambda self, **kwargs: self.__dict__.update(kwargs)})
+prompt_service_stub.OptimizeResult = type("OptimizeResult", (), {})
+prompt_service_stub.PromptOptimizationService = MagicMock()
+sys.modules["services.prompt_service"] = prompt_service_stub
+sys.modules["backend.services.prompt_service"] = prompt_service_stub
+
+auth_utils_stub = type(sys)("utils.auth_utils")
+auth_utils_stub.get_current_user_info = MagicMock()
+sys.modules["utils.auth_utils"] = auth_utils_stub
+sys.modules["backend.utils.auth_utils"] = auth_utils_stub
+
 from apps.prompt_app import router
 
 
@@ -17,18 +30,21 @@
 
 
 @patch("apps.prompt_app.get_current_user_info")
-@patch("apps.prompt_app.optimize_prompt_section_impl")
-def test_optimize_prompt_section_api_success(
-    mock_optimize_prompt_section,
-    mock_get_current_user_info,
-):
+@patch("apps.prompt_app.PromptOptimizationService")
+def test_optimize_prompt_section_api_success(mock_service_cls, mock_get_current_user_info):
+    """Test /prompt/optimize returns optimized content with X-Prompt-Source header"""
     mock_get_current_user_info.return_value = ("user-1", "tenant-1", "en")
-    mock_optimize_prompt_section.return_value = {
-        "section_type": "duty",
-        "section_title": "Agent Role",
-        "original_content": "Original",
-        "optimized_content": "Optimized",
-    }
+
+    mock_result = MagicMock()
+    mock_result.optimized_content = "Optimized"
+    mock_result.source = "nexent"
+    mock_result.section_type = "duty"
+    mock_result.section_title = "Agent Role"
+    mock_result.original_content = "Original"
+
+    mock_svc_instance = MagicMock()
+    mock_svc_instance.optimize.return_value = mock_result
+    mock_service_cls.return_value = mock_svc_instance
 
     response = client.post(
         "/prompt/optimize",
@@ -48,20 +64,165 @@ def test_optimize_prompt_section_api_success(
     )
 
     assert response.status_code == 200
-    assert response.json()["message"] == "Prompt section optimized successfully"
-    assert response.json()["data"]["optimized_content"] == "Optimized"
+    data = response.json()
+    assert data["message"] == "Success"
+    assert data["data"]["optimized_content"] == "Optimized"
+    assert data["data"]["section_type"] == "duty"
+    assert data["data"]["section_title"] == "Agent Role"
+    assert data["data"]["original_content"] == "Original"
     mock_get_current_user_info.assert_called_once()
-    mock_optimize_prompt_section.assert_called_once_with(
-        agent_id=1,
-        model_id=2,
-        task_description="Build an agent",
-        tenant_id="tenant-1",
-        language="en",
-        section_type="duty",
-        section_title="Agent Role",
-        current_content="Original",
-        feedback="Make it clearer",
-        tool_ids=[10],
-        sub_agent_ids=[20],
-        knowledge_base_display_names=["kb-a"],
+    mock_svc_instance.optimize.assert_called_once()
+
+
+@patch("apps.prompt_app.get_current_user_info")
+@patch("apps.prompt_app.PromptOptimizationService")
+def test_optimize_prompt_section_api_with_mode(mock_service_cls, mock_get_current_user_info):
+    """Test /prompt/optimize accepts mode/start_pos/end_pos parameters"""
+    mock_get_current_user_info.return_value = ("user-1", "tenant-1", "zh")
+
+    mock_result = MagicMock()
+    mock_result.optimized_content = "Inserted content"
+    mock_result.source = "jiuwen"
+    mock_result.section_type = "duty"
+    mock_result.section_title = "智能体角色"
+    mock_result.original_content = "Old content"
+
+    mock_svc_instance = MagicMock()
+    mock_svc_instance.optimize.return_value = mock_result
+    mock_service_cls.return_value = mock_svc_instance
+
+    response = client.post(
+        "/prompt/optimize",
+        json={
+            "task_description": "Test insert",
+            "agent_id": 5,
+            "model_id": 3,
+            "section_type": "duty",
+            "section_title": "智能体角色",
+            "current_content": "Old content",
+            "feedback": "Insert more detail",
+            "mode": "insert",
+            "start_pos": 10,
+            "end_pos": 20,
+        },
+        headers={"Authorization": "Bearer token"},
+    )
+
+    assert response.status_code == 200
+    call_args = mock_svc_instance.optimize.call_args
+    assert call_args[0][0].mode == "insert"
+    assert call_args[0][0].start_pos == 10
+    assert call_args[0][0].end_pos == 20
+
+
+@patch("apps.prompt_app.get_current_user_info")
+@patch("apps.prompt_app.PromptOptimizationService")
+def test_optimize_prompt_section_api_nexent_capability_error(mock_service_cls, mock_get_current_user_info):
+    """Test /prompt/optimize returns 400 when NexentCapabilityError is raised"""
+    mock_get_current_user_info.return_value = ("user-1", "tenant-1", "en")
+
+    from adapters.exception import NexentCapabilityError
+    mock_svc_instance = MagicMock()
+    mock_svc_instance.optimize.side_effect = NexentCapabilityError(
+        "nexent 原生模式只支持 general 模式，当前请求 mode=insert 不支持"
     )
+    mock_service_cls.return_value = mock_svc_instance
+
+    response = client.post(
+        "/prompt/optimize",
+        json={
+            "task_description": "Build an agent",
+            "agent_id": 1,
+            "model_id": 2,
+            "section_type": "duty",
+            "section_title": "Agent Role",
+            "current_content": "Original",
+            "feedback": "Make it clearer",
+            "mode": "insert",
+        },
+        headers={"Authorization": "Bearer token"},
+    )
+
+    assert response.status_code == 400
+    data = response.json()
+    assert "general" in data["message"]
+
+
+@patch("apps.prompt_app.get_current_user_info")
+@patch("apps.prompt_app.PromptOptimizationService")
+def test_optimize_badcase_api_success(mock_service_cls, mock_get_current_user_info):
+    """Test /prompt/optimize/badcase returns optimized content with X-Prompt-Source header"""
+    mock_get_current_user_info.return_value = ("user-1", "tenant-1", "zh")
+
+    mock_result = MagicMock()
+    mock_result.optimized_content = "Fixed based on bad cases"
+    mock_result.source = "jiuwen"
+    mock_result.section_type = "duty"
+    mock_result.section_title = "智能体角色"
+    mock_result.original_content = "Old content"
+
+    mock_svc_instance = MagicMock()
+    mock_svc_instance.optimize_badcase.return_value = mock_result
+    mock_service_cls.return_value = mock_svc_instance
+
+    response = client.post(
+        "/prompt/optimize/badcase",
+        json={
+            "agent_id": 1,
+            "model_id": 2,
+            "current_content": "Old content",
+            "bad_cases": [
+                {
+                    "question": "用户问如何退款",
+                    "answer": "请联系客服",
+                    "label": "退款问题",
+                    "reason": "没有给出具体操作步骤",
+                }
+            ],
+            "section_type": "duty",
+            "section_title": "智能体角色",
+            "tool_ids": [10],
+            "sub_agent_ids": [],
+            "knowledge_base_display_names": [],
+        },
+        headers={"Authorization": "Bearer token"},
+    )
+
+    assert response.status_code == 200
+    data = response.json()
+    assert data["message"] == "Success"
+    assert data["data"]["optimized_content"] == "Fixed based on bad cases"
+    mock_svc_instance.optimize_badcase.assert_called_once()
+
+
+@patch("apps.prompt_app.get_current_user_info")
+@patch("apps.prompt_app.PromptOptimizationService")
+def test_optimize_badcase_api_nexent_capability_error(mock_service_cls, mock_get_current_user_info):
+    """Test /prompt/optimize/badcase returns 400 when NexentCapabilityError is raised"""
+    mock_get_current_user_info.return_value = ("user-1", "tenant-1", "zh")
+
+    from adapters.exception import NexentCapabilityError
+    mock_svc_instance = MagicMock()
+    mock_svc_instance.optimize_badcase.side_effect = NexentCapabilityError(
+        "nexent 原生模式不支持 badcase 优化"
+    )
+    mock_service_cls.return_value = mock_svc_instance
+
+    response = client.post(
+        "/prompt/optimize/badcase",
+        json={
+            "agent_id": 1,
+            "model_id": 2,
+            "current_content": "Old content",
+            "bad_cases": [
+                {"question": "Q1", "answer": "A1"}
+            ],
+            "section_type": "duty",
+            "section_title": "智能体角色",
+        },
+        headers={"Authorization": "Bearer token"},
+    )
+
+    assert response.status_code == 400
+    data = response.json()
+    assert "badcase" in data["message"]
diff --git a/test/backend/app/test_prompt_template_app.py b/test/backend/app/test_prompt_template_app.py
index 8cd78cf1d..d54b13412 100644
--- a/test/backend/app/test_prompt_template_app.py
+++ b/test/backend/app/test_prompt_template_app.py
@@ -5,6 +5,7 @@
 from http import HTTPStatus
 
 import pytest
+from pydantic import BaseModel
 
 
 BACKEND_PATH = os.path.abspath(
@@ -18,6 +19,7 @@ def _reset_prompt_template_app_modules():
     sys.modules.pop("apps.prompt_template_app", None)
     sys.modules.pop("services.prompt_template_service", None)
     sys.modules.pop("utils.auth_utils", None)
+    sys.modules.pop("consts.model", None)
 
 
 @pytest.fixture
@@ -36,6 +38,17 @@ def prompt_template_app_module(monkeypatch):
         setattr(service_module, name, lambda *args, **kwargs: None)
     monkeypatch.setitem(sys.modules, "services.prompt_template_service", service_module)
 
+    class PromptTemplateRequest(BaseModel):
+        template_name: str
+        description: str
+        template_type: str
+        template_content_zh: dict
+        template_content_en: dict
+
+    consts_model_module = types.ModuleType("consts.model")
+    consts_model_module.PromptTemplateRequest = PromptTemplateRequest
+    monkeypatch.setitem(sys.modules, "consts.model", consts_model_module)
+
     auth_module = types.ModuleType("utils.auth_utils")
     auth_module.get_current_user_id = lambda authorization: ("user-1", "tenant-1")
     monkeypatch.setitem(sys.modules, "utils.auth_utils", auth_module)
diff --git a/test/backend/app/test_tool_config_app.py b/test/backend/app/test_tool_config_app.py
index 31da4b761..3633b9378 100644
--- a/test/backend/app/test_tool_config_app.py
+++ b/test/backend/app/test_tool_config_app.py
@@ -533,6 +533,60 @@ def test_import_openapi_service_success(
             tenant_id="tenant456",
             user_id="user123",
             service_description="Test API",
+            headers_template=None,
+            force_update=False
+        )
+        mock_refresh_mcp.assert_called_once_with("tenant456")
+
+    @patch('apps.tool_config_app._refresh_openapi_services_in_mcp')
+    @patch('apps.tool_config_app.get_current_user_id')
+    @patch('apps.tool_config_app.import_openapi_service')
+    def test_import_openapi_service_success_with_headers_template(
+        self, mock_import_service, mock_get_user_id, mock_refresh_mcp
+    ):
+        """Test successful OpenAPI service import with headers template"""
+        mock_get_user_id.return_value = ("user123", "tenant456")
+        mock_import_service.return_value = {
+            "tools_created": 1,
+            "tools_updated": 0,
+            "tools_deleted": 0
+        }
+        mock_refresh_mcp.return_value = {"status": "refreshed"}
+        headers_template = {
+            "Authorization": "Bearer {{token}}",
+            "X-Tenant-ID": "{{tenant_id}}"
+        }
+
+        response = client.post(
+            "/tool/openapi_service",
+            json={
+                "service_name": "test_service",
+                "server_url": "https://api.example.com",
+                "openapi_json": {"openapi": "3.0.0", "info": {"title": "Test"}, "paths": {}},
+                "service_description": "Test API",
+                "headers_template": headers_template,
+                "force_update": False
+            }
+        )
+
+        assert response.status_code == HTTPStatus.OK
+        data = response.json()
+        assert data["status"] == "success"
+        assert data["message"] == "OpenAPI service import successful"
+        assert data["data"]["tools_created"] == 1
+        assert data["data"]["tools_updated"] == 0
+        assert data["data"]["tools_deleted"] == 0
+        assert data["data"]["mcp_refresh"]["status"] == "refreshed"
+
+        mock_get_user_id.assert_called_once_with(None)
+        mock_import_service.assert_called_once_with(
+            service_name="test_service",
+            openapi_json={"openapi": "3.0.0", "info": {"title": "Test"}, "paths": {}},
+            server_url="https://api.example.com",
+            tenant_id="tenant456",
+            user_id="user123",
+            service_description="Test API",
+            headers_template=headers_template,
             force_update=False
         )
         mock_refresh_mcp.assert_called_once_with("tenant456")
diff --git a/test/backend/app/test_user_management_app.py b/test/backend/app/test_user_management_app.py
index fd2f08ddd..f5875aca4 100644
--- a/test/backend/app/test_user_management_app.py
+++ b/test/backend/app/test_user_management_app.py
@@ -520,6 +520,69 @@ def test_logout_signout_error_ignored(self, mock_get_client):
         mock_get_client.assert_called_once_with("Bearer token")
         mock_client.auth.sign_out.assert_called_once()
 
+    @patch('database.cas_session_db.revoke_cas_session_by_session_id')
+    @patch('apps.user_management_app.build_logout_url')
+    @patch('apps.user_management_app.extract_session_id_from_authorization')
+    @patch('apps.user_management_app.get_authorized_client')
+    def test_logout_returns_cas_logout_url_for_cas_session(
+        self,
+        mock_get_client,
+        mock_extract_session_id,
+        mock_build_logout_url,
+        mock_revoke_cas_session,
+    ):
+        """Test logout returns CAS logout URL when the JWT carries a CAS session id."""
+        mock_client = MagicMock()
+        mock_get_client.return_value = mock_client
+        mock_extract_session_id.return_value = "sid-1"
+        mock_build_logout_url.return_value = (
+            "https://cas.example.com/cas/logout?service=https%3A%2F%2Fcas.example.com%2Fcas%2Flogin"
+        )
+
+        response = client.post(
+            "/user/logout",
+            headers={"Authorization": "Bearer token"}
+        )
+
+        assert response.status_code == HTTPStatus.OK
+        data = response.json()
+        assert (
+            data["data"]["cas_logout_url"]
+            == "https://cas.example.com/cas/logout?service=https%3A%2F%2Fcas.example.com%2Fcas%2Flogin"
+        )
+        mock_revoke_cas_session.assert_called_once_with("sid-1", actor="user")
+        mock_build_logout_url.assert_called_once_with()
+        mock_client.auth.sign_out.assert_called_once()
+
+    @patch('database.cas_session_db.revoke_cas_session_by_session_id')
+    @patch('apps.user_management_app.build_logout_url')
+    @patch('apps.user_management_app.extract_session_id_from_authorization')
+    @patch('apps.user_management_app.get_authorized_client')
+    def test_logout_does_not_return_cas_logout_url_when_not_configured(
+        self,
+        mock_get_client,
+        mock_extract_session_id,
+        mock_build_logout_url,
+        mock_revoke_cas_session,
+    ):
+        """Test logout skips CAS server logout redirect when CAS_LOGOUT_URL is empty."""
+        mock_client = MagicMock()
+        mock_get_client.return_value = mock_client
+        mock_extract_session_id.return_value = "sid-1"
+        mock_build_logout_url.return_value = ""
+
+        response = client.post(
+            "/user/logout",
+            headers={"Authorization": "Bearer token"}
+        )
+
+        assert response.status_code == HTTPStatus.OK
+        data = response.json()
+        assert data["data"]["cas_logout_url"] == ""
+        mock_revoke_cas_session.assert_called_once_with("sid-1", actor="user")
+        mock_build_logout_url.assert_called_once_with()
+        mock_client.auth.sign_out.assert_called_once()
+
     @patch('apps.user_management_app.get_authorized_client')
     def test_logout_error(self, mock_get_client):
         """Test logout with error"""
@@ -707,11 +770,47 @@ def test_current_user_info_success(self, mock_get_user_info, mock_validate_token
         assert data["data"]["user"]["tenant_id"] == "tenant456"
         assert data["data"]["user"]["user_email"] == "test@example.com"
         assert data["data"]["user"]["user_role"] == "USER"
+        assert data["data"]["user"]["auth_provider"] == "local"
         assert data["data"]["user"]["permissions"] == [
             "agent:create", "agent:read"]
         assert data["data"]["user"]["accessibleRoutes"] == ["chat", "agents"]
         mock_get_user_info.assert_called_once_with("user123")
 
+    @patch('apps.user_management_app.extract_session_id_from_authorization')
+    @patch('apps.user_management_app.validate_token')
+    @patch('apps.user_management_app.get_user_info', new_callable=AsyncMock)
+    def test_current_user_info_marks_cas_user(
+        self,
+        mock_get_user_info,
+        mock_validate_token,
+        mock_extract_session_id,
+    ):
+        """Test CAS-authenticated current user info includes auth provider"""
+        mock_user = MockUser("user123", "test@example.com")
+        mock_validate_token.return_value = (True, mock_user)
+        mock_extract_session_id.return_value = "cas-session-123"
+        mock_get_user_info.return_value = {
+            "user": {
+                "user_id": "user123",
+                "group_ids": [1],
+                "tenant_id": "tenant456",
+                "user_email": "test@example.com",
+                "user_role": "USER",
+                "permissions": ["agent:read"],
+                "accessibleRoutes": ["chat"]
+            }
+        }
+
+        response = client.get(
+            "/user/current_user_info",
+            headers={"Authorization": "Bearer cas-token"}
+        )
+
+        assert response.status_code == HTTPStatus.OK
+        data = response.json()
+        assert data["data"]["user"]["auth_provider"] == "cas"
+        mock_extract_session_id.assert_called_once_with("Bearer cas-token")
+
     def test_current_user_info_no_authorization(self):
         """Test current user info retrieval without authorization header"""
         response = client.get("/user/current_user_info")
diff --git a/test/backend/app/test_vectordatabase_app.py b/test/backend/app/test_vectordatabase_app.py
index c4820d177..cd684512f 100644
--- a/test/backend/app/test_vectordatabase_app.py
+++ b/test/backend/app/test_vectordatabase_app.py
@@ -1624,20 +1624,23 @@ async def test_delete_documents_success(vdb_core_mock, redis_service_mock):
     # Setup mocks
     with patch("backend.apps.vectordatabase_app.get_vector_db_core", return_value=vdb_core_mock), \
             patch("backend.apps.vectordatabase_app.get_redis_service", return_value=redis_service_mock), \
-            patch("backend.apps.vectordatabase_app.ElasticSearchService.delete_documents") as mock_delete_docs:
+            patch(
+                "backend.apps.vectordatabase_app.ElasticSearchService.delete_document_by_scope",
+                new_callable=AsyncMock,
+            ) as mock_delete_by_scope:
 
         index_name = "test_index"
         path_or_url = "test_document.pdf"
 
-        # Setup the return value for delete_documents
         es_result = {
             "status": "success",
             "message": "Documents deleted successfully",
-            "deleted_count": 5
+            "scope": "full",
+            "deleted_es_count": 5,
+            "source_available": False,
         }
-        mock_delete_docs.return_value = es_result
+        mock_delete_by_scope.return_value = es_result
 
-        # Setup the mock for delete_document_records
         redis_result = {
             "index_name": index_name,
             "path_or_url": path_or_url,
@@ -1647,9 +1650,10 @@ async def test_delete_documents_success(vdb_core_mock, redis_service_mock):
         }
         redis_service_mock.delete_document_records.return_value = redis_result
 
-        # Execute request
         response = client.delete(
-            f"/indices/{index_name}/documents", params={"path_or_url": path_or_url})
+            f"/indices/{index_name}/documents",
+            params={"path_or_url": path_or_url, "scope": "full"},
+        )
 
         # Verify expected 200 status code
         assert response.status_code == 200
@@ -1668,13 +1672,46 @@ async def test_delete_documents_success(vdb_core_mock, redis_service_mock):
         assert "redis_cleanup" in actual_response
         assert actual_response["redis_cleanup"] == redis_result
 
-        # Verify delete_documents was called with the correct parameters
-        # Use ANY for the vdb_core parameter because the actual object may differ
-        mock_delete_docs.assert_called_once_with(index_name, path_or_url, ANY)
+        mock_delete_by_scope.assert_called_once_with(
+            index_name, path_or_url, "full", ANY
+        )
         redis_service_mock.delete_document_records.assert_called_once_with(
             index_name, path_or_url)
 
 
+@pytest.mark.asyncio
+async def test_delete_documents_source_only_skips_redis(vdb_core_mock, redis_service_mock):
+    """source_only scope must not trigger Redis document cleanup."""
+    with patch("backend.apps.vectordatabase_app.get_vector_db_core", return_value=vdb_core_mock), \
+            patch("backend.apps.vectordatabase_app.get_redis_service", return_value=redis_service_mock), \
+            patch(
+                "backend.apps.vectordatabase_app.ElasticSearchService.delete_document_by_scope",
+                new_callable=AsyncMock,
+            ) as mock_delete_by_scope:
+
+        index_name = "test_index"
+        path_or_url = "knowledge_base/test.pdf"
+        mock_delete_by_scope.return_value = {
+            "status": "success",
+            "scope": "source_only",
+            "deleted_es_count": 0,
+            "deleted_minio": True,
+            "source_available": False,
+        }
+
+        response = client.delete(
+            f"/indices/{index_name}/documents",
+            params={"path_or_url": path_or_url, "scope": "source_only"},
+        )
+
+        assert response.status_code == 200
+        assert response.json()["scope"] == "source_only"
+        mock_delete_by_scope.assert_called_once_with(
+            index_name, path_or_url, "source_only", ANY
+        )
+        redis_service_mock.delete_document_records.assert_not_called()
+
+
 @pytest.mark.asyncio
 async def test_delete_documents_redis_error(vdb_core_mock, redis_service_mock):
     """
@@ -1684,27 +1721,30 @@ async def test_delete_documents_redis_error(vdb_core_mock, redis_service_mock):
     # Setup mocks
     with patch("backend.apps.vectordatabase_app.get_vector_db_core", return_value=vdb_core_mock), \
             patch("backend.apps.vectordatabase_app.get_redis_service", return_value=redis_service_mock), \
-            patch("backend.apps.vectordatabase_app.ElasticSearchService.delete_documents") as mock_delete_docs:
+            patch(
+                "backend.apps.vectordatabase_app.ElasticSearchService.delete_document_by_scope",
+                new_callable=AsyncMock,
+            ) as mock_delete_by_scope:
 
         index_name = "test_index"
         path_or_url = "test_document.pdf"
 
-        # Setup the return value for delete_documents
         es_result = {
             "status": "success",
             "message": "Documents deleted successfully",
-            "deleted_count": 5
+            "scope": "full",
+            "deleted_es_count": 5,
         }
-        mock_delete_docs.return_value = es_result
+        mock_delete_by_scope.return_value = es_result
 
-        # Setup redis error
         redis_error_message = "Redis connection failed"
         redis_service_mock.delete_document_records.side_effect = Exception(
             redis_error_message)
 
-        # Execute request
         response = client.delete(
-            f"/indices/{index_name}/documents", params={"path_or_url": path_or_url})
+            f"/indices/{index_name}/documents",
+            params={"path_or_url": path_or_url, "scope": "full"},
+        )
 
         # Verify expected 200 status code (the operation should still succeed even with Redis errors)
         assert response.status_code == 200
@@ -1722,9 +1762,9 @@ async def test_delete_documents_redis_error(vdb_core_mock, redis_service_mock):
         assert "redis_cleanup_error" in actual_response
         assert actual_response["redis_cleanup_error"] == redis_error_message
 
-        # Verify delete_documents was called
-        # Use ANY for the vdb_core parameter because the actual object may differ
-        mock_delete_docs.assert_called_once_with(index_name, path_or_url, ANY)
+        mock_delete_by_scope.assert_called_once_with(
+            index_name, path_or_url, "full", ANY
+        )
         redis_service_mock.delete_document_records.assert_called_once_with(
             index_name, path_or_url)
 
@@ -1737,29 +1777,28 @@ async def test_delete_documents_es_exception(vdb_core_mock):
     """
     # Setup mocks
     with patch("backend.apps.vectordatabase_app.get_vector_db_core", return_value=vdb_core_mock), \
-            patch("backend.apps.vectordatabase_app.ElasticSearchService.delete_documents") as mock_delete_docs:
+            patch(
+                "backend.apps.vectordatabase_app.ElasticSearchService.delete_document_by_scope",
+                new_callable=AsyncMock,
+            ) as mock_delete_by_scope:
 
         index_name = "test_index"
         path_or_url = "test_document.pdf"
 
-        # Setup the mock to raise an exception
-        mock_delete_docs.side_effect = Exception(
+        mock_delete_by_scope.side_effect = Exception(
             "Elasticsearch deletion failed")
 
-        # Execute request
         response = client.delete(
-            f"/indices/{index_name}/documents", params={"path_or_url": path_or_url})
+            f"/indices/{index_name}/documents",
+            params={"path_or_url": path_or_url, "scope": "full"},
+        )
 
-        # Verify expected 500 status code
         assert response.status_code == 500
-
-        # Verify error response
         expected_error_detail = "Error delete indexing documents: Elasticsearch deletion failed"
         assert response.json() == {"detail": expected_error_detail}
-
-        # Verify delete_documents was called
-        # Use ANY for the vdb_core parameter because the actual object may differ
-        mock_delete_docs.assert_called_once_with(index_name, path_or_url, ANY)
+        mock_delete_by_scope.assert_called_once_with(
+            index_name, path_or_url, "full", ANY
+        )
 
 
 @pytest.mark.asyncio
@@ -1771,20 +1810,22 @@ async def test_delete_documents_redis_warnings(vdb_core_mock, redis_service_mock
     # Setup mocks
     with patch("backend.apps.vectordatabase_app.get_vector_db_core", return_value=vdb_core_mock), \
             patch("backend.apps.vectordatabase_app.get_redis_service", return_value=redis_service_mock), \
-            patch("backend.apps.vectordatabase_app.ElasticSearchService.delete_documents") as mock_delete_docs:
+            patch(
+                "backend.apps.vectordatabase_app.ElasticSearchService.delete_document_by_scope",
+                new_callable=AsyncMock,
+            ) as mock_delete_by_scope:
 
         index_name = "test_index"
         path_or_url = "test_document.pdf"
 
-        # Setup the return value for delete_documents
         es_result = {
             "status": "success",
             "message": "Documents deleted successfully",
-            "deleted_count": 5
+            "scope": "full",
+            "deleted_es_count": 5,
         }
-        mock_delete_docs.return_value = es_result
+        mock_delete_by_scope.return_value = es_result
 
-        # Setup the mock for delete_document_records with warnings
         redis_result = {
             "index_name": index_name,
             "path_or_url": path_or_url,
@@ -1795,9 +1836,10 @@ async def test_delete_documents_redis_warnings(vdb_core_mock, redis_service_mock
         }
         redis_service_mock.delete_document_records.return_value = redis_result
 
-        # Execute request
         response = client.delete(
-            f"/indices/{index_name}/documents", params={"path_or_url": path_or_url})
+            f"/indices/{index_name}/documents",
+            params={"path_or_url": path_or_url, "scope": "full"},
+        )
 
         # Verify expected 200 status code
         assert response.status_code == 200
@@ -1816,9 +1858,9 @@ async def test_delete_documents_redis_warnings(vdb_core_mock, redis_service_mock
         assert actual_response["redis_warnings"] == [
             "Some cache keys could not be deleted"]
 
-        # Verify delete_documents was called
-        # Use ANY for the vdb_core parameter because the actual object may differ
-        mock_delete_docs.assert_called_once_with(index_name, path_or_url, ANY)
+        mock_delete_by_scope.assert_called_once_with(
+            index_name, path_or_url, "full", ANY
+        )
         redis_service_mock.delete_document_records.assert_called_once_with(
             index_name, path_or_url)
 
@@ -1831,29 +1873,27 @@ async def test_delete_documents_validation_exception(vdb_core_mock):
     """
     # Setup mocks
     with patch("backend.apps.vectordatabase_app.get_vector_db_core", return_value=vdb_core_mock), \
-            patch("backend.apps.vectordatabase_app.ElasticSearchService.delete_documents") as mock_delete_docs:
+            patch(
+                "backend.apps.vectordatabase_app.ElasticSearchService.delete_document_by_scope",
+                new_callable=AsyncMock,
+            ) as mock_delete_by_scope:
 
         index_name = "test_index"
         path_or_url = "test_document.pdf"
 
-        # Setup the mock to raise a validation exception
-        mock_delete_docs.side_effect = ValueError(
+        mock_delete_by_scope.side_effect = ValueError(
             "Invalid document path format")
 
-        # Execute request
         response = client.delete(
-            f"/indices/{index_name}/documents", params={"path_or_url": path_or_url})
-
-        # Verify expected 500 status code
-        assert response.status_code == 500
-
-        # Verify error response
-        expected_error_detail = "Error delete indexing documents: Invalid document path format"
-        assert response.json() == {"detail": expected_error_detail}
+            f"/indices/{index_name}/documents",
+            params={"path_or_url": path_or_url, "scope": "source_only"},
+        )
 
-        # Verify delete_documents was called
-        # Use ANY for the vdb_core parameter because the actual object may differ
-        mock_delete_docs.assert_called_once_with(index_name, path_or_url, ANY)
+        assert response.status_code == 400
+        assert response.json() == {"detail": "Invalid document path format"}
+        mock_delete_by_scope.assert_called_once_with(
+            index_name, path_or_url, "source_only", ANY
+        )
 
 
 @pytest.mark.asyncio
diff --git a/test/backend/data_process/test_tasks.py b/test/backend/data_process/test_tasks.py
index 379989581..cc7eadfcb 100644
--- a/test/backend/data_process/test_tasks.py
+++ b/test/backend/data_process/test_tasks.py
@@ -51,24 +51,26 @@ def import_tasks_with_fake_ray(monkeypatch, initialized=False):
         backends_base_mod = types.ModuleType("celery.backends.base")
         backends_base_mod.DisabledBackend = type("DisabledBackend", (), {})
         sys.modules["celery.backends.base"] = backends_base_mod
-    
+
     if "celery.exceptions" not in sys.modules:
         exceptions_mod = types.ModuleType("celery.exceptions")
         exceptions_mod.Retry = type("Retry", (Exception,), {})
         sys.modules["celery.exceptions"] = exceptions_mod
-    
+
     if "celery.result" not in sys.modules:
         result_mod = types.ModuleType("celery.result")
         result_mod.AsyncResult = type("AsyncResult", (), {})
+
         @contextmanager
         def _allow_join_result():
             yield
         result_mod.allow_join_result = _allow_join_result
         sys.modules["celery.result"] = result_mod
-    
+
     if "celery.signals" not in sys.modules:
         signals_mod = types.ModuleType("celery.signals")
         # Create fake signal objects with connect method
+
         class FakeSignal:
             def connect(self, func):
                 return func
@@ -80,32 +82,34 @@ def connect(self, func):
         signals_mod.task_postrun = FakeSignal()
         signals_mod.task_failure = FakeSignal()
         sys.modules["celery.signals"] = signals_mod
-    
+
     if "celery" not in sys.modules:
         celery_mod = types.ModuleType("celery")
         # Create a Celery class that accepts any arguments and has required attributes
+
         class FakeBackend:
             pass
-        
+
         class FakeCelery:
             def __init__(self, *args, **kwargs):
                 # Set backend to a non-DisabledBackend instance
                 self.backend = FakeBackend()
                 # Create a conf object with update method
                 self.conf = types.SimpleNamespace(update=lambda **kwargs: None)
-            
+
             def task(self, *args, **kwargs):
                 # Return a decorator that returns the function unchanged
                 def decorator(func):
                     return func
                 return decorator
-        
+
         # Stub classes and functions needed by tasks.py
         celery_mod.Celery = FakeCelery
         celery_mod.Task = type("Task", (), {})
         celery_mod.chain = lambda *args: None
         celery_mod.group = lambda *args, **kwargs: []
-        celery_mod.chord = lambda *args, **kwargs: (lambda callback: types.SimpleNamespace(get=lambda: {"success": True, "total_indexed": 0, "total_submitted": 0}))
+        celery_mod.chord = lambda *args, **kwargs: (lambda callback: types.SimpleNamespace(
+            get=lambda: {"success": True, "total_indexed": 0, "total_submitted": 0}))
         celery_mod.states = types.SimpleNamespace(
             PENDING="PENDING",
             STARTED="STARTED",
@@ -115,7 +119,7 @@ def decorator(func):
             REVOKED="REVOKED"
         )
         sys.modules["celery"] = celery_mod
-    
+
     # Stub modules that ray_actors depends on to avoid importing real MinIO
     # Also stub consts package and consts.const module to provide required constants at import time
     if "consts" not in sys.modules:
@@ -163,9 +167,14 @@ def __init__(self, chunking_strategy: str, source_type: str, index_name: str, au
         sys.modules["database.attachment_db"] = types.SimpleNamespace(
             get_file_stream=lambda source: io.BytesIO(b"stub-bytes"),
             get_file_size_from_minio=lambda object_name, bucket=None: 0,
-            build_s3_url=lambda bucket_name, object_name: f"http://mock-s3/{bucket_name}/{object_name}",  # NOSONAR
+            # NOSONAR
+            build_s3_url=lambda bucket_name, object_name: f"http://mock-s3/{bucket_name}/{object_name}",
             upload_fileobj=lambda file_obj, bucket_name, object_name: "mock-etag",
         )
+    if "database.knowledge_db" not in sys.modules:
+        sys.modules["database.knowledge_db"] = types.SimpleNamespace(
+            get_knowledge_record=lambda query=None: {},
+        )
     # Stub model_management_db module required by ray_actors
     if "database.model_management_db" not in sys.modules:
         sys.modules["database.model_management_db"] = types.SimpleNamespace(
@@ -180,6 +189,8 @@ def __init__(self, chunking_strategy: str, source_type: str, index_name: str, au
             sys.modules["database.attachment_db"])
     setattr(sys.modules["database"], "model_management_db",
             sys.modules["database.model_management_db"])
+    setattr(sys.modules["database"], "knowledge_db",
+            sys.modules["database.knowledge_db"])
 
     # Stub out auth and config utils to avoid importing real dependencies in file_management_utils
     if "utils.auth_utils" not in sys.modules:
@@ -195,9 +206,10 @@ def __init__(self, chunking_strategy: str, source_type: str, index_name: str, au
         sys.modules["utils.config_utils"] = cfg_mod
     if "nexent.data_process" not in sys.modules:
         sys.modules["nexent.data_process"] = types.SimpleNamespace(
-            DataProcessCore=type("_Core", (), {"__init__": lambda self: None, "file_process": lambda *a, **k: []})
+            DataProcessCore=type(
+                "_Core", (), {"__init__": lambda self: None, "file_process": lambda *a, **k: []})
         )
-    
+
     # Stub external dependencies (required by utils.file_management_utils)
     if "aiofiles" not in sys.modules:
         sys.modules["aiofiles"] = types.SimpleNamespace(
@@ -212,7 +224,21 @@ def __init__(self, chunking_strategy: str, source_type: str, index_name: str, au
     if "httpx" not in sys.modules:
         sys.modules["httpx"] = types.SimpleNamespace()
     if "requests" not in sys.modules:
-        sys.modules["requests"] = types.SimpleNamespace()
+        class _FakeResponse:
+            def __init__(self, status_code=200, json_data=None, text=""):
+                self.status_code = status_code
+                self._json_data = json_data
+                self.text = text
+
+            def json(self):
+                if self._json_data is None:
+                    raise ValueError("no json")
+                return self._json_data
+
+        sys.modules["requests"] = types.SimpleNamespace(
+            delete=lambda *a, **k: _FakeResponse(status_code=200, json_data={
+                                                 "status": "success"}, text=""),
+        )
     if "redis" not in sys.modules:
         sys.modules["redis"] = types.SimpleNamespace(
             Redis=types.SimpleNamespace(
@@ -228,7 +254,7 @@ def __init__(self, chunking_strategy: str, source_type: str, index_name: str, au
         fastapi_mod = types.ModuleType("fastapi")
         fastapi_mod.UploadFile = type("UploadFile", (), {})
         sys.modules["fastapi"] = fastapi_mod
-    
+
     # Stub utils.file_management_utils (required by tasks.py)
     if "utils.file_management_utils" not in sys.modules:
         file_utils_mod = types.ModuleType("utils.file_management_utils")
@@ -242,26 +268,31 @@ def __init__(self, chunking_strategy: str, source_type: str, index_name: str, au
         class _StubRedisService:
             def save_error_info(self, *args, **kwargs):
                 return True
+
             def is_task_cancelled(self, *args, **kwargs):
                 return False
+
             def save_progress_info(self, *args, **kwargs):
                 return True
+
             def increment_progress_info(self, *args, **kwargs):
                 return True
 
         redis_service_mod.get_redis_service = lambda: _StubRedisService()
         sys.modules["services.redis_service"] = redis_service_mod
-    
+
     # Stub aiohttp (required by tasks.py)
     if "aiohttp" not in sys.modules:
         sys.modules["aiohttp"] = types.SimpleNamespace()
-    
+
     import backend.data_process.tasks as tasks
     importlib.reload(tasks)
     # Provide a Celery task shim that allows direct calls and supports .s for chaining
+
     class _SignatureShim:
         def __init__(self):
             pass
+
         def set(self, **_kw):
             return self
 
@@ -269,10 +300,12 @@ class _CeleryTaskShim:
         def __init__(self, run_func, preprocess=None):
             self._run_func = run_func
             self._preprocess = preprocess
+
         def __call__(self, *args, **kwargs):
             if self._preprocess is not None:
                 args, kwargs = self._preprocess(args, kwargs)
             return self._run_func(*args, **kwargs)
+
         def s(self, **_kw):
             return _SignatureShim()
 
@@ -296,15 +329,19 @@ def _unbound_run(task_obj):
     default_actor = types.SimpleNamespace(
         ping=types.SimpleNamespace(remote=lambda *a, **k: "pong"),
         split_file=types.SimpleNamespace(remote=lambda *a, **k: []),
-        process_bytes=types.SimpleNamespace(remote=lambda *a, **k: "ref-bytes"),
+        process_bytes=types.SimpleNamespace(
+            remote=lambda *a, **k: "ref-bytes"),
         process_file=types.SimpleNamespace(remote=lambda *a, **k: "ref"),
-        store_chunks_in_redis=types.SimpleNamespace(remote=lambda *a, **k: None),
+        store_chunks_in_redis=types.SimpleNamespace(
+            remote=lambda *a, **k: None),
     )
     if not hasattr(tasks, "DataProcessorRayActor") or not hasattr(getattr(tasks, "DataProcessorRayActor"), "remote"):
-        tasks.DataProcessorRayActor = types.SimpleNamespace(remote=lambda: default_actor)
+        tasks.DataProcessorRayActor = types.SimpleNamespace(
+            remote=lambda: default_actor)
     # Keep split path stable across tests even when get_ray_actor is monkeypatched.
     tasks._get_split_actor = lambda: types.SimpleNamespace(
-        split_file=types.SimpleNamespace(remote=lambda *a, **k: "__split_parts__")
+        split_file=types.SimpleNamespace(
+            remote=lambda *a, **k: "__split_parts__")
     )
 
     # Preprocess for forward: drop empty/whitespace-only chunks before calling real run
@@ -365,11 +402,15 @@ def _forward_preprocess(args, kwargs):
     maybe = _unbound_run(getattr(tasks, "aggregate_store_chunks", None))
     if maybe is not None:
         tasks.aggregate_store_chunks = _CeleryTaskShim(maybe)
+    maybe = _unbound_run(getattr(tasks, "cleanup_source", None))
+    if maybe is not None:
+        tasks.cleanup_source = _CeleryTaskShim(maybe)
     return tasks, fake_ray
 
 
 def test_init_ray_in_worker_initializes_once(monkeypatch):
-    tasks, fake_ray = import_tasks_with_fake_ray(monkeypatch, initialized=False)
+    tasks, fake_ray = import_tasks_with_fake_ray(
+        monkeypatch, initialized=False)
     # First call initializes
     tasks.init_ray_in_worker()
     assert fake_ray.inits and fake_ray.inits[-1]["configure_logging"] is False
@@ -383,10 +424,11 @@ def test_init_ray_in_worker_initializes_once(monkeypatch):
 
 def test_init_ray_in_worker_respects_disable_dashboard_setting(monkeypatch):
     """Test that init_ray_in_worker respects DISABLE_RAY_DASHBOARD setting"""
-    tasks, fake_ray = import_tasks_with_fake_ray(monkeypatch, initialized=False)
+    tasks, fake_ray = import_tasks_with_fake_ray(
+        monkeypatch, initialized=False)
     # Patch DISABLE_RAY_DASHBOARD in tasks module to True
     monkeypatch.setattr(tasks, "DISABLE_RAY_DASHBOARD", True)
-    
+
     # First call initializes with include_dashboard=False
     tasks.init_ray_in_worker()
     assert fake_ray.inits and fake_ray.inits[-1]["configure_logging"] is False
@@ -397,14 +439,16 @@ def test_init_ray_in_worker_respects_disable_dashboard_setting(monkeypatch):
 
 def test_init_ray_in_worker_raises_on_init_failure(monkeypatch):
     """Test that init_ray_in_worker logs error and re-raises exception when ray.init() fails"""
-    tasks, fake_ray = import_tasks_with_fake_ray(monkeypatch, initialized=False)
-    
+    tasks, fake_ray = import_tasks_with_fake_ray(
+        monkeypatch, initialized=False)
+
     # Make ray.init() raise an exception
     init_exception = RuntimeError("Ray initialization failed")
+
     def failing_init(**kwargs):
         raise init_exception
     fake_ray.init = failing_init
-    
+
     # Verify that the exception is re-raised
     with pytest.raises(RuntimeError) as exc_info:
         tasks.init_ray_in_worker()
@@ -418,7 +462,8 @@ async def sample():
         return 42
 
     # Force RuntimeError in get_running_loop to trigger asyncio.run path
-    monkeypatch.setattr(asyncio, "get_running_loop", lambda: (_ for _ in ()).throw(RuntimeError("no loop")))
+    monkeypatch.setattr(asyncio, "get_running_loop", lambda: (
+        _ for _ in ()).throw(RuntimeError("no loop")))
     result = tasks.run_async(sample())
     assert result == 42
 
@@ -442,14 +487,17 @@ def run_until_complete(self, coro):
 def test_get_ray_actor_returns_actor(monkeypatch):
     tasks, fake_ray = import_tasks_with_fake_ray(monkeypatch, initialized=True)
 
-    actor_obj = types.SimpleNamespace(ping=types.SimpleNamespace(remote=lambda *a, **k: "pong"))
+    actor_obj = types.SimpleNamespace(
+        ping=types.SimpleNamespace(remote=lambda *a, **k: "pong"))
 
     class _ManagerHandle:
         def __init__(self, actor):
-            self.get_actor = types.SimpleNamespace(remote=lambda: "__actor_ref__")
+            self.get_actor = types.SimpleNamespace(
+                remote=lambda: "__actor_ref__")
             self._actor = actor
 
-    monkeypatch.setattr(tasks, "_get_or_create_global_pool_manager", lambda: _ManagerHandle(actor_obj))
+    monkeypatch.setattr(
+        tasks, "_get_or_create_global_pool_manager", lambda: _ManagerHandle(actor_obj))
     fake_ray.get_returns = {"__actor_ref__": actor_obj}
     actor = tasks.get_ray_actor()
     assert actor is actor_obj
@@ -483,10 +531,13 @@ class FakeActor:
         class P:
             def __init__(self, *a, **k):
                 self.args = (a, k)
+
         def __init__(self):
             self.calls = []
-            self.process_file = types.SimpleNamespace(remote=lambda *a, **k: "ref1")
-            self.store_chunks_in_redis = types.SimpleNamespace(remote=lambda *a, **k: None)
+            self.process_file = types.SimpleNamespace(
+                remote=lambda *a, **k: "ref1")
+            self.store_chunks_in_redis = types.SimpleNamespace(
+                remote=lambda *a, **k: None)
 
     monkeypatch.setattr(tasks, "get_ray_actor", lambda: FakeActor())
     # Mock ray.get to return chunks instead of reference
@@ -494,7 +545,8 @@ def __init__(self):
 
     self = FakeSelf("p1")
 
-    result = tasks.process(self, source=str(f), source_type="local", chunking_strategy="basic", index_name="idx", original_filename="a.txt")
+    result = tasks.process(self, source=str(f), source_type="local",
+                           chunking_strategy="basic", index_name="idx", original_filename="a.txt")
     assert result["redis_key"].startswith("dp:p1:chunks")
     # success state updated twice: STARTED and SUCCESS
     assert any(s.get("state") == tasks.states.SUCCESS for s in self.states)
@@ -512,15 +564,18 @@ def test_process_minio_path(monkeypatch):
 
     class FakeActor:
         def __init__(self):
-            self.process_file = types.SimpleNamespace(remote=lambda *a, **k: "ref")
-            self.store_chunks_in_redis = types.SimpleNamespace(remote=lambda *a, **k: None)
+            self.process_file = types.SimpleNamespace(
+                remote=lambda *a, **k: "ref")
+            self.store_chunks_in_redis = types.SimpleNamespace(
+                remote=lambda *a, **k: None)
 
     monkeypatch.setattr(tasks, "get_ray_actor", lambda: FakeActor())
     # Mock ray.get to return chunks
     fake_ray.get_returns = mock_chunks
 
     self = FakeSelf("m1")
-    result = tasks.process(self, source="http://minio/bucket/x", source_type="minio", chunking_strategy="basic")
+    result = tasks.process(self, source="http://minio/bucket/x",
+                           source_type="minio", chunking_strategy="basic")
     assert result["redis_key"].startswith("dp:m1:chunks")
     # Verify chunks_count is set
     success_state = [s for s in self.states if s.get(
@@ -955,7 +1010,7 @@ class DummyClientConnectorError(Exception):
     json.loads(str(ei.value))
 
 
-def test_process_and_forward_returns_empty_when_apply_async_none(monkeypatch):
+def test_submit_process_forward_chain_returns_empty_when_apply_async_none(monkeypatch):
     tasks, _ = import_tasks_with_fake_ray(monkeypatch)
 
     class FakeChain:
@@ -963,18 +1018,25 @@ def apply_async(self):
             return None
 
     monkeypatch.setattr(tasks, "chain", lambda *a, **k: FakeChain())
-    # Ensure process and forward are accessible from the tasks module for process_and_forward
-    # The function looks up process and forward from the module at runtime
     import backend.data_process.tasks as tasks_module
-    # Process and forward should already be shimmed in import_tasks_with_fake_ray
-    # But we need to ensure they're accessible in the module namespace
     tasks_module.process = tasks.process
     tasks_module.forward = tasks.forward
+    tasks_module.cleanup_source = tasks.cleanup_source
+    out = tasks.submit_process_forward_chain(
+        source="/a.txt", source_type="local", chunking_strategy="basic", index_name="idx")
+    assert out == ""
+
+
+def test_process_and_forward_returns_empty_when_apply_async_none(monkeypatch):
+    tasks, _ = import_tasks_with_fake_ray(monkeypatch)
+    monkeypatch.setattr(
+        tasks, "submit_process_forward_chain", lambda **kwargs: "")
     self = FakeSelf("chain_none")
     out = tasks.process_and_forward(
         self, source="/a.txt", source_type="local", chunking_strategy="basic", index_name="idx")
     assert out == ""
 
+
 def test_process_unsupported_source_type(monkeypatch):
     tasks, _ = import_tasks_with_fake_ray(monkeypatch, initialized=True)
     self = FakeSelf("e2")
@@ -991,14 +1053,16 @@ def test_forward_with_chunks_success(monkeypatch):
     monkeypatch.setattr(tasks, "get_file_size", lambda *a, **k: 123)
 
     # run_async should return a successful response matching formatted chunk count (1)
-    monkeypatch.setattr(tasks, "run_async", lambda coro: {"success": True, "total_indexed": 1, "total_submitted": 1, "message": "ok"})
+    monkeypatch.setattr(tasks, "run_async", lambda coro: {
+                        "success": True, "total_indexed": 1, "total_submitted": 1, "message": "ok"})
 
     self = FakeSelf("f1")
     chunks = [
         {"content": "text", "metadata": {"creation_date": "2024-01-01"}},
         {"content": "", "metadata": {}},
     ]
-    result = tasks.forward(self, processed_data={"chunks": chunks}, index_name="idx", source="/a.txt", source_type="local", original_filename="a.txt")
+    result = tasks.forward(self, processed_data={
+                           "chunks": chunks}, index_name="idx", source="/a.txt", source_type="local", original_filename="a.txt")
     assert result["chunks_stored"] == 1
 
 
@@ -1006,10 +1070,12 @@ def test_forward_partial_success_raises(monkeypatch):
     tasks, _ = import_tasks_with_fake_ray(monkeypatch)
     monkeypatch.setattr(tasks, "ELASTICSEARCH_SERVICE", "http://api")
     monkeypatch.setattr(tasks, "get_file_size", lambda *a, **k: 0)
-    monkeypatch.setattr(tasks, "run_async", lambda coro: {"success": True, "total_indexed": 0, "total_submitted": 1, "message": "partial"})
+    monkeypatch.setattr(tasks, "run_async", lambda coro: {
+                        "success": True, "total_indexed": 0, "total_submitted": 1, "message": "partial"})
     self = FakeSelf("f2")
     with pytest.raises(Exception) as ei:
-        tasks.forward(self, processed_data={"chunks": [{"content": "x", "metadata": {}}]}, index_name="idx", source="/a.txt", source_type="local")
+        tasks.forward(self, processed_data={"chunks": [{"content": "x", "metadata": {
+        }}]}, index_name="idx", source="/a.txt", source_type="local")
     json.loads(str(ei.value))
 
 
@@ -1017,7 +1083,8 @@ def test_forward_no_chunks_and_no_redis_key_raises(monkeypatch):
     tasks, _ = import_tasks_with_fake_ray(monkeypatch)
     self = FakeSelf("f3")
     with pytest.raises(Exception) as ei:
-        tasks.forward(self, processed_data={}, index_name="idx", source="/a.txt")
+        tasks.forward(self, processed_data={},
+                      index_name="idx", source="/a.txt")
     json.loads(str(ei.value))
 
 
@@ -1025,7 +1092,8 @@ def test_forward_formats_to_empty_then_raises(monkeypatch):
     tasks, _ = import_tasks_with_fake_ray(monkeypatch)
     self = FakeSelf("f4")
     with pytest.raises(Exception) as ei:
-        tasks.forward(self, processed_data={"chunks": [{"content": "  ", "metadata": {}}]}, index_name="idx", source="/a.txt")
+        tasks.forward(self, processed_data={"chunks": [
+                      {"content": "  ", "metadata": {}}]}, index_name="idx", source="/a.txt")
     json.loads(str(ei.value))
 
 
@@ -1035,7 +1103,8 @@ def test_forward_missing_es_env_raises(monkeypatch):
     monkeypatch.setattr(tasks, "get_file_size", lambda *a, **k: 0)
     self = FakeSelf("f5")
     with pytest.raises(Exception) as ei:
-        tasks.forward(self, processed_data={"chunks": [{"content": "x", "metadata": {}}]}, index_name="idx", source="/a.txt")
+        tasks.forward(self, processed_data={"chunks": [
+                      {"content": "x", "metadata": {}}]}, index_name="idx", source="/a.txt")
     json.loads(str(ei.value))
 
 
@@ -1047,22 +1116,27 @@ def test_forward_loads_chunks_from_redis(monkeypatch):
 
     class FakeRedisClient:
         def __init__(self):
-            self.kv = {"dp:rid:chunks": json.dumps([{"content": "x", "metadata": {}}])}
+            self.kv = {"dp:rid:chunks": json.dumps(
+                [{"content": "x", "metadata": {}}])}
+
         def get(self, k):
             return self.kv.get(k)
 
-    fake_redis_mod = types.SimpleNamespace(Redis=types.SimpleNamespace(from_url=lambda url, decode_responses=True: FakeRedisClient()))
+    fake_redis_mod = types.SimpleNamespace(Redis=types.SimpleNamespace(
+        from_url=lambda url, decode_responses=True: FakeRedisClient()))
     monkeypatch.setitem(sys.modules, "redis", fake_redis_mod)
 
     # run_async returns success for 1 chunk
-    monkeypatch.setattr(tasks, "run_async", lambda coro: {"success": True, "total_indexed": 1, "total_submitted": 1, "message": "ok"})
+    monkeypatch.setattr(tasks, "run_async", lambda coro: {
+                        "success": True, "total_indexed": 1, "total_submitted": 1, "message": "ok"})
 
     self = FakeSelf("f6")
-    result = tasks.forward(self, processed_data={"redis_key": "dp:rid:chunks"}, index_name="idx", source="/a.txt")
+    result = tasks.forward(self, processed_data={
+                           "redis_key": "dp:rid:chunks"}, index_name="idx", source="/a.txt")
     assert result["chunks_stored"] == 1
 
 
-def test_process_and_forward_returns_chain_id(monkeypatch):
+def test_submit_process_forward_chain_returns_chain_id(monkeypatch):
     tasks, _ = import_tasks_with_fake_ray(monkeypatch)
 
     class FakeResult:
@@ -1074,8 +1148,24 @@ def apply_async(self):
             return FakeResult("123")
 
     monkeypatch.setattr(tasks, "chain", lambda *a, **k: FakeChain())
+    import backend.data_process.tasks as tasks_module
+    tasks_module.process = tasks.process
+    tasks_module.forward = tasks.forward
+    tasks_module.cleanup_source = tasks.cleanup_source
+    chain_id = tasks.submit_process_forward_chain(
+        source="/a.txt", source_type="local", chunking_strategy="basic", index_name="idx")
+    assert chain_id == "123"
+
+
+def test_process_and_forward_returns_chain_id(monkeypatch):
+    tasks, _ = import_tasks_with_fake_ray(monkeypatch)
+    monkeypatch.setattr(
+        tasks, "submit_process_forward_chain",
+        lambda **kwargs: "123",
+    )
     self = FakeSelf("c1")
-    chain_id = tasks.process_and_forward(self, source="/a.txt", source_type="local", chunking_strategy="basic", index_name="idx")
+    chain_id = tasks.process_and_forward(
+        self, source="/a.txt", source_type="local", chunking_strategy="basic", index_name="idx")
     assert chain_id == "123"
 
 
@@ -1125,7 +1215,8 @@ def save_error_info(self, tid, reason):
         "backend.data_process.tasks.logger.info", lambda msg: infos.append(msg)
     )
     monkeypatch.setattr(
-        "backend.data_process.tasks.logger.error", lambda *a, **k: warnings.append(a[0])
+        "backend.data_process.tasks.logger.error", lambda *a, **k: warnings.append(
+            a[0])
     )
 
     # empty task_id
@@ -1196,7 +1287,8 @@ def test_process_error_fallback_when_save_error_raises(monkeypatch, tmp_path):
 
     # State should still be updated in fallback branch
     assert any(
-        s.get("meta", {}).get("stage") in {"text_extraction_failed", "extracting_text"}
+        s.get("meta", {}).get("stage") in {
+            "text_extraction_failed", "extracting_text"}
         for s in self.states
     ) or self.states == []
 
@@ -1211,7 +1303,8 @@ def test_process_error_truncates_reason_when_no_error_code(monkeypatch, tmp_path
     # Provide actor but make ray.get raise inside the try block
     class FakeActor:
         def __init__(self):
-            self.process_file = types.SimpleNamespace(remote=lambda *a, **k: "ref_err")
+            self.process_file = types.SimpleNamespace(
+                remote=lambda *a, **k: "ref_err")
             self.store_chunks_in_redis = types.SimpleNamespace(
                 remote=lambda *a, **k: None)
 
@@ -1258,13 +1351,15 @@ def test_forward_cancel_check_warning_then_continue(monkeypatch):
     monkeypatch.setattr(tasks, "ELASTICSEARCH_SERVICE", "http://api")
 
     # make cancellation check raise to hit warning path
-    monkeypatch.setattr(tasks, "get_redis_service", lambda: (_ for _ in ()).throw(RuntimeError("boom")))
+    monkeypatch.setattr(tasks, "get_redis_service", lambda: (
+        _ for _ in ()).throw(RuntimeError("boom")))
 
     # run index_documents normally via stubbed run_async returning success
     monkeypatch.setattr(
         tasks,
         "run_async",
-        lambda coro: {"success": True, "total_indexed": 1, "total_submitted": 1, "message": "ok"},
+        lambda coro: {"success": True, "total_indexed": 1,
+                      "total_submitted": 1, "message": "ok"},
     )
 
     self = FakeSelf("warn-cancel")
@@ -1463,7 +1558,8 @@ def post(self, *a, **k):
             index_name="idx",
             source="/a.txt",
         )
-    assert "Failed to connect to API" in str(exc.value) or "timeout" in str(exc.value).lower()
+    assert "Failed to connect to API" in str(
+        exc.value) or "timeout" in str(exc.value).lower()
 
 
 def test_forward_truncates_reason_when_no_error_code(monkeypatch):
@@ -1474,12 +1570,14 @@ def test_forward_truncates_reason_when_no_error_code(monkeypatch):
 
     long_msg = json.dumps({"message": "m" * 250})
     monkeypatch.setattr(
-        tasks, "run_async", lambda coro: (_ for _ in ()).throw(Exception(long_msg))
+        tasks, "run_async", lambda coro: (
+            _ for _ in ()).throw(Exception(long_msg))
     )
 
     reasons: list[str] = []
     monkeypatch.setattr(
-        tasks, "save_error_to_redis", lambda tid, reason, st: reasons.append(reason)
+        tasks, "save_error_to_redis", lambda tid, reason, st: reasons.append(
+            reason)
     )
 
     self = FakeSelf("f-trunc")
@@ -1505,12 +1603,14 @@ def test_forward_fallback_truncates_on_non_json_error(monkeypatch):
     monkeypatch.setattr(tasks, "extract_error_code", lambda *a, **k: None)
 
     monkeypatch.setattr(
-        tasks, "run_async", lambda coro: (_ for _ in ()).throw(Exception("n" * 250))
+        tasks, "run_async", lambda coro: (
+            _ for _ in ()).throw(Exception("n" * 250))
     )
 
     reasons: list[str] = []
     monkeypatch.setattr(
-        tasks, "save_error_to_redis", lambda tid, reason, st: reasons.append(reason)
+        tasks, "save_error_to_redis", lambda tid, reason, st: reasons.append(
+            reason)
     )
 
     self = FakeSelf("f-fallback")
@@ -1534,11 +1634,13 @@ def test_forward_error_truncates_reason_and_uses_save(monkeypatch):
     long_message = "m" * 250
     monkeypatch.setattr(tasks, "ELASTICSEARCH_SERVICE", "http://api")
     monkeypatch.setattr(
-        tasks, "run_async", lambda coro: (_ for _ in ()).throw(Exception(json.dumps({"message": long_message})))
+        tasks, "run_async", lambda coro: (_ for _ in ()).throw(
+            Exception(json.dumps({"message": long_message})))
     )
     captured = {}
     monkeypatch.setattr(
-        tasks, "save_error_to_redis", lambda tid, reason, st: captured.setdefault("reason", reason)
+        tasks, "save_error_to_redis", lambda tid, reason, st: captured.setdefault(
+            "reason", reason)
     )
 
     self = FakeSelf("trunc")
@@ -1557,11 +1659,13 @@ def test_forward_error_fallback_when_json_loads_fails(monkeypatch):
     tasks, _ = import_tasks_with_fake_ray(monkeypatch)
     monkeypatch.setattr(tasks, "ELASTICSEARCH_SERVICE", "http://api")
     monkeypatch.setattr(
-        tasks, "run_async", lambda coro: (_ for _ in ()).throw(Exception("not-json-error"))
+        tasks, "run_async", lambda coro: (
+            _ for _ in ()).throw(Exception("not-json-error"))
     )
     captured = {}
     monkeypatch.setattr(
-        tasks, "save_error_to_redis", lambda tid, reason, st: captured.setdefault("reason", reason)
+        tasks, "save_error_to_redis", lambda tid, reason, st: captured.setdefault(
+            "reason", reason)
     )
 
     self = FakeSelf("fallback-forward")
@@ -1584,7 +1688,8 @@ def test_process_sync_local_returns(monkeypatch):
 
     class FakeActor:
         def __init__(self):
-            self.process_file = types.SimpleNamespace(remote=lambda *a, **k: "ref1")
+            self.process_file = types.SimpleNamespace(
+                remote=lambda *a, **k: "ref1")
 
     monkeypatch.setattr(tasks, "get_ray_actor", lambda: FakeActor())
     fake_ray.get_returns = [{"content": "a"}, {"content": "b"}]
@@ -1614,13 +1719,16 @@ def test_build_balanced_batches_balances_image_chunks(monkeypatch):
         {"content": f"img-{i}", "process_source": tasks.IMAGE_METADATA_PROCESS_SOURCE}
         for i in range(6)
     ]
-    text_chunks = [{"content": f"txt-{i}", "process_source": "Unstructured"} for i in range(4)]
-    batches = tasks._build_balanced_batches(image_chunks + text_chunks, batch_size=4)
+    text_chunks = [{"content": f"txt-{i}",
+                    "process_source": "Unstructured"} for i in range(4)]
+    batches = tasks._build_balanced_batches(
+        image_chunks + text_chunks, batch_size=4)
 
     assert len(batches) == 3
     assert all(len(batch) <= 4 for batch in batches)
     image_counts = [
-        sum(1 for chunk in batch if chunk.get("process_source") == tasks.IMAGE_METADATA_PROCESS_SOURCE)
+        sum(1 for chunk in batch if chunk.get("process_source")
+            == tasks.IMAGE_METADATA_PROCESS_SOURCE)
         for batch in batches
     ]
     assert max(image_counts) - min(image_counts) <= 1
@@ -1645,6 +1753,7 @@ def test_forward_large_chunks_uses_chord_batches(monkeypatch):
     class _RedisSvc:
         def save_progress_info(self, *args, **kwargs):
             return True
+
         def is_task_cancelled(self, *args, **kwargs):
             return False
 
@@ -1653,12 +1762,15 @@ def is_task_cancelled(self, *args, **kwargs):
     class _Sig:
         def __init__(self, kwargs):
             self.kwargs = kwargs
+
         def set(self, **_kw):
             return self
 
     captured = {"group_sigs": None}
-    monkeypatch.setattr(tasks, "forward_part", types.SimpleNamespace(s=lambda **kwargs: _Sig(kwargs)))
-    monkeypatch.setattr(tasks, "aggregate_forward_parts", types.SimpleNamespace(s=lambda **kwargs: _Sig(kwargs)))
+    monkeypatch.setattr(tasks, "forward_part", types.SimpleNamespace(
+        s=lambda **kwargs: _Sig(kwargs)))
+    monkeypatch.setattr(tasks, "aggregate_forward_parts",
+                        types.SimpleNamespace(s=lambda **kwargs: _Sig(kwargs)))
 
     def _fake_group(sig_iter):
         sigs = list(sig_iter)
@@ -1667,9 +1779,11 @@ def _fake_group(sig_iter):
 
     def _fake_chord(group_tasks):
         def _runner(_callback):
-            total = sum(len(sig.kwargs.get("chunks", [])) for sig in group_tasks)
+            total = sum(len(sig.kwargs.get("chunks", []))
+                        for sig in group_tasks)
             return types.SimpleNamespace(
-                get=lambda: {"success": True, "total_indexed": total, "total_submitted": total, "message": "ok"}
+                get=lambda: {"success": True, "total_indexed": total,
+                             "total_submitted": total, "message": "ok"}
             )
         return _runner
 
@@ -1682,7 +1796,8 @@ def _fake_allow_join_result():
     monkeypatch.setattr(tasks, "allow_join_result", _fake_allow_join_result)
 
     self = FakeSelf("forward-batch")
-    large_chunks = [{"content": f"content-{i}", "metadata": {}} for i in range(70)]
+    large_chunks = [{"content": f"content-{i}", "metadata": {}}
+                    for i in range(70)]
     out = tasks.forward(
         self,
         processed_data={"chunks": large_chunks},
@@ -1695,7 +1810,8 @@ def _fake_allow_join_result():
     assert out["chunks_stored"] == 70
     assert captured["group_sigs"] is not None
     assert len(captured["group_sigs"]) == 2
-    assert all(sig.kwargs.get("large_mode") is True for sig in captured["group_sigs"])
+    assert all(sig.kwargs.get("large_mode")
+               is True for sig in captured["group_sigs"])
 
 
 def test_process_sync_unsupported_raises_and_updates_state(monkeypatch):
@@ -1703,13 +1819,15 @@ def test_process_sync_unsupported_raises_and_updates_state(monkeypatch):
     monkeypatch.setattr(
         tasks,
         "get_ray_actor",
-        lambda: types.SimpleNamespace(process_file=types.SimpleNamespace(remote=lambda *a, **k: "ref")),
+        lambda: types.SimpleNamespace(
+            process_file=types.SimpleNamespace(remote=lambda *a, **k: "ref")),
     )
     self = FakeSelf("s2")
     with pytest.raises(NotImplementedError):
         tasks.process_sync(self, source="/a.txt", source_type="minio")
     # check that failure meta was updated
-    assert any("sync_processing_failed" in s.get("meta", {}).get("stage", "") for s in self.states)
+    assert any("sync_processing_failed" in s.get(
+        "meta", {}).get("stage", "") for s in self.states)
 
 
 def test_forward_redis_key_requires_backend_url_raises(monkeypatch):
@@ -1931,7 +2049,8 @@ def get(self, key):
         Redis=types.SimpleNamespace(from_url=lambda *a, **k: FakeClient())
     )
     monkeypatch.setitem(sys.modules, "redis", fake_redis_mod)
-    assert tasks._wait_for_split_ready("dp:k", timeout_s=1, poll_interval_ms=1) == 2
+    assert tasks._wait_for_split_ready(
+        "dp:k", timeout_s=1, poll_interval_ms=1) == 2
 
     monkeypatch.setattr(tasks, "REDIS_BACKEND_URL", "")
     with pytest.raises(RuntimeError):
@@ -1950,7 +2069,8 @@ def get(self, key):
         Redis=types.SimpleNamespace(from_url=lambda *a, **k: ClientBadJson())
     )
     monkeypatch.setitem(sys.modules, "redis", fake_redis_mod)
-    assert tasks._wait_for_split_ready("dp:k", timeout_s=1, poll_interval_ms=1) == 0
+    assert tasks._wait_for_split_ready(
+        "dp:k", timeout_s=1, poll_interval_ms=1) == 0
 
     class ClientNeverReady:
         def get(self, key):
@@ -1959,7 +2079,8 @@ def get(self, key):
     monkeypatch.setitem(
         sys.modules,
         "redis",
-        types.SimpleNamespace(Redis=types.SimpleNamespace(from_url=lambda *a, **k: ClientNeverReady())),
+        types.SimpleNamespace(Redis=types.SimpleNamespace(
+            from_url=lambda *a, **k: ClientNeverReady())),
     )
     monkeypatch.setattr(tasks.time, "sleep", lambda _s: None)
     t = {"v": 0.0}
@@ -1988,7 +2109,8 @@ def test_estimate_parallel_parts_and_batch_helpers(monkeypatch):
 def test_extract_error_code_from_es_response_detail_string(monkeypatch):
     tasks, _ = import_tasks_with_fake_ray(monkeypatch)
     parsed = {"detail": "{\"error_code\":\"es_detail_code\"}"}
-    assert tasks._extract_error_code_from_es_response(parsed, "x") == "es_detail_code"
+    assert tasks._extract_error_code_from_es_response(
+        parsed, "x") == "es_detail_code"
 
 
 def test_run_async_loop_not_running_branch(monkeypatch):
@@ -2034,7 +2156,8 @@ class Actor:
         def __init__(self):
             self.ping = types.SimpleNamespace(remote=lambda: "pong")
 
-    monkeypatch.setattr(tasks, "DataProcessorRayActor", types.SimpleNamespace(remote=lambda: Actor()))
+    monkeypatch.setattr(tasks, "DataProcessorRayActor",
+                        types.SimpleNamespace(remote=lambda: Actor()))
     monkeypatch.setattr(tasks.ray, "get", lambda ref, timeout=None: True)
     manager = tasks.GlobalRayActorPoolManager(warm_timeout_s=1)
     assert manager.ensure_pool(desired=2, max_allowed=3) == 2
@@ -2048,8 +2171,10 @@ class Actor:
         def __init__(self):
             self.ping = types.SimpleNamespace(remote=lambda: "x")
 
-    monkeypatch.setattr(tasks, "DataProcessorRayActor", types.SimpleNamespace(remote=lambda: Actor()))
-    monkeypatch.setattr(tasks.ray, "get", lambda *a, **k: (_ for _ in ()).throw(RuntimeError("warm fail")))
+    monkeypatch.setattr(tasks, "DataProcessorRayActor",
+                        types.SimpleNamespace(remote=lambda: Actor()))
+    monkeypatch.setattr(tasks.ray, "get", lambda *a, **
+                        k: (_ for _ in ()).throw(RuntimeError("warm fail")))
     monkeypatch.setattr(tasks.ray, "kill", lambda *a, **k: None, raising=False)
     manager = tasks.GlobalRayActorPoolManager(warm_timeout_s=1)
     assert manager.ensure_pool(desired=1, max_allowed=1) == 0
@@ -2066,14 +2191,17 @@ def options(self, **_kw):
             raise TypeError("no get_if_exists")
 
     monkeypatch.setattr(tasks, "GlobalRayActorPoolManager", _Opts())
-    monkeypatch.setattr(tasks.ray, "get_actor", lambda *a, **k: "manager", raising=False)
+    monkeypatch.setattr(tasks.ray, "get_actor", lambda *a,
+                        **k: "manager", raising=False)
     assert tasks._get_or_create_global_pool_manager() == "manager"
 
 
 def test_prewarm_ray_actors(monkeypatch):
     tasks, fake_ray = import_tasks_with_fake_ray(monkeypatch)
-    manager = types.SimpleNamespace(ensure_pool=types.SimpleNamespace(remote=lambda **k: "ref"))
-    monkeypatch.setattr(tasks, "_get_or_create_global_pool_manager", lambda: manager)
+    manager = types.SimpleNamespace(
+        ensure_pool=types.SimpleNamespace(remote=lambda **k: "ref"))
+    monkeypatch.setattr(
+        tasks, "_get_or_create_global_pool_manager", lambda: manager)
     monkeypatch.setattr(tasks, "_estimate_parallel_parts", lambda: 4)
     monkeypatch.setattr(fake_ray, "get", lambda ref: 3)
     assert tasks.prewarm_ray_actors(target_size=3) == 3
@@ -2085,7 +2213,8 @@ def test_process_part_success_and_failure(monkeypatch):
 
     class Actor:
         def __init__(self):
-            self.process_bytes = types.SimpleNamespace(remote=lambda *a, **k: "chunks-ref")
+            self.process_bytes = types.SimpleNamespace(
+                remote=lambda *a, **k: "chunks-ref")
 
     monkeypatch.setattr(tasks, "get_ray_actor", lambda: Actor())
     fake_ray.get_returns = {"chunks-ref": [{"content": "x"}]}
@@ -2099,9 +2228,11 @@ def set(self, k, v):
         def expire(self, *a, **k):
             return True
 
-    monkeypatch.setitem(sys.modules, "redis", types.SimpleNamespace(Redis=types.SimpleNamespace(from_url=lambda *a, **k: Client())))
+    monkeypatch.setitem(sys.modules, "redis", types.SimpleNamespace(
+        Redis=types.SimpleNamespace(from_url=lambda *a, **k: Client())))
     out = tasks.process_part(
-        types.SimpleNamespace(request=types.SimpleNamespace(id="p1"), retry=lambda **k: None),
+        types.SimpleNamespace(request=types.SimpleNamespace(
+            id="p1"), retry=lambda **k: None),
         part_bytes=b"a", filename="a.txt", chunking_strategy="basic", part_redis_key="k1",
         source="s", source_type="local"
     )
@@ -2110,7 +2241,8 @@ def expire(self, *a, **k):
 
     monkeypatch.setattr(tasks, "REDIS_BACKEND_URL", "")
     out2 = tasks.process_part(
-        types.SimpleNamespace(request=types.SimpleNamespace(id="p2"), retry=lambda **k: None),
+        types.SimpleNamespace(request=types.SimpleNamespace(
+            id="p2"), retry=lambda **k: None),
         part_bytes=b"a", filename="a.txt", chunking_strategy="basic", part_redis_key="k2",
         source="s", source_type="local"
     )
@@ -2140,10 +2272,12 @@ def expire(self, *a, **k):
         def delete(self, k):
             kv.pop(k, None)
 
-    monkeypatch.setitem(sys.modules, "redis", types.SimpleNamespace(Redis=types.SimpleNamespace(from_url=lambda *a, **k: Client())))
+    monkeypatch.setitem(sys.modules, "redis", types.SimpleNamespace(
+        Redis=types.SimpleNamespace(from_url=lambda *a, **k: Client())))
     res = tasks.aggregate_store_chunks(
         self,
-        parts_results=[{"part_redis_key": "part1"}, {"part_redis_key": "part2"}],
+        parts_results=[{"part_redis_key": "part1"},
+                       {"part_redis_key": "part2"}],
         redis_key="maink",
         source="s",
         index_name="idx",
@@ -2158,7 +2292,8 @@ def test_forward_part_success_and_progress(monkeypatch):
     monkeypatch.setattr(
         tasks,
         "_send_chunks_to_es",
-        lambda **kwargs: {"success": True, "total_indexed": 2, "total_submitted": 2},
+        lambda **kwargs: {"success": True,
+                          "total_indexed": 2, "total_submitted": 2},
     )
     calls = {"inc": 0}
 
@@ -2173,7 +2308,8 @@ def increment_progress_info(self, **kwargs):
     monkeypatch.setattr(tasks, "get_redis_service", lambda: _Svc())
     self = types.SimpleNamespace(
         request=types.SimpleNamespace(id="fp1", retries=0),
-        retry=lambda **k: (_ for _ in ()).throw(RuntimeError("should not retry")),
+        retry=lambda **k: (_ for _ in ()
+                           ).throw(RuntimeError("should not retry")),
     )
     out = tasks.forward_part(
         self,
@@ -2190,14 +2326,16 @@ def increment_progress_info(self, **kwargs):
 
 def test_forward_part_failure_retries(monkeypatch):
     tasks, _ = import_tasks_with_fake_ray(monkeypatch)
-    monkeypatch.setattr(tasks, "_send_chunks_to_es", lambda **kwargs: {"success": False, "message": "bad"})
+    monkeypatch.setattr(tasks, "_send_chunks_to_es", lambda **
+                        kwargs: {"success": False, "message": "bad"})
     captured = {}
 
     def _retry(**kwargs):
         captured.update(kwargs)
         raise RuntimeError("retried")
 
-    self = types.SimpleNamespace(request=types.SimpleNamespace(id="fp2", retries=1), retry=_retry)
+    self = types.SimpleNamespace(
+        request=types.SimpleNamespace(id="fp2", retries=1), retry=_retry)
     with pytest.raises(RuntimeError, match="retried"):
         tasks.forward_part(
             self,
@@ -2231,11 +2369,14 @@ def test_run_processing_for_parts_single_and_multi(monkeypatch):
 
     class Actor:
         def __init__(self):
-            self.process_file = types.SimpleNamespace(remote=lambda *a, **k: "ref-file")
-            self.process_bytes = types.SimpleNamespace(remote=lambda *a, **k: "ref-bytes")
+            self.process_file = types.SimpleNamespace(
+                remote=lambda *a, **k: "ref-file")
+            self.process_bytes = types.SimpleNamespace(
+                remote=lambda *a, **k: "ref-bytes")
 
     monkeypatch.setattr(tasks, "get_ray_actor", lambda: Actor())
-    fake_ray.get_returns = {"ref-bytes": [{"content": "c1"}], "ref-file": [{"content": "cf"}]}
+    fake_ray.get_returns = {
+        "ref-bytes": [{"content": "c1"}], "ref-file": [{"content": "cf"}]}
 
     split_async, chunks, split_chunk_count = tasks._run_processing_for_parts(
         request_id="r1",
@@ -2256,10 +2397,13 @@ def __init__(self):
     assert split_chunk_count is None
 
     captured = {}
-    monkeypatch.setattr(tasks, "process_part", types.SimpleNamespace(s=lambda **kwargs: types.SimpleNamespace(kwargs=kwargs)))
-    monkeypatch.setattr(tasks, "aggregate_store_chunks", types.SimpleNamespace(s=lambda **kwargs: types.SimpleNamespace(set=lambda **kw: {"kwargs": kwargs, "set": kw})))
+    monkeypatch.setattr(tasks, "process_part", types.SimpleNamespace(
+        s=lambda **kwargs: types.SimpleNamespace(kwargs=kwargs)))
+    monkeypatch.setattr(tasks, "aggregate_store_chunks", types.SimpleNamespace(
+        s=lambda **kwargs: types.SimpleNamespace(set=lambda **kw: {"kwargs": kwargs, "set": kw})))
     monkeypatch.setattr(tasks, "group", lambda gen: list(gen))
-    monkeypatch.setattr(tasks, "chord", lambda group_tasks: (lambda callback: captured.update({"group": group_tasks, "callback": callback})))
+    monkeypatch.setattr(tasks, "chord", lambda group_tasks: (
+        lambda callback: captured.update({"group": group_tasks, "callback": callback})))
     monkeypatch.setattr(tasks, "_compute_split_wait_timeout", lambda n: 9)
     monkeypatch.setattr(tasks, "_estimate_parallel_parts", lambda: 2)
     monkeypatch.setattr(tasks, "_wait_for_split_ready", lambda **kwargs: 6)
@@ -2287,14 +2431,17 @@ def __init__(self):
 def test_process_split_async_redis_image_metadata_count(monkeypatch, tmp_path):
     tasks, _ = import_tasks_with_fake_ray(monkeypatch)
     monkeypatch.setattr(tasks, "REDIS_BACKEND_URL", "redis://test")
-    monkeypatch.setattr(tasks, "_process_source_with_split", lambda **kwargs: (True, None, 2))
-    monkeypatch.setattr(tasks, "_count_image_metadata_chunks", lambda chunks: 1)
+    monkeypatch.setattr(tasks, "_process_source_with_split",
+                        lambda **kwargs: (True, None, 2))
+    monkeypatch.setattr(
+        tasks, "_count_image_metadata_chunks", lambda chunks: 1)
 
     class FakeRedisClient:
         def get(self, key):
             return json.dumps([{"metadata": {"content_type": "image"}}, {"metadata": {}}])
 
-    monkeypatch.setitem(sys.modules, "redis", types.SimpleNamespace(Redis=types.SimpleNamespace(from_url=lambda *a, **k: FakeRedisClient())))
+    monkeypatch.setitem(sys.modules, "redis", types.SimpleNamespace(
+        Redis=types.SimpleNamespace(from_url=lambda *a, **k: FakeRedisClient())))
 
     f = tmp_path / "x.txt"
     f.write_text("hello")
@@ -2309,5 +2456,88 @@ def get(self, key):
     )
     assert out["split_async"] is True
     assert out["image_metadata_chunk_count"] == 1
-    success_state = [s for s in self.states if s.get("state") == tasks.states.SUCCESS][0]
+    success_state = [s for s in self.states if s.get(
+        "state") == tasks.states.SUCCESS][0]
     assert success_state["meta"]["chunks_count"] == 2
+
+
+def test_cleanup_source_skips_when_preserve_true(monkeypatch):
+    tasks, _ = import_tasks_with_fake_ray(monkeypatch)
+    monkeypatch.setattr(tasks, "ELASTICSEARCH_SERVICE", "http://api")
+    monkeypatch.setattr(tasks, "get_knowledge_record",
+                        lambda query=None: {"preserve_source_file": True})
+
+    called = {"delete": 0}
+
+    def _delete(*_a, **_k):
+        called["delete"] += 1
+        raise AssertionError(
+            "requests.delete should not be called when preserve_source_file is True")
+
+    monkeypatch.setattr(tasks.requests, "delete", _delete, raising=True)
+
+    self = FakeSelf("cleanup-skip-1")
+    out = tasks.cleanup_source(
+        self,
+        {"task_id": "t1", "index_name": "idx", "source": "/a.txt"},
+    )
+    assert out["source_cleanup"]["attempted"] is False
+    assert out["source_cleanup"]["skipped_reason"] == "preserve_source_file_true"
+    assert called["delete"] == 0
+
+
+def test_cleanup_source_calls_delete_with_scope_source_only(monkeypatch):
+    tasks, _ = import_tasks_with_fake_ray(monkeypatch)
+    monkeypatch.setattr(tasks, "ELASTICSEARCH_SERVICE", "http://api")
+    monkeypatch.setattr(tasks, "get_knowledge_record",
+                        lambda query=None: {"preserve_source_file": False})
+
+    captured = {}
+
+    class FakeResponse:
+        status_code = 200
+        text = ""
+
+        @staticmethod
+        def json():
+            return {"status": "success"}
+
+    def _delete(url, params=None, timeout=None):
+        captured["url"] = url
+        captured["params"] = params
+        captured["timeout"] = timeout
+        return FakeResponse()
+
+    monkeypatch.setattr(tasks.requests, "delete", _delete, raising=True)
+
+    self = FakeSelf("cleanup-call-1")
+    out = tasks.cleanup_source(
+        self,
+        {"task_id": "t1", "index_name": "idx", "source": "/a.txt"},
+    )
+    assert captured["url"] == "http://api/indices/idx/documents"
+    assert captured["params"]["path_or_url"] == "/a.txt"
+    assert captured["params"]["scope"] == "source_only"
+    assert out["source_cleanup"]["attempted"] is True
+    assert out["source_cleanup"]["success"] is True
+
+
+def test_cleanup_source_failure_is_warning_only(monkeypatch):
+    tasks, _ = import_tasks_with_fake_ray(monkeypatch)
+    monkeypatch.setattr(tasks, "ELASTICSEARCH_SERVICE", "http://api")
+    monkeypatch.setattr(tasks, "get_knowledge_record",
+                        lambda query=None: {"preserve_source_file": False})
+
+    def _delete(*_a, **_k):
+        raise RuntimeError("boom")
+
+    monkeypatch.setattr(tasks.requests, "delete", _delete, raising=True)
+
+    self = FakeSelf("cleanup-fail-1")
+    out = tasks.cleanup_source(
+        self,
+        {"task_id": "t1", "index_name": "idx", "source": "/a.txt"},
+    )
+    assert out["source_cleanup"]["attempted"] is True
+    assert out["source_cleanup"]["success"] is False
+    assert "boom" in (out["source_cleanup"]["error"] or "")
diff --git a/test/backend/data_process/test_worker.py b/test/backend/data_process/test_worker.py
index da4408e2f..79875ba5a 100644
--- a/test/backend/data_process/test_worker.py
+++ b/test/backend/data_process/test_worker.py
@@ -185,7 +185,12 @@ def __init__(self, chunking_strategy: str, source_type: str, index_name: str, au
             get_model_by_model_id=lambda model_id, tenant_id=None: None
         )
         setattr(sys.modules["database"], "model_management_db", sys.modules["database.model_management_db"])
-    
+    if "database.knowledge_db" not in sys.modules:
+        sys.modules["database.knowledge_db"] = types.SimpleNamespace(
+            get_knowledge_record=lambda query=None: {},
+        )
+        setattr(sys.modules["database"], "knowledge_db", sys.modules["database.knowledge_db"])
+
     # Stub utils modules (required by utils.file_management_utils)
     if "utils.auth_utils" not in sys.modules:
         sys.modules["utils.auth_utils"] = types.SimpleNamespace(
@@ -213,6 +218,19 @@ def __init__(self, chunking_strategy: str, source_type: str, index_name: str, au
         sys.modules["httpx"] = types.SimpleNamespace()
     if "requests" not in sys.modules:
         sys.modules["requests"] = types.SimpleNamespace()
+    if "redis" not in sys.modules:
+        sys.modules["redis"] = types.SimpleNamespace(
+            Redis=types.SimpleNamespace(
+                from_url=lambda *args, **kwargs: types.SimpleNamespace(
+                    get=lambda *a, **k: None,
+                    set=lambda *a, **k: True,
+                    expire=lambda *a, **k: True,
+                    delete=lambda *a, **k: True,
+                    ping=lambda: True,
+                )
+            ),
+            from_url=lambda *args, **kwargs: types.SimpleNamespace(ping=lambda: True),
+        )
     if "fastapi" not in sys.modules:
         fastapi_mod = types.ModuleType("fastapi")
         fastapi_mod.UploadFile = type("UploadFile", (), {})
@@ -223,7 +241,27 @@ def __init__(self, chunking_strategy: str, source_type: str, index_name: str, au
         file_utils_mod = types.ModuleType("utils.file_management_utils")
         file_utils_mod.get_file_size = lambda *args, **kwargs: 0
         sys.modules["utils.file_management_utils"] = file_utils_mod
-    
+
+    # Stub services.redis_service (required by tasks.py via package __init__)
+    if "services.redis_service" not in sys.modules:
+        redis_service_mod = types.ModuleType("services.redis_service")
+
+        class _StubRedisService:
+            def save_error_info(self, *args, **kwargs):
+                return True
+
+            def is_task_cancelled(self, *args, **kwargs):
+                return False
+
+            def save_progress_info(self, *args, **kwargs):
+                return True
+
+            def increment_progress_info(self, *args, **kwargs):
+                return True
+
+        redis_service_mod.get_redis_service = lambda: _StubRedisService()
+        sys.modules["services.redis_service"] = redis_service_mod
+
     # Stub ray_actors (required by tasks.py)
     if "backend.data_process.ray_actors" not in sys.modules:
         ray_actors_mod = types.ModuleType("backend.data_process.ray_actors")
diff --git a/test/backend/database/test_agent_db.py b/test/backend/database/test_agent_db.py
index de2ed8864..77a1d82a9 100644
--- a/test/backend/database/test_agent_db.py
+++ b/test/backend/database/test_agent_db.py
@@ -77,6 +77,12 @@
 db_models_mock.ToolInstance = MagicMock()
 db_models_mock.AgentRelation = MagicMock()
 
+# Mock database.agent_version_db before agent_db imports it
+agent_version_db_mock = MagicMock()
+agent_version_db_mock.query_current_version_no = MagicMock(return_value=3)
+sys.modules['database.agent_version_db'] = agent_version_db_mock
+sys.modules['backend.database.agent_version_db'] = agent_version_db_mock
+
 # 将模拟的db_models模块添加到sys.modules中
 sys.modules['database.db_models'] = db_models_mock
 sys.modules['backend.database.db_models'] = db_models_mock
@@ -87,6 +93,8 @@
     search_agent_id_by_agent_name,
     search_blank_sub_agent_by_main_agent_id,
     query_sub_agents_id_list,
+    query_sub_agent_relations,
+    resolve_sub_agent_version_no,
     create_agent,
     update_agent,
     delete_agent_by_id,
@@ -124,13 +132,17 @@ def __init__(self):
         self.group_ids = None
         self.is_new = True
         self.enable_context_manager = False
+        self.verification_config = None
+        self.greeting_message = None
+        self.example_questions = None
         self.current_version_no = None
         self.version_no = 0
         self.created_by = None
 
 class MockAgentRelation:
-    def __init__(self):
+    def __init__(self, selected_agent_version_no=None):
         self.selected_agent_id = 2
+        self.selected_agent_version_no = selected_agent_version_no
 
 @pytest.fixture
 def mock_session():
@@ -276,6 +288,69 @@ def test_query_sub_agents_id_list(monkeypatch, mock_session):
 
     assert result == [2]
 
+
+def test_query_sub_agent_relations(monkeypatch, mock_session):
+    """Test querying sub-agent relations including pinned version"""
+    session, query = mock_session
+    mock_relation = MockAgentRelation(selected_agent_version_no=2)
+
+    mock_all = MagicMock()
+    mock_all.return_value = [mock_relation]
+    mock_filter = MagicMock()
+    mock_filter.all = mock_all
+    query.filter.return_value = mock_filter
+
+    mock_ctx = MagicMock()
+    mock_ctx.__enter__.return_value = session
+    mock_ctx.__exit__.return_value = None
+    monkeypatch.setattr("backend.database.agent_db.get_db_session", lambda: mock_ctx)
+    monkeypatch.setattr("backend.database.agent_db.as_dict", lambda obj: obj.__dict__)
+
+    result = query_sub_agent_relations(1, "tenant1", version_no=1)
+
+    assert len(result) == 1
+    assert result[0]["selected_agent_id"] == 2
+    assert result[0]["selected_agent_version_no"] == 2
+
+
+def test_resolve_sub_agent_version_no_pinned(monkeypatch):
+    """Test resolve uses pinned version when set"""
+    result = resolve_sub_agent_version_no(
+        selected_agent_id=2,
+        selected_agent_version_no=5,
+        tenant_id="tenant1",
+    )
+    assert result == 5
+
+
+def test_resolve_sub_agent_version_no_fallback(monkeypatch):
+    """Test resolve falls back to child current_version_no when pin is NULL"""
+    monkeypatch.setattr(
+        "backend.database.agent_db.query_current_version_no",
+        MagicMock(return_value=3),
+    )
+    result = resolve_sub_agent_version_no(
+        selected_agent_id=2,
+        selected_agent_version_no=None,
+        tenant_id="tenant1",
+    )
+    assert result == 3
+
+
+def test_resolve_sub_agent_version_no_fallback_to_draft(monkeypatch):
+    """Test resolve falls back to draft when child has no published version"""
+    monkeypatch.setattr(
+        "backend.database.agent_db.query_current_version_no",
+        MagicMock(return_value=None),
+    )
+    result = resolve_sub_agent_version_no(
+        selected_agent_id=2,
+        selected_agent_version_no=None,
+        tenant_id="tenant1",
+    )
+    assert result == 0
+
+
 def test_create_agent_success(monkeypatch, mock_session):
     """测试成功创建agent"""
     session, query = mock_session
diff --git a/test/backend/database/test_agent_version_db.py b/test/backend/database/test_agent_version_db.py
index cd9ad8714..fd354b29c 100644
--- a/test/backend/database/test_agent_version_db.py
+++ b/test/backend/database/test_agent_version_db.py
@@ -171,6 +171,7 @@ def __init__(self):
         self.id = 1
         self.parent_agent_id = 1
         self.selected_agent_id = 2
+        self.selected_agent_version_no = 3
         self.tenant_id = "tenant1"
         self.version_no = 1
         self.delete_flag = "N"
@@ -178,6 +179,7 @@ def __init__(self):
             "id": 1,
             "parent_agent_id": 1,
             "selected_agent_id": 2,
+            "selected_agent_version_no": 3,
             "tenant_id": "tenant1",
             "version_no": 1,
             "delete_flag": "N",
@@ -542,6 +544,25 @@ def query_side_effect(model_class):
     assert tools_list[0]["tool_id"] == 1
     assert len(relations_list) == 1
     assert relations_list[0]["selected_agent_id"] == 2
+    assert relations_list[0]["selected_agent_version_no"] == 3
+
+
+def test_restore_agent_draft_relation_copy_preserves_selected_agent_version_no():
+    """Verify restore draft relation copy keeps selected_agent_version_no unchanged."""
+    rel = {
+        "relation_id": 10,
+        "parent_agent_id": 1,
+        "selected_agent_id": 2,
+        "selected_agent_version_no": 3,
+        "tenant_id": "tenant1",
+        "version_no": 2,
+    }
+    rel_copy = {k: v for k, v in rel.items() if k not in ("version_no",)}
+    rel_copy["version_no"] = 0
+
+    assert rel_copy["selected_agent_version_no"] == 3
+    assert rel_copy["version_no"] == 0
+    assert rel_copy["selected_agent_id"] == 2
 
 
 def test_query_agent_snapshot_no_agent(monkeypatch, mock_session):
diff --git a/test/backend/services/test_agent_repository_service.py b/test/backend/services/test_agent_repository_service.py
new file mode 100644
index 000000000..648d20385
--- /dev/null
+++ b/test/backend/services/test_agent_repository_service.py
@@ -0,0 +1,398 @@
+"""Unit tests for agent marketplace repository service."""
+
+import sys
+from pathlib import Path
+from unittest.mock import AsyncMock, MagicMock, patch
+
+import pytest
+
+_REPO_ROOT = Path(__file__).resolve().parents[3]
+if str(_REPO_ROOT) not in sys.path:
+    sys.path.insert(0, str(_REPO_ROOT))
+
+# Mock DB layer before importing the service under test
+sys.modules.setdefault("sqlalchemy", MagicMock())
+sys.modules.setdefault("sqlalchemy.dialects", MagicMock())
+sys.modules.setdefault("sqlalchemy.dialects.postgresql", MagicMock())
+
+_agent_repo_db_mock = MagicMock()
+_agent_repo_db_mock.STATUS_PENDING_REVIEW = "PENDING_REVIEW"
+_agent_repo_db_mock.VALID_REPOSITORY_STATUSES = frozenset({
+    "NOT_SHARED",
+    "PENDING_REVIEW",
+    "REJECTED",
+    "SHARED",
+})
+_agent_repo_db_mock.get_agent_repository_by_id = MagicMock()
+_agent_repo_db_mock.get_agent_repository_by_agent_id = MagicMock()
+_agent_repo_db_mock.insert_agent_repository_record = MagicMock()
+_agent_repo_db_mock.update_agent_repository_by_id = MagicMock()
+sys.modules["database.agent_repository_db"] = _agent_repo_db_mock
+
+_agent_db_mock = MagicMock()
+_agent_db_mock.search_agent_info_by_agent_id = MagicMock()
+sys.modules["database.agent_db"] = _agent_db_mock
+
+_agent_version_db_mock = MagicMock()
+_agent_version_db_mock.search_version_by_version_no = MagicMock()
+sys.modules["database.agent_version_db"] = _agent_version_db_mock
+
+class _SkillZipEntryMock:
+    def __init__(self, skill_name: str, skill_zip_base64: str):
+        self.skill_name = skill_name
+        self.skill_zip_base64 = skill_zip_base64
+
+
+class _AgentRepositorySnapshotMock:
+    def __init__(self, **kwargs):
+        self._data = kwargs
+
+    def model_dump(self):
+        data = dict(self._data)
+        skills = data.get("skills")
+        if skills:
+            data["skills"] = [
+                {
+                    "skill_name": entry.skill_name,
+                    "skill_zip_base64": entry.skill_zip_base64,
+                }
+                for entry in skills
+            ]
+        return data
+
+
+_consts_model_mock = MagicMock()
+_consts_model_mock.AgentRepositorySnapshot = _AgentRepositorySnapshotMock
+_consts_model_mock.SkillZipEntry = _SkillZipEntryMock
+sys.modules["consts.model"] = _consts_model_mock
+
+_agent_service_mock = MagicMock()
+_agent_service_mock.collect_skill_zip_entries = MagicMock(return_value=[])
+_agent_service_mock.export_agent_dict_for_repository_impl = AsyncMock(return_value={
+    "agent_id": 1,
+    "agent_info": {
+        "1": {
+            "agent_id": 1,
+            "name": "agent_one",
+            "description": "desc",
+            "business_description": "biz",
+            "max_steps": 5,
+            "provide_run_summary": False,
+            "enabled": True,
+            "tools": [],
+            "managed_agents": [],
+        }
+    },
+    "mcp_info": [],
+})
+sys.modules["services.agent_service"] = _agent_service_mock
+
+from consts.const import ASSET_OWNER_TENANT_ID
+
+from backend.services import agent_repository_service as ars
+
+
+@pytest.mark.asyncio
+async def test_create_agent_repository_listing_impl_success():
+    agent_info_json = {
+        "agent_id": 1,
+        "agent_info": {"1": {"agent_id": 1, "name": "agent_one"}},
+        "mcp_info": [],
+        "skills": None,
+    }
+    with patch.object(
+        ars, "_build_repository_data_from_agent", new_callable=AsyncMock
+    ) as mock_build_data, patch.object(
+        ars, "get_agent_repository_by_agent_id"
+    ) as mock_get_by_agent_id, patch.object(
+        ars, "insert_agent_repository_record"
+    ) as mock_insert, patch.object(
+        ars, "get_agent_repository_by_id"
+    ) as mock_get_by_id:
+        mock_build_data.return_value = {
+            "agent_id": 1,
+            "source_version_no": 1,
+            "name": "agent_one",
+            "agent_info_json": agent_info_json,
+            "status": "PENDING_REVIEW",
+        }
+        mock_get_by_agent_id.return_value = None
+        mock_insert.return_value = 42
+        mock_get_by_id.return_value = {
+            "agent_repository_id": 42,
+            "agent_id": 1,
+            "name": "agent_one",
+            "agent_info_json": agent_info_json,
+            "source_version_no": 1,
+            "status": "PENDING_REVIEW",
+            "tags": [],
+        }
+
+        result = await ars.create_agent_repository_listing_impl(
+            agent_id=1,
+            tenant_id="tenant_a",
+            user_id="user_a",
+            version_no=1,
+        )
+
+    assert result["agent_repository_id"] == 42
+    assert result["agent_info_json"] == agent_info_json
+    assert result["is_updated"] is False
+    mock_insert.assert_called_once()
+    mock_get_by_agent_id.assert_called_once_with(1)
+
+
+@pytest.mark.asyncio
+async def test_create_agent_repository_listing_impl_updates_existing():
+    agent_info_json = {
+        "agent_id": 1,
+        "agent_info": {"1": {"agent_id": 1, "name": "agent_one"}},
+        "mcp_info": [],
+        "skills": None,
+    }
+    with patch.object(
+        ars, "_build_repository_data_from_agent", new_callable=AsyncMock
+    ) as mock_build_data, patch.object(
+        ars, "get_agent_repository_by_agent_id"
+    ) as mock_get_by_agent_id, patch.object(
+        ars, "update_agent_repository_by_id"
+    ) as mock_update, patch.object(
+        ars, "get_agent_repository_by_id"
+    ) as mock_get_by_id:
+        mock_build_data.return_value = {
+            "agent_id": 1,
+            "source_version_no": 2,
+            "name": "agent_one",
+            "agent_info_json": agent_info_json,
+            "status": "PENDING_REVIEW",
+        }
+        mock_get_by_agent_id.return_value = {"agent_repository_id": 42}
+        mock_update.return_value = 1
+        mock_get_by_id.return_value = {
+            "agent_repository_id": 42,
+            "agent_id": 1,
+            "name": "agent_one",
+            "agent_info_json": agent_info_json,
+            "source_version_no": 2,
+            "status": "PENDING_REVIEW",
+            "tags": [],
+        }
+
+        result = await ars.create_agent_repository_listing_impl(
+            agent_id=1,
+            tenant_id="tenant_a",
+            user_id="user_a",
+            version_no=2,
+        )
+
+    assert result["agent_repository_id"] == 42
+    assert result["is_updated"] is True
+    mock_update.assert_called_once()
+    mock_update.assert_called_with(
+        repository_id=42,
+        publisher_tenant_id="tenant_a",
+        user_id="user_a",
+        updates={
+            "source_version_no": 2,
+            "agent_info_json": agent_info_json,
+            "status": "PENDING_REVIEW",
+        },
+    )
+
+
+@pytest.mark.asyncio
+async def test_create_agent_repository_listing_impl_accepts_draft_version():
+    agent_info_json = {
+        "agent_id": 1,
+        "agent_info": {"1": {"agent_id": 1, "name": "agent_one"}},
+        "mcp_info": [],
+        "skills": None,
+    }
+    with patch.object(
+        ars, "_build_repository_data_from_agent", new_callable=AsyncMock
+    ) as mock_build_data, patch.object(
+        ars, "get_agent_repository_by_agent_id"
+    ) as mock_get_by_agent_id, patch.object(
+        ars, "insert_agent_repository_record"
+    ) as mock_insert, patch.object(
+        ars, "get_agent_repository_by_id"
+    ) as mock_get_by_id:
+        mock_build_data.return_value = {
+            "agent_id": 1,
+            "source_version_no": 0,
+            "name": "agent_one",
+            "agent_info_json": agent_info_json,
+            "status": "PENDING_REVIEW",
+        }
+        mock_get_by_agent_id.return_value = None
+        mock_insert.return_value = 42
+        mock_get_by_id.return_value = {
+            "agent_repository_id": 42,
+            "agent_id": 1,
+            "name": "agent_one",
+            "agent_info_json": agent_info_json,
+            "source_version_no": 0,
+            "status": "PENDING_REVIEW",
+            "tags": [],
+        }
+
+        result = await ars.create_agent_repository_listing_impl(
+            agent_id=1,
+            tenant_id="tenant_a",
+            user_id="user_a",
+            version_no=0,
+        )
+
+    assert result["agent_repository_id"] == 42
+    assert result["source_version_no"] == 0
+    mock_build_data.assert_awaited_once_with(1, "tenant_a", "user_a", 0)
+
+
+@pytest.mark.asyncio
+async def test_create_agent_repository_listing_impl_rejects_negative_version():
+    with pytest.raises(ValueError, match="version_no must be >= 0"):
+        await ars.create_agent_repository_listing_impl(
+            agent_id=1,
+            tenant_id="tenant_a",
+            user_id="user_a",
+            version_no=-1,
+        )
+
+
+def test_validate_create_payload_requires_agent_info_json():
+    with pytest.raises(ValueError, match="agent_info_json"):
+        ars._validate_create_payload({
+            "agent_id": 1,
+            "source_version_no": 1,
+            "name": "agent_one",
+        })
+
+    with pytest.raises(ValueError, match="agent_info_json must contain"):
+        ars._validate_create_payload({
+            "agent_id": 1,
+            "source_version_no": 1,
+            "name": "agent_one",
+            "agent_info_json": {"agent_id": 1},
+        })
+
+
+@pytest.mark.asyncio
+async def test_build_repository_data_from_agent_includes_skills():
+    SkillZipEntry = _consts_model_mock.SkillZipEntry
+
+    _agent_db_mock.search_agent_info_by_agent_id.return_value = {
+        "name": "agent_one",
+        "display_name": "Agent One",
+        "description": "desc",
+        "author": "author",
+    }
+    _agent_service_mock.export_agent_dict_for_repository_impl.return_value = {
+        "agent_id": 1,
+        "agent_info": {
+            "1": {
+                "agent_id": 1,
+                "name": "agent_one",
+                "description": "desc",
+                "business_description": "biz",
+                "max_steps": 5,
+                "provide_run_summary": False,
+                "enabled": True,
+                "tools": [],
+                "managed_agents": [],
+            }
+        },
+        "mcp_info": [],
+    }
+    _agent_service_mock.collect_skill_zip_entries.return_value = [
+        SkillZipEntry(skill_name="SkillA", skill_zip_base64="abc=")
+    ]
+    _agent_version_db_mock.search_version_by_version_no.return_value = {
+        "version_name": "v1.0"
+    }
+
+    result = await ars._build_repository_data_from_agent(
+        agent_id=1,
+        tenant_id="tenant_a",
+        user_id="user_a",
+        version_no=1,
+    )
+
+    assert result["agent_info_json"]["agent_id"] == 1
+    assert result["agent_info_json"]["skills"][0]["skill_name"] == "SkillA"
+    assert result["version_label"] == "v1.0"
+
+
+def test_validate_agent_info_json_rejects_asset_owner_agent():
+    agent_info_json = {
+        "agent_id": 1,
+        "agent_info": {
+            "1": {"agent_id": 1, "tenant_id": ASSET_OWNER_TENANT_ID, "name": "owner_agent"},
+        },
+        "mcp_info": [],
+    }
+    with pytest.raises(ValueError, match="租户管理员智能体无法共享"):
+        ars._validate_agent_info_json_shareable(agent_info_json)
+
+
+def test_validate_agent_info_json_allows_normal_tenant():
+    agent_info_json = {
+        "agent_id": 1,
+        "agent_info": {
+            "1": {"agent_id": 1, "tenant_id": "tenant_a", "name": "agent_one"},
+            "2": {"agent_id": 2, "tenant_id": "tenant_b", "name": "sub_agent"},
+        },
+        "mcp_info": [],
+    }
+    ars._validate_agent_info_json_shareable(agent_info_json)
+
+
+@pytest.mark.asyncio
+async def test_build_repository_data_from_agent_rejects_asset_owner():
+    _agent_db_mock.search_agent_info_by_agent_id.return_value = {
+        "name": "agent_one",
+        "display_name": "Agent One",
+        "description": "desc",
+        "author": "author",
+    }
+    _agent_service_mock.export_agent_dict_for_repository_impl.return_value = {
+        "agent_id": 1,
+        "agent_info": {
+            "1": {
+                "agent_id": 1,
+                "tenant_id": "tenant_a",
+                "name": "agent_one",
+                "description": "desc",
+                "business_description": "biz",
+                "max_steps": 5,
+                "provide_run_summary": False,
+                "enabled": True,
+                "tools": [],
+                "managed_agents": [],
+            },
+            "2": {
+                "agent_id": 2,
+                "tenant_id": ASSET_OWNER_TENANT_ID,
+                "name": "sub_owner_agent",
+                "description": "desc",
+                "business_description": "biz",
+                "max_steps": 5,
+                "provide_run_summary": False,
+                "enabled": True,
+                "tools": [],
+                "managed_agents": [],
+            },
+        },
+        "mcp_info": [],
+    }
+    _agent_service_mock.collect_skill_zip_entries.return_value = []
+    _agent_version_db_mock.search_version_by_version_no.return_value = {
+        "version_name": "v1.0"
+    }
+
+    with pytest.raises(ValueError, match="租户管理员智能体无法共享"):
+        await ars._build_repository_data_from_agent(
+            agent_id=1,
+            tenant_id="tenant_a",
+            user_id="user_a",
+            version_no=1,
+        )
diff --git a/test/backend/services/test_agent_service.py b/test/backend/services/test_agent_service.py
index 86c8a5e2c..6cd7b5da4 100644
--- a/test/backend/services/test_agent_service.py
+++ b/test/backend/services/test_agent_service.py
@@ -92,6 +92,7 @@ def model_dump(self, **kwargs):
 sys.modules['services.agent_version_service'] = agent_version_service_mock
 sys.modules['services.skill_service'] = skill_service_mock
 sys.modules['services.prompt_template_service'] = prompt_template_service_mock
+sys.modules['services.file_management_service'] = MagicMock()
 sys.modules['services.skill_service'] = MagicMock()
 setattr(services_module, 'skill_service', sys.modules['services.skill_service'])
 
@@ -332,6 +333,10 @@ def apply_default_prompt_template_request_fields(request, prompt_template_id=Non
         request.related_agent_ids = None
     if not hasattr(request, "enabled_tool_ids"):
         request.enabled_tool_ids = None
+    if not hasattr(request, "example_questions"):
+        request.example_questions = None
+    if not hasattr(request, "greeting_message"):
+        request.greeting_message = None
     return request
 
 
@@ -500,6 +505,7 @@ async def test_get_agent_info_impl_success(mock_search_agent_info, mock_search_t
     mock_check_availability.assert_called_once()
 
 
+@patch('backend.services.agent_service.query_current_version_no')
 @patch('backend.services.agent_service.SkillService')
 @patch('backend.services.agent_service.query_external_sub_agents')
 @patch('backend.services.agent_service.check_agent_availability')
@@ -508,7 +514,7 @@ async def test_get_agent_info_impl_success(mock_search_agent_info, mock_search_t
 @patch('backend.services.agent_service.search_tools_for_sub_agent')
 @patch('backend.services.agent_service.search_agent_info_by_agent_id')
 @pytest.mark.asyncio
-async def test_get_agent_info_impl_with_version_no(mock_search_agent_info, mock_search_tools, mock_query_sub_agents_id, mock_get_model_by_model_id, mock_check_availability, mock_query_external_sub_agents, mock_skill_service):
+async def test_get_agent_info_impl_with_version_no(mock_search_agent_info, mock_search_tools, mock_query_sub_agents_id, mock_get_model_by_model_id, mock_check_availability, mock_query_external_sub_agents, mock_skill_service, mock_query_current_version_no):
     """
     Test get_agent_info_impl with explicit version_no parameter.
 
@@ -544,6 +550,9 @@ async def test_get_agent_info_impl_with_version_no(mock_search_agent_info, mock_
     # Mock check_agent_availability - agent is available
     mock_check_availability.return_value = (True, [])
 
+    # Mock query_current_version_no - return 5 as the current version
+    mock_query_current_version_no.return_value = 5
+
     # Execute with explicit version_no
     result = await get_agent_info_impl(agent_id=123, tenant_id="test_tenant", version_no=5)
 
@@ -561,7 +570,8 @@ async def test_get_agent_info_impl_with_version_no(mock_search_agent_info, mock_
         "prompt_template_id": 0,
         "prompt_template_name": "system_default",
         "is_available": True,
-        "unavailable_reasons": []
+        "unavailable_reasons": [],
+        "current_version_no": 5
     }
     assert result == expected_result
     # Verify version_no is passed correctly
@@ -571,6 +581,8 @@ async def test_get_agent_info_impl_with_version_no(mock_search_agent_info, mock_
     mock_query_sub_agents_id.assert_called_once_with(
         main_agent_id=123, tenant_id="test_tenant")
     mock_check_availability.assert_called_once()
+    # Verify query_current_version_no is called for version_no > 0
+    mock_query_current_version_no.assert_called_once_with(123, "test_tenant")
 
 
 @patch('backend.services.agent_service.get_model_by_model_id')
@@ -744,6 +756,7 @@ async def test_update_agent_info_impl_exception_handling(mock_get_current_user_i
     request.display_name = "Test Display Name"
     request.enabled_tool_ids = None
     request.related_agent_ids = None
+    request.example_questions = None
     apply_default_prompt_template_request_fields(request)
 
     # Execute & Assert
@@ -1430,7 +1443,7 @@ async def test_export_agent_impl_success(mock_get_current_user_info, mock_export
     # Verify function calls
     mock_get_current_user_info.assert_called_once_with("Bearer token")
     mock_export_agent_by_id.assert_called_once_with(
-        agent_id=123, tenant_id="test_tenant", user_id="test_user")
+        agent_id=123, tenant_id="test_tenant", user_id="test_user", version_no=0)
     mock_get_mcp_server.assert_called_once_with(
         "test_mcp_server", "test_tenant")
     mock_export_data_format.assert_called_once()
@@ -1510,7 +1523,7 @@ async def test_export_agent_impl_no_mcp_tools(mock_get_current_user_info, mock_e
     # Verify function calls
     mock_get_current_user_info.assert_called_once_with("Bearer token")
     mock_export_agent_by_id.assert_called_once_with(
-        agent_id=123, tenant_id="test_tenant", user_id="test_user")
+        agent_id=123, tenant_id="test_tenant", user_id="test_user", version_no=0)
     # Should not be called when no MCP tools
     mock_get_mcp_server.assert_not_called()
     mock_export_data_format.assert_called_once()
@@ -2982,7 +2995,8 @@ async def test_export_agent_by_agent_id_success(mock_search_agent_info, mock_cre
         "duty_prompt": "Test duty prompt",
         "constraint_prompt": "Test constraint prompt",
         "few_shots_prompt": "Test few shots prompt",
-        "enabled": True
+        "enabled": True,
+        "tenant_id": "test_tenant",
     }
     mock_search_agent_info.return_value = mock_agent_info
 
@@ -3058,6 +3072,7 @@ async def test_export_agent_by_agent_id_success(mock_search_agent_info, mock_cre
 
     # Assert
     assert result.agent_id == 123
+    assert result.tenant_id == "test_tenant"
     assert result.name == "Test Agent"
     assert result.business_description == "For testing purposes"
     assert len(result.tools) == 5
@@ -3083,11 +3098,11 @@ async def test_export_agent_by_agent_id_success(mock_search_agent_info, mock_cre
 
     # Verify function calls
     mock_search_agent_info.assert_called_once_with(
-        agent_id=123, tenant_id="test_tenant")
+        agent_id=123, tenant_id="test_tenant", version_no=0)
     mock_create_tool_config.assert_called_once_with(
-        agent_id=123, tenant_id="test_tenant", user_id="test_user")
+        agent_id=123, tenant_id="test_tenant", user_id="test_user", version_no=0)
     mock_query_sub_agents_id.assert_called_once_with(
-        main_agent_id=123, tenant_id="test_tenant")
+        main_agent_id=123, tenant_id="test_tenant", version_no=0)
 
 
 @patch('backend.services.agent_service.create_or_update_tool_by_tool_info')
@@ -5157,6 +5172,7 @@ async def test_export_agent_includes_model_names(
         "constraint_prompt": "Test constraints",
         "few_shots_prompt": "Test examples",
         "enabled": True,
+        "tenant_id": "test_tenant",
         "model_id": 5,
         "business_logic_model_id": 4
     }
@@ -5222,6 +5238,7 @@ async def test_export_agent_with_null_model_id(
         "constraint_prompt": "Test constraints",
         "few_shots_prompt": "Test examples",
         "enabled": True,
+        "tenant_id": "test_tenant",
         "model_id": None,  # NULL in database
         "business_logic_model_id": None  # NULL in database
     }
@@ -5284,6 +5301,7 @@ async def test_export_then_import_preserves_model_names(
         "constraint_prompt": "Follow safety rules",
         "few_shots_prompt": "Example tasks",
         "enabled": True,
+        "tenant_id": "source_tenant",
         "model_id": 10,  # Model ID in source tenant
         "business_logic_model_id": 9  # Business logic model ID in source tenant
     }
@@ -5399,6 +5417,7 @@ async def test_export_agent_model_not_found(
         "constraint_prompt": "Test",
         "few_shots_prompt": "Test",
         "enabled": True,
+        "tenant_id": "test_tenant",
         "model_id": 999,  # This model doesn't exist
         "business_logic_model_id": 998  # This model doesn't exist
     }
@@ -8732,6 +8751,176 @@ def convert_side_effect(x):
     assert result[0]["permission"] == PERMISSION_READ
 
 
+def _mock_get_agent_info_impl_dependencies(
+    mock_search_agent_info,
+    mock_search_tools,
+    mock_query_sub_agents_id,
+    mock_get_model_by_model_id,
+    mock_check_availability,
+    mock_query_external_sub_agents,
+    mock_skill_service,
+    agent_info,
+):
+    """Configure common mocks for get_agent_info_impl permission tests."""
+    defaults = {"model_id": None}
+    mock_search_agent_info.return_value = {**defaults, **agent_info}
+    mock_search_tools.return_value = []
+    mock_query_sub_agents_id.return_value = []
+    mock_query_external_sub_agents.return_value = []
+    mock_get_model_by_model_id.return_value = None
+    mock_check_availability.return_value = (True, [])
+    mock_skill_service_instance = MagicMock()
+    mock_skill_service_instance.list_skill_instances.return_value = []
+    mock_skill_service.return_value = mock_skill_service_instance
+
+
+@patch("backend.services.agent_service.SkillService")
+@patch("backend.services.agent_service.query_external_sub_agents")
+@patch("backend.services.agent_service.check_agent_availability")
+@patch("backend.services.agent_service.get_model_by_model_id")
+@patch("backend.services.agent_service.query_sub_agents_id_list")
+@patch("backend.services.agent_service.search_tools_for_sub_agent")
+@patch("backend.services.agent_service.search_agent_info_by_agent_id")
+@patch("backend.services.agent_service.get_user_tenant_by_user_id")
+@pytest.mark.asyncio
+async def test_get_agent_info_impl_asset_owner_agent_read_only_for_admin(
+    mock_get_user_tenant,
+    mock_search_agent_info,
+    mock_search_tools,
+    mock_query_sub_agents_id,
+    mock_get_model_by_model_id,
+    mock_check_availability,
+    mock_query_external_sub_agents,
+    mock_skill_service,
+):
+    """ASSET_OWNER-scoped agent detail is READ_ONLY for ADMIN viewers."""
+    from consts.const import ASSET_OWNER_TENANT_ID, PERMISSION_EDIT, PERMISSION_READ
+
+    agent_info = {
+        "agent_id": 99,
+        "tenant_id": ASSET_OWNER_TENANT_ID,
+        "created_by": "admin_user",
+        "ingroup_permission": PERMISSION_EDIT,
+    }
+    _mock_get_agent_info_impl_dependencies(
+        mock_search_agent_info,
+        mock_search_tools,
+        mock_query_sub_agents_id,
+        mock_get_model_by_model_id,
+        mock_check_availability,
+        mock_query_external_sub_agents,
+        mock_skill_service,
+        agent_info,
+    )
+    mock_get_user_tenant.return_value = {"user_role": "ADMIN"}
+
+    result = await get_agent_info_impl(
+        agent_id=99,
+        tenant_id="regular_tenant",
+        user_id="admin_user",
+    )
+
+    assert result["permission"] == PERMISSION_READ
+
+
+@patch("backend.services.agent_service.SkillService")
+@patch("backend.services.agent_service.query_external_sub_agents")
+@patch("backend.services.agent_service.check_agent_availability")
+@patch("backend.services.agent_service.get_model_by_model_id")
+@patch("backend.services.agent_service.query_sub_agents_id_list")
+@patch("backend.services.agent_service.search_tools_for_sub_agent")
+@patch("backend.services.agent_service.search_agent_info_by_agent_id")
+@patch("backend.services.agent_service.get_user_tenant_by_user_id")
+@pytest.mark.asyncio
+async def test_get_agent_info_impl_asset_owner_agent_read_only_for_dev(
+    mock_get_user_tenant,
+    mock_search_agent_info,
+    mock_search_tools,
+    mock_query_sub_agents_id,
+    mock_get_model_by_model_id,
+    mock_check_availability,
+    mock_query_external_sub_agents,
+    mock_skill_service,
+):
+    """ASSET_OWNER-scoped agent detail is READ_ONLY for DEV even with ingroup EDIT."""
+    from consts.const import ASSET_OWNER_TENANT_ID, PERMISSION_EDIT, PERMISSION_READ
+
+    agent_info = {
+        "agent_id": 99,
+        "tenant_id": ASSET_OWNER_TENANT_ID,
+        "created_by": "asset_owner_user",
+        "ingroup_permission": PERMISSION_EDIT,
+    }
+    _mock_get_agent_info_impl_dependencies(
+        mock_search_agent_info,
+        mock_search_tools,
+        mock_query_sub_agents_id,
+        mock_get_model_by_model_id,
+        mock_check_availability,
+        mock_query_external_sub_agents,
+        mock_skill_service,
+        agent_info,
+    )
+    mock_get_user_tenant.return_value = {"user_role": "DEV"}
+
+    result = await get_agent_info_impl(
+        agent_id=99,
+        tenant_id="regular_tenant",
+        user_id="dev_user",
+    )
+
+    assert result["permission"] == PERMISSION_READ
+
+
+@patch("backend.services.agent_service.SkillService")
+@patch("backend.services.agent_service.query_external_sub_agents")
+@patch("backend.services.agent_service.check_agent_availability")
+@patch("backend.services.agent_service.get_model_by_model_id")
+@patch("backend.services.agent_service.query_sub_agents_id_list")
+@patch("backend.services.agent_service.search_tools_for_sub_agent")
+@patch("backend.services.agent_service.search_agent_info_by_agent_id")
+@patch("backend.services.agent_service.get_user_tenant_by_user_id")
+@pytest.mark.asyncio
+async def test_get_agent_info_impl_asset_owner_role_gets_edit(
+    mock_get_user_tenant,
+    mock_search_agent_info,
+    mock_search_tools,
+    mock_query_sub_agents_id,
+    mock_get_model_by_model_id,
+    mock_check_availability,
+    mock_query_external_sub_agents,
+    mock_skill_service,
+):
+    """ASSET_OWNER role creator retains EDIT on ASSET_OWNER-scoped agent detail."""
+    from consts.const import ASSET_OWNER_ROLE, ASSET_OWNER_TENANT_ID, PERMISSION_EDIT, PERMISSION_READ
+
+    agent_info = {
+        "agent_id": 99,
+        "tenant_id": ASSET_OWNER_TENANT_ID,
+        "created_by": "asset_owner_user",
+        "ingroup_permission": PERMISSION_READ,
+    }
+    _mock_get_agent_info_impl_dependencies(
+        mock_search_agent_info,
+        mock_search_tools,
+        mock_query_sub_agents_id,
+        mock_get_model_by_model_id,
+        mock_check_availability,
+        mock_query_external_sub_agents,
+        mock_skill_service,
+        agent_info,
+    )
+    mock_get_user_tenant.return_value = {"user_role": ASSET_OWNER_ROLE}
+
+    result = await get_agent_info_impl(
+        agent_id=99,
+        tenant_id=ASSET_OWNER_TENANT_ID,
+        user_id="asset_owner_user",
+    )
+
+    assert result["permission"] == PERMISSION_EDIT
+
+
 @pytest.mark.asyncio
 @patch("backend.services.agent_service.get_model_by_model_id")
 @patch("backend.services.agent_service.check_agent_availability")
@@ -9054,6 +9243,8 @@ async def test_update_agent_info_impl_skill_update_exception(
     mock_request.ingroup_permission = None
     mock_request.prompt_template_id = None
     mock_request.prompt_template_name = None
+    mock_request.example_questions = None
+    mock_request.greeting_message = None
 
     mock_query_skills.return_value = []
     mock_create_skill.side_effect = Exception("Skill update failed")
@@ -9114,79 +9305,73 @@ def test_generate_stream_with_memory_decorated():
 # =============================================================================
 
 @pytest.mark.asyncio
-@patch('backend.services.agent_service.search_agent_info_by_agent_id')
-@patch('backend.services.agent_service.export_agent_impl')
+@patch('backend.services.agent_service.collect_skill_zip_entries')
+@patch('backend.services.agent_service.export_agent_dict_impl')
 @patch('backend.services.agent_service.get_current_user_info')
-async def test_export_agent_with_skills_impl_no_skills(mock_get_user_info, mock_export_impl, mock_search_info):
-    """Test export_agent_with_skills_impl returns JSON when agent has no skill instances."""
+async def test_export_agent_with_skills_impl_no_skills(
+    mock_get_user_info, mock_export_dict_impl, mock_collect_skills
+):
+    """Test export_agent_with_skills_impl returns dict when agent has no skill instances."""
     from backend.services.agent_service import export_agent_with_skills_impl
-    from backend.services import agent_service as ag_svc
 
     mock_get_user_info.return_value = ("user_123", "tenant_abc", "en")
-    mock_export_impl.return_value = '{"agent_id": 1, "agent_info": {}}'
-    mock_search_info.return_value = {"name": "test_agent"}
+    mock_export_dict_impl.return_value = {"agent_id": 1, "agent_info": {}}
+    mock_collect_skills.return_value = []
 
-    # Mock skill_db.query_skill_instances_by_agent_id to return empty list
-    with patch.object(ag_svc.skill_db, 'query_skill_instances_by_agent_id', return_value=[]):
-        result = await export_agent_with_skills_impl(agent_id=1, authorization="Bearer token")
+    result = await export_agent_with_skills_impl(agent_id=1, authorization="Bearer token")
 
-    assert result == '{"agent_id": 1, "agent_info": {}}'
-    mock_export_impl.assert_called_once_with(1, "Bearer token")
+    assert result == {"agent_id": 1, "agent_info": {}}
+    mock_export_dict_impl.assert_called_once_with(
+        1, "Bearer token", version_no=0
+    )
 
 
 @pytest.mark.asyncio
-@patch('backend.services.agent_service.search_agent_info_by_agent_id')
-@patch('backend.services.agent_service.export_agent_impl')
+@patch('backend.services.agent_service.collect_skill_zip_entries')
+@patch('backend.services.agent_service.export_agent_dict_impl')
 @patch('backend.services.agent_service.get_current_user_info')
-async def test_export_agent_with_skills_impl_skills_but_no_names(mock_get_user_info, mock_export_impl, mock_search_info):
-    """Test export_agent_with_skills_impl returns JSON when skill instances have no names."""
+async def test_export_agent_with_skills_impl_skills_but_no_names(
+    mock_get_user_info, mock_export_dict_impl, mock_collect_skills
+):
+    """Test export_agent_with_skills_impl returns dict when skill export yields nothing."""
     from backend.services.agent_service import export_agent_with_skills_impl
-    from backend.services import agent_service as ag_svc
 
     mock_get_user_info.return_value = ("user_123", "tenant_abc", "en")
-    mock_export_impl.return_value = '{"agent_id": 1, "agent_info": {}}'
-    mock_search_info.return_value = {"name": "test_agent"}
+    mock_export_dict_impl.return_value = {"agent_id": 1, "agent_info": {}}
+    mock_collect_skills.return_value = []
 
-    # Mock skill_db to return skill instances without names
-    with patch.object(ag_svc.skill_db, 'query_skill_instances_by_agent_id', return_value=[{"skill_id": 1}]):
-        with patch.object(ag_svc.skill_db, 'get_skill_by_id', return_value=None):
-            result = await export_agent_with_skills_impl(agent_id=1, authorization="Bearer token")
+    result = await export_agent_with_skills_impl(agent_id=1, authorization="Bearer token")
 
-    assert result == '{"agent_id": 1, "agent_info": {}}'
-    mock_export_impl.assert_called_once()
+    assert result == {"agent_id": 1, "agent_info": {}}
+    mock_export_dict_impl.assert_called_once()
 
 
 @pytest.mark.asyncio
 @patch('backend.services.agent_service.search_agent_info_by_agent_id')
+@patch('backend.services.agent_service.collect_skill_zip_entries')
 @patch('backend.services.agent_service.get_current_user_info')
-async def test_export_agent_with_skills_impl_with_zip(mock_get_user_info, mock_search_info):
+async def test_export_agent_with_skills_impl_with_zip(
+    mock_get_user_info, mock_collect_skills, mock_search_info
+):
     """Test export_agent_with_skills_impl returns ZIP when agent has skills."""
     from backend.services.agent_service import export_agent_with_skills_impl
     from backend.services import agent_service as ag_svc
+    from consts.model import SkillZipEntry
     import io
     import zipfile
 
     mock_get_user_info.return_value = ("user_123", "tenant_abc", "en")
     mock_search_info.return_value = {"name": "my_agent"}
-
-    skill_instance = {"skill_id": 100}
-    skill_info = {"name": "TestSkill", "skill_id": 100}
-
-    mock_skill_service = MagicMock()
-    mock_skill_service.export_skills_by_names.return_value = [
-        {"skill_name": "TestSkill", "skill_zip_base64": "SGVsbG8gV29ybGQ="}  # "Hello World" in base64
+    mock_collect_skills.return_value = [
+        SkillZipEntry(skill_name="TestSkill", skill_zip_base64="SGVsbG8gV29ybGQ=")
     ]
 
-    with patch.object(ag_svc.skill_db, 'query_skill_instances_by_agent_id', return_value=[skill_instance]):
-        with patch.object(ag_svc.skill_db, 'get_skill_by_id', return_value=skill_info):
-            with patch.object(ag_svc, 'export_agent_impl', return_value='{"agent_id": 1}'):
-                with patch('services.skill_service.SkillService', return_value=mock_skill_service):
-                    result = await export_agent_with_skills_impl(agent_id=1, authorization="Bearer token")
+    with patch.object(ag_svc, 'export_agent_impl', return_value='{"agent_id": 1}'):
+        result = await export_agent_with_skills_impl(agent_id=1, authorization="Bearer token")
 
     assert result["_zip"] is True
     assert "data" in result
     assert result["filename"] == "my_agent.zip"
-    # Verify it's a valid ZIP
     zip_data = io.BytesIO(result["data"])
     with zipfile.ZipFile(zip_data, 'r') as zf:
         assert "agent.json" in zf.namelist()
@@ -9322,6 +9507,8 @@ async def test_update_agent_info_impl_related_agent_query_error(
     mock_request.ingroup_permission = None
     mock_request.prompt_template_id = None
     mock_request.prompt_template_name = None
+    mock_request.example_questions = None
+    mock_request.greeting_message = None
 
     # Make query_sub_agents_id_list raise exception during circular check
     mock_query_sub.side_effect = Exception("Query error")
@@ -9371,6 +9558,8 @@ async def test_update_agent_info_impl_related_external_agents(
     mock_request.ingroup_permission = None
     mock_request.prompt_template_id = None
     mock_request.prompt_template_name = None
+    mock_request.example_questions = None
+    mock_request.greeting_message = None
 
     # Mock current relations (empty)
     with patch.object(ag_svc.a2a_agent_db, 'list_external_relations_by_local_agent', return_value=[]):
@@ -9421,6 +9610,8 @@ async def test_update_agent_info_impl_external_agent_remove_relation(
     mock_request.ingroup_permission = None
     mock_request.prompt_template_id = None
     mock_request.prompt_template_name = None
+    mock_request.example_questions = None
+    mock_request.greeting_message = None
 
     # Mock current relations has the ID
     with patch.object(ag_svc.a2a_agent_db, 'list_external_relations_by_local_agent',
@@ -9472,6 +9663,8 @@ async def test_update_agent_info_impl_external_agent_relation_exists(
     mock_request.ingroup_permission = None
     mock_request.prompt_template_id = None
     mock_request.prompt_template_name = None
+    mock_request.example_questions = None
+    mock_request.greeting_message = None
 
     # Mock current relations includes the same ID - add should raise ValueError (already exists)
     with patch.object(ag_svc.a2a_agent_db, 'list_external_relations_by_local_agent',
@@ -9584,6 +9777,8 @@ async def test_update_agent_info_impl_skill_unselected(
     mock_request.ingroup_permission = None
     mock_request.prompt_template_id = None
     mock_request.prompt_template_name = None
+    mock_request.example_questions = None
+    mock_request.greeting_message = None
 
     result = await update_agent_info_impl(mock_request, authorization="Bearer token")
 
@@ -9932,8 +10127,126 @@ async def test_update_agent_info_impl_external_agent_list_error(mock_get_user):
     mock_request.ingroup_permission = None
     mock_request.prompt_template_id = None
     mock_request.prompt_template_name = None
+    mock_request.example_questions = None
+    mock_request.greeting_message = None
 
     with patch.object(ag_svc.a2a_agent_db, 'list_external_relations_by_local_agent',
                      side_effect=Exception("DB error")):
         with pytest.raises(ValueError, match="Failed to update related external agents"):
             await update_agent_info_impl(mock_request, authorization="Bearer token")
+
+
+@patch('backend.services.agent_service.get_current_user_info')
+@pytest.mark.asyncio
+async def test_update_agent_info_impl_example_questions_exceed_limit(mock_get_current_user_info):
+    """Test update_agent_info_impl raises AppException when example_questions exceeds 6 items."""
+    from consts.error_code import ErrorCode
+    from consts.exceptions import AppException
+
+    mock_get_current_user_info.return_value = ("test_user", "test_tenant", "en")
+
+    request = MagicMock()
+    request.agent_id = 123
+    request.model_id = None
+    request.example_questions = ["q1", "q2", "q3", "q4", "q5", "q6", "q7"]
+    request.enabled_tool_ids = None
+    request.related_agent_ids = None
+    apply_default_prompt_template_request_fields(request)
+
+    with pytest.raises(AppException) as exc_info:
+        await update_agent_info_impl(request, authorization="Bearer token")
+
+    assert exc_info.value.error_code == ErrorCode.COMMON_PARAMETER_INVALID
+
+
+# =============================================================================
+# Tests for version_no export and repository export helpers
+# =============================================================================
+
+@pytest.mark.asyncio
+@patch('backend.services.agent_service.resolve_sub_agent_version_no')
+@patch('backend.services.agent_service.query_sub_agent_relations')
+@patch('backend.services.agent_service.export_agent_by_agent_id')
+async def test_export_agent_dict_impl_uses_pinned_sub_agent_versions(
+    mock_export_agent_by_id,
+    mock_query_relations,
+    mock_resolve_version,
+):
+    """BFS export should enqueue sub-agents with their pinned version numbers."""
+    from backend.services.agent_service import export_agent_dict_impl
+    from consts.model import ExportAndImportAgentInfo
+
+    root_agent = ExportAndImportAgentInfo(
+        agent_id=1,
+        name="root",
+        display_name="Root",
+        description="desc",
+        business_description="biz",
+        max_steps=5,
+        provide_run_summary=False,
+        enabled=True,
+        tools=[],
+        managed_agents=[2],
+    )
+    child_agent = ExportAndImportAgentInfo(
+        agent_id=2,
+        name="child",
+        display_name="Child",
+        description="desc",
+        business_description="biz",
+        max_steps=5,
+        provide_run_summary=False,
+        enabled=True,
+        tools=[],
+        managed_agents=[],
+    )
+
+    async def _export_side_effect(agent_id, tenant_id, user_id, version_no=0):
+        if agent_id == 1:
+            return root_agent
+        return child_agent
+
+    mock_export_agent_by_id.side_effect = _export_side_effect
+    mock_query_relations.side_effect = [
+        [{"selected_agent_id": 2, "selected_agent_version_no": 3}],
+        [],
+    ]
+    mock_resolve_version.return_value = 3
+
+    with patch('backend.services.agent_service.get_current_user_info', return_value=("u", "t", "en")):
+        result = await export_agent_dict_impl(agent_id=1, authorization="Bearer token", version_no=2)
+
+    assert result["agent_id"] == 1
+    assert "1" in result["agent_info"]
+    assert "2" in result["agent_info"]
+    mock_export_agent_by_id.assert_any_call(
+        agent_id=1, tenant_id="t", user_id="u", version_no=2
+    )
+    mock_export_agent_by_id.assert_any_call(
+        agent_id=2, tenant_id="t", user_id="u", version_no=3
+    )
+
+
+@pytest.mark.asyncio
+@patch('backend.services.agent_service._export_agent_dict_core')
+async def test_export_agent_dict_for_repository_impl(mock_export_core):
+    """Repository export helper should delegate to core export without auth header."""
+    from backend.services.agent_service import export_agent_dict_for_repository_impl
+
+    mock_export_core.return_value = {
+        "agent_id": 10,
+        "agent_info": {},
+        "mcp_info": [],
+    }
+
+    result = await export_agent_dict_for_repository_impl(
+        agent_id=10, tenant_id="tenant_a", user_id="user_a", version_no=1
+    )
+
+    assert result["agent_id"] == 10
+    mock_export_core.assert_called_once_with(
+        root_agent_id=10,
+        tenant_id="tenant_a",
+        user_id="user_a",
+        version_no=1,
+    )
diff --git a/test/backend/services/test_agent_version_service.py b/test/backend/services/test_agent_version_service.py
index 5c3f231b5..10cf67ca1 100644
--- a/test/backend/services/test_agent_version_service.py
+++ b/test/backend/services/test_agent_version_service.py
@@ -1,5 +1,6 @@
 import asyncio
 import sys
+import types
 import pytest
 from unittest.mock import patch, MagicMock
 from contextlib import contextmanager
@@ -18,10 +19,26 @@
 consts_mock.const.POSTGRES_DB = "test_db"
 consts_mock.const.POSTGRES_PORT = 5432
 consts_mock.const.DEFAULT_TENANT_ID = "default_tenant"
+consts_mock.const.AGENT_PROMPTS_HIDDEN_FLAG = "prompts_hidden"
+consts_mock.const.ASSET_OWNER_ROLE = "ASSET_OWNER"
+consts_mock.const.ASSET_OWNER_TENANT_ID = "asset_owner_tenant_id"
+consts_mock.const.ENABLE_ASSET_OWNER_ROLE = False
+consts_mock.const.PERMISSION_EDIT = "EDIT"
+consts_mock.const.PERMISSION_READ = "READ_ONLY"
 
 sys.modules['consts'] = consts_mock
 sys.modules['consts.const'] = consts_mock.const
 
+consts_exceptions_mod = types.ModuleType("consts.exceptions")
+
+
+class ValidationError(Exception):
+    pass
+
+
+consts_exceptions_mod.ValidationError = ValidationError
+sys.modules['consts.exceptions'] = consts_exceptions_mod
+
 # Mock consts.agent_unavailable_reasons
 agent_unavailable_reasons_mock = MagicMock()
 agent_unavailable_reasons_mock.AgentUnavailableReason = type('AgentUnavailableReason', (), {
@@ -206,8 +223,13 @@ def mock_tools_draft():
 
 
 @pytest.fixture
-def mock_relations_draft():
+def mock_relations_draft(monkeypatch):
     """Mock relations draft data"""
+    monkeypatch.setattr(
+        agent_version_service_module,
+        "query_current_version_no",
+        MagicMock(return_value=1),
+    )
     return [
         {
             "id": 1,
@@ -279,9 +301,34 @@ def test_publish_version_impl_success(monkeypatch, mock_agent_draft, mock_tools_
     mock_insert_agent.assert_called_once()
     assert mock_insert_tool.call_count == 2
     assert mock_insert_relation.call_count == 1
+    relation_snapshot = mock_insert_relation.call_args[0][0]
+    assert relation_snapshot["selected_agent_version_no"] == 1
     assert mock_insert_skill.call_count == 1
 
 
+def test_publish_version_impl_unpublished_sub_agent(
+    monkeypatch, mock_agent_draft, mock_tools_draft, mock_relations_draft, mock_skills_draft
+):
+    """Test publishing fails when a sub-agent has no published version"""
+    mock_query_draft = MagicMock(
+        return_value=(mock_agent_draft, mock_tools_draft, mock_relations_draft)
+    )
+    monkeypatch.setattr(agent_version_service_module, "query_agent_draft", mock_query_draft)
+    monkeypatch.setattr(
+        agent_version_service_module,
+        "query_current_version_no",
+        MagicMock(return_value=None),
+    )
+    monkeypatch.setattr(agent_version_service_module, "get_next_version_no", MagicMock(return_value=1))
+
+    with pytest.raises(ValueError, match="Sub-agent 2 has no published version"):
+        publish_version_impl(
+            agent_id=1,
+            tenant_id="tenant1",
+            user_id="user1",
+        )
+
+
 def test_publish_version_impl_no_draft(monkeypatch):
     """Test publishing when draft doesn't exist"""
     mock_query_draft = MagicMock(return_value=(None, [], []))
@@ -1284,6 +1331,7 @@ def test_get_version_detail_or_draft_draft_version(monkeypatch):
     assert result["version"]["version_status"] == "DRAFT"
     assert len(result["tools"]) == 1
     assert result["sub_agent_id_list"] == [2]
+    assert result["sub_agent_relations"] == [{"agent_id": 2, "version_no": None}]
     assert len(result["skills"]) == 1
 
 
@@ -1487,7 +1535,7 @@ def test_list_published_agents_impl_success(monkeypatch):
         return_value=(True, [])
     )
     agent_service_mock._apply_duplicate_name_availability_rules = MagicMock()
-    model_management_db_mock.get_model_by_model_id = MagicMock(
+    agent_service_mock.get_model_by_model_id = MagicMock(
         return_value={"display_name": "Test Model", "model_name": "test_model"}
     )
 
@@ -1640,15 +1688,15 @@ def test_list_published_agents_impl_user_with_groups(monkeypatch):
         return_value=(True, [])
     )
     agent_service_mock._apply_duplicate_name_availability_rules = MagicMock()
-    model_management_db_mock.get_model_by_model_id = MagicMock(
+    agent_service_mock.get_model_by_model_id = MagicMock(
         return_value={"display_name": "Test Model", "model_name": "test_model"}
     )
 
     result = asyncio.run(list_published_agents_impl(tenant_id="tenant1", user_id="user1"))
 
     assert len(result) == 1
-    # User should have READ permission (not EDIT)
-    assert result[0]["permission"] == "READ"
+    # User should have READ_ONLY permission (not EDIT)
+    assert result[0]["permission"] == "READ_ONLY"
 
 
 def test_list_published_agents_impl_model_cache(monkeypatch):
@@ -1690,7 +1738,7 @@ def test_list_published_agents_impl_model_cache(monkeypatch):
         return_value=(True, [])
     )
     agent_service_mock._apply_duplicate_name_availability_rules = MagicMock()
-    model_management_db_mock.get_model_by_model_id = MagicMock(
+    agent_service_mock.get_model_by_model_id = MagicMock(
         return_value={"display_name": "Test Model", "model_name": "test_model"}
     )
 
@@ -1771,7 +1819,7 @@ def test_list_published_agents_impl_is_available_false(monkeypatch):
         return_value=(False, ["model_not_configured"])
     )
     agent_service_mock._apply_duplicate_name_availability_rules = MagicMock()
-    model_management_db_mock.get_model_by_model_id = MagicMock(return_value=None)
+    agent_service_mock.get_model_by_model_id = MagicMock(return_value=None)
 
     result = asyncio.run(list_published_agents_impl(tenant_id="tenant1", user_id="user1"))
 
@@ -1780,8 +1828,7 @@ def test_list_published_agents_impl_is_available_false(monkeypatch):
     assert "model_not_configured" in result[0]["unavailable_reasons"]
 
 
-@pytest.mark.asyncio
-async def test_list_published_agents_impl_exception_handling(monkeypatch):
+def test_list_published_agents_impl_exception_handling(monkeypatch):
     """Test exception handling in list_published_agents_impl"""
     # Mock query_all_agent_info_by_tenant_id to raise an exception
     test_exception = RuntimeError("Database connection failed")
@@ -1796,7 +1843,7 @@ async def test_list_published_agents_impl_exception_handling(monkeypatch):
 
     # Verify that the exception is caught and re-raised as ValueError
     with pytest.raises(ValueError, match="Failed to list published agents: Database connection failed"):
-        await list_published_agents_impl(tenant_id="tenant1", user_id="user1")
+        asyncio.run(list_published_agents_impl(tenant_id="tenant1", user_id="user1"))
 
 
 def test_publish_version_impl_with_a2a_new_agent(monkeypatch, mock_agent_draft, mock_tools_draft, mock_relations_draft, mock_skills_draft):
diff --git a/test/backend/services/test_cas_service.py b/test/backend/services/test_cas_service.py
new file mode 100644
index 000000000..158847e5a
--- /dev/null
+++ b/test/backend/services/test_cas_service.py
@@ -0,0 +1,240 @@
+import os
+import sys
+import unittest
+from datetime import datetime
+from unittest.mock import MagicMock
+
+test_dir = os.path.dirname(__file__)
+backend_dir = os.path.abspath(os.path.join(test_dir, "../../../backend"))
+sys.path.insert(0, backend_dir)
+
+_MODULES_TO_RESTORE = [
+    "consts",
+    "consts.const",
+    "database.cas_session_db",
+    "database.oauth_account_db",
+    "database.user_tenant_db",
+    "services.oauth_service",
+    "services.skill_service",
+    "services.tool_configuration_service",
+    "utils.auth_utils",
+]
+_ORIGINAL_MODULES = {name: sys.modules.get(name) for name in _MODULES_TO_RESTORE}
+
+consts_mock = MagicMock()
+consts_mock.const = MagicMock()
+consts_mock.const.CAS_CA_BUNDLE = ""
+consts_mock.const.CAS_CALLBACK_BASE_URL = "http://localhost:3000"
+consts_mock.const.CAS_EMAIL_ATTRIBUTE = "mail"
+consts_mock.const.CAS_ENABLED = True
+consts_mock.const.CAS_LOGIN_MODE = "button"
+consts_mock.const.CAS_LOGOUT_URL = ""
+consts_mock.const.CAS_RENEW_BEFORE_SECONDS = 300
+consts_mock.const.CAS_RENEW_TIMEOUT_SECONDS = 10
+consts_mock.const.CAS_ROLE_ATTRIBUTE = "memberOf"
+consts_mock.const.CAS_ROLE_MAP_JSON = '{"cn=admins":"ADMIN"}'
+consts_mock.const.CAS_SERVER_URL = "https://cas.example.com/cas"
+consts_mock.const.CAS_SESSION_MAX_AGE_SECONDS = 3600
+consts_mock.const.CAS_SSL_VERIFY = True
+consts_mock.const.CAS_SYNTHETIC_EMAIL_DOMAIN = "cas.local"
+consts_mock.const.CAS_TENANT_ATTRIBUTE = "tenant"
+consts_mock.const.CAS_USER_ATTRIBUTE = "uid"
+consts_mock.const.CAS_VALIDATE_PATH = "/p3/serviceValidate"
+consts_mock.const.DEFAULT_TENANT_ID = "tenant_id"
+consts_mock.const.LOCAL_SESSION_MAX_AGE_SECONDS = 3600
+sys.modules["consts"] = consts_mock
+sys.modules["consts.const"] = consts_mock.const
+
+sys.modules["database.cas_session_db"] = MagicMock()
+sys.modules["database.oauth_account_db"] = MagicMock()
+sys.modules["database.user_tenant_db"] = MagicMock()
+sys.modules["services.oauth_service"] = MagicMock()
+sys.modules["services.skill_service"] = MagicMock()
+sys.modules["services.tool_configuration_service"] = MagicMock()
+sys.modules["utils.auth_utils"] = MagicMock()
+
+from services.cas_service import (  # noqa: E402
+    CasAuthenticationError,
+    build_login_url,
+    build_logout_url,
+    parse_logout_request,
+    parse_service_validate_response,
+    revoke_from_logout_request,
+)
+
+for _name, _module in _ORIGINAL_MODULES.items():
+    if _module is None:
+        sys.modules.pop(_name, None)
+    else:
+        sys.modules[_name] = _module
+sys.modules.pop("services.cas_service", None)
+
+
+class TestCasServiceParsing(unittest.TestCase):
+    def test_parse_success_response_with_attributes(self):
+        xml = """
+        <cas:serviceResponse xmlns:cas="http://www.yale.edu/tp/cas">
+          <cas:authenticationSuccess>
+            <cas:user>fallback-user</cas:user>
+            <cas:attributes>
+              <cas:uid>cas-user-1</cas:uid>
+              <cas:mail>User@Example.com</cas:mail>
+              <cas:memberOf>cn=admins</cas:memberOf>
+              <cas:tenant>tenant-a</cas:tenant>
+              <cas:SessionIndex>ST-123</cas:SessionIndex>
+              <cas:expiresAt>2026-05-26T10:00:00Z</cas:expiresAt>
+            </cas:attributes>
+          </cas:authenticationSuccess>
+        </cas:serviceResponse>
+        """
+
+        principal = parse_service_validate_response(xml, fallback_session_index="ST-fallback")
+
+        self.assertEqual(principal.cas_user_id, "cas-user-1")
+        self.assertEqual(principal.email, "user@example.com")
+        self.assertEqual(principal.role, "ADMIN")
+        self.assertEqual(principal.tenant_id, "tenant-a")
+        self.assertEqual(principal.session_index, "ST-123")
+        self.assertIsInstance(principal.expires_at, datetime)
+
+    def test_parse_failure_response_raises(self):
+        xml = """
+        <cas:serviceResponse xmlns:cas="http://www.yale.edu/tp/cas">
+          <cas:authenticationFailure code="INVALID_TICKET">bad ticket</cas:authenticationFailure>
+        </cas:serviceResponse>
+        """
+
+        with self.assertRaises(CasAuthenticationError):
+            parse_service_validate_response(xml)
+
+    def test_parse_service_validate_response_rejects_xml_entities(self):
+        xml = """<?xml version="1.0"?>
+        <!DOCTYPE foo [<!ENTITY xxe "expanded-user">]>
+        <cas:serviceResponse xmlns:cas="http://www.yale.edu/tp/cas">
+          <cas:authenticationSuccess>
+            <cas:user>&xxe;</cas:user>
+          </cas:authenticationSuccess>
+        </cas:serviceResponse>
+        """
+
+        with self.assertRaises(CasAuthenticationError):
+            parse_service_validate_response(xml)
+
+    def test_parse_logout_request_supports_user_and_session_index(self):
+        xml = """
+        <samlp:LogoutRequest xmlns:samlp="urn:oasis:names:tc:SAML:2.0:protocol"
+          xmlns:saml="urn:oasis:names:tc:SAML:2.0:assertion">
+          <saml:NameID>cas-user-1</saml:NameID>
+          <samlp:SessionIndex>ST-123</samlp:SessionIndex>
+        </samlp:LogoutRequest>
+        """
+
+        result = parse_logout_request(xml)
+
+        self.assertEqual(result["cas_user_id"], "cas-user-1")
+        self.assertEqual(result["session_index"], "ST-123")
+
+    def test_parse_logout_request_rejects_xml_entities(self):
+        xml = """<?xml version="1.0"?>
+        <!DOCTYPE foo [<!ENTITY xxe "cas-user-1">]>
+        <samlp:LogoutRequest xmlns:samlp="urn:oasis:names:tc:SAML:2.0:protocol"
+          xmlns:saml="urn:oasis:names:tc:SAML:2.0:assertion">
+          <saml:NameID>&xxe;</saml:NameID>
+          <samlp:SessionIndex>ST-123</samlp:SessionIndex>
+        </samlp:LogoutRequest>
+        """
+
+        result = parse_logout_request(xml)
+
+        self.assertEqual(result, {"cas_user_id": "", "session_index": ""})
+
+    def test_revoke_logout_request_falls_back_to_session_index_when_name_id_misses(self):
+        xml = """
+        <samlp:LogoutRequest xmlns:samlp="urn:oasis:names:tc:SAML:2.0:protocol"
+          xmlns:saml="urn:oasis:names:tc:SAML:2.0:assertion">
+          <saml:NameID>different-cas-user</saml:NameID>
+          <samlp:SessionIndex>ST-123</samlp:SessionIndex>
+        </samlp:LogoutRequest>
+        """
+        original_revoke_by_user = revoke_from_logout_request.__globals__["revoke_cas_sessions_by_user_id"]
+        original_revoke_by_index = revoke_from_logout_request.__globals__["revoke_cas_session_by_index"]
+        revoke_by_user = MagicMock(return_value=0)
+        revoke_by_index = MagicMock(return_value=1)
+        revoke_from_logout_request.__globals__["revoke_cas_sessions_by_user_id"] = revoke_by_user
+        revoke_from_logout_request.__globals__["revoke_cas_session_by_index"] = revoke_by_index
+        try:
+            result = revoke_from_logout_request(xml)
+        finally:
+            revoke_from_logout_request.__globals__["revoke_cas_sessions_by_user_id"] = original_revoke_by_user
+            revoke_from_logout_request.__globals__["revoke_cas_session_by_index"] = original_revoke_by_index
+
+        self.assertEqual(result["revoked"], 1)
+        self.assertEqual(result["cas_user_id"], "different-cas-user")
+        self.assertEqual(result["session_index"], "ST-123")
+        revoke_by_user.assert_called_once_with("different-cas-user")
+        revoke_by_index.assert_called_once_with("ST-123")
+
+    def test_build_login_url_includes_service_redirect(self):
+        url = build_login_url("/space")
+
+        self.assertIn("https://cas.example.com/cas/login?", url)
+        self.assertIn("service=http://localhost:3000/api/user/cas/callback?redirect=/space", url)
+
+    def test_build_logout_url_returns_empty_when_logout_url_is_not_configured(self):
+        url = build_logout_url()
+
+        self.assertEqual(url, "")
+
+    def test_build_logout_url_adds_nexent_service_to_configured_bare_logout_url(self):
+        original = build_logout_url.__globals__["CAS_LOGOUT_URL"]
+        build_logout_url.__globals__["CAS_LOGOUT_URL"] = "https://sso.example.com/cas/logout"
+        try:
+            url = build_logout_url()
+        finally:
+            build_logout_url.__globals__["CAS_LOGOUT_URL"] = original
+
+        self.assertEqual(
+            url,
+            "https://sso.example.com/cas/logout?service=http://localhost:3000",
+        )
+
+    def test_build_logout_url_resolves_absolute_path_against_cas_server_url(self):
+        original = build_logout_url.__globals__["CAS_LOGOUT_URL"]
+        build_logout_url.__globals__["CAS_LOGOUT_URL"] = "/logout"
+        try:
+            url = build_logout_url()
+        finally:
+            build_logout_url.__globals__["CAS_LOGOUT_URL"] = original
+
+        self.assertEqual(
+            url,
+            "https://cas.example.com/cas/logout?service=http://localhost:3000",
+        )
+
+    def test_build_logout_url_resolves_relative_path_against_cas_server_url(self):
+        original = build_logout_url.__globals__["CAS_LOGOUT_URL"]
+        build_logout_url.__globals__["CAS_LOGOUT_URL"] = "logout"
+        try:
+            url = build_logout_url()
+        finally:
+            build_logout_url.__globals__["CAS_LOGOUT_URL"] = original
+
+        self.assertEqual(
+            url,
+            "https://cas.example.com/cas/logout?service=http://localhost:3000",
+        )
+
+    def test_build_logout_url_preserves_configured_logout_url_with_query(self):
+        original = build_logout_url.__globals__["CAS_LOGOUT_URL"]
+        configured = "https://sso.example.com/cas/logout?redirect=https%3A%2F%2Fidp.example.com%2Flogin"
+        build_logout_url.__globals__["CAS_LOGOUT_URL"] = configured
+        try:
+            url = build_logout_url()
+        finally:
+            build_logout_url.__globals__["CAS_LOGOUT_URL"] = original
+
+        self.assertEqual(url, configured)
+
+
+if __name__ == "__main__":
+    unittest.main()
diff --git a/test/backend/services/test_data_process_service.py b/test/backend/services/test_data_process_service.py
index 27ab679d2..f93d54f4c 100644
--- a/test/backend/services/test_data_process_service.py
+++ b/test/backend/services/test_data_process_service.py
@@ -1595,43 +1595,21 @@ def test_get_data_process_service(self, mock_service_class):
         self.assertEqual(service2, mock_service)
         self.assertEqual(service1, service2)
 
-    @patch('backend.services.data_process_service.chain')
-    @patch('backend.services.data_process_service.forward')
-    @patch('backend.services.data_process_service.process')
+    @patch('backend.services.data_process_service.submit_process_forward_chain')
     @pytest.mark.asyncio
-    async def async_test_create_batch_tasks_impl_success(self, mock_process, mock_forward, mock_chain):
+    async def async_test_create_batch_tasks_impl_success(self, mock_submit_chain):
         """
         Async implementation for testing successful batch task creation.
 
         This test verifies that the service correctly creates batch tasks.
         It ensures that:
         1. Individual tasks are created for each source in the request
-        2. The process_and_forward.delay method is called with correct parameters
+        2. submit_process_forward_chain is called with correct parameters
         3. Task IDs are collected and returned
         4. All valid source configurations are processed
         """
-        # Setup Celery signature mocks
-        process_sig_1 = MagicMock()
-        process_sig_1.set.return_value = process_sig_1
-        process_sig_2 = MagicMock()
-        process_sig_2.set.return_value = process_sig_2
-        forward_sig_1 = MagicMock()
-        forward_sig_1.set.return_value = forward_sig_1
-        forward_sig_2 = MagicMock()
-        forward_sig_2.set.return_value = forward_sig_2
-
-        # process.s returns different sig objects per call
-        mock_process.s.side_effect = [process_sig_1, process_sig_2]
-        mock_forward.s.side_effect = [forward_sig_1, forward_sig_2]
-
-        # chain(...).apply_async() returns result with id
-        chain_inst_1 = MagicMock()
-        chain_inst_1.apply_async.return_value = MagicMock(id="task_id_1")
-        chain_inst_2 = MagicMock()
-        chain_inst_2.apply_async.return_value = MagicMock(id="task_id_2")
-        mock_chain.side_effect = [chain_inst_1, chain_inst_2]
-
-        # Create test request
+        mock_submit_chain.side_effect = ["task_id_1", "task_id_2"]
+
         from consts.model import BatchTaskRequest
         request = BatchTaskRequest(
             sources=[
@@ -1652,27 +1630,23 @@ async def async_test_create_batch_tasks_impl_success(self, mock_process, mock_fo
             ]
         )
 
-        # Create batch tasks
         result = await self.service.create_batch_tasks_impl("Bearer test_token", request)
 
-        # Verify result
         self.assertEqual(len(result), 2)
         self.assertEqual(result[0], "task_id_1")
         self.assertEqual(result[1], "task_id_2")
+        self.assertEqual(mock_submit_chain.call_count, 2)
 
-        # Verify chain was invoked for each source
-        self.assertEqual(mock_chain.call_count, 2)
-
-        # Verify process.s and forward.s were called with correct params
-        expected_process_calls = [
+        expected_calls = [
             {
                 'source': 'http://example.com/doc1.pdf',
                 'source_type': 'url',
                 'chunking_strategy': 'semantic',
                 'index_name': 'test_index_1',
                 'original_filename': 'doc1.pdf',
+                'authorization': 'Bearer test_token',
                 'embedding_model_id': None,
-                'tenant_id': None
+                'tenant_id': None,
             },
             {
                 'source': 'http://example.com/doc2.pdf',
@@ -1680,43 +1654,17 @@ async def async_test_create_batch_tasks_impl_success(self, mock_process, mock_fo
                 'chunking_strategy': 'fixed',
                 'index_name': 'test_index_2',
                 'original_filename': 'doc2.pdf',
+                'authorization': 'Bearer test_token',
                 'embedding_model_id': None,
-                'tenant_id': None
-            }
-        ]
-        actual_process_calls = [kwargs for args,
-                                kwargs in mock_process.s.call_args_list]
-        self.assertEqual(actual_process_calls, expected_process_calls)
-        process_sig_1.set.assert_called_once_with(queue='process_q')
-        process_sig_2.set.assert_called_once_with(queue='process_q')
-
-        expected_forward_calls = [
-            {
-                'index_name': 'test_index_1',
-                'source': 'http://example.com/doc1.pdf',
-                'source_type': 'url',
-                'original_filename': 'doc1.pdf',
-                'authorization': 'Bearer test_token'
+                'tenant_id': None,
             },
-            {
-                'index_name': 'test_index_2',
-                'source': 'http://example.com/doc2.pdf',
-                'source_type': 'url',
-                'original_filename': 'doc2.pdf',
-                'authorization': 'Bearer test_token'
-            }
         ]
-        actual_forward_calls = [kwargs for args,
-                                kwargs in mock_forward.s.call_args_list]
-        self.assertEqual(actual_forward_calls, expected_forward_calls)
-        forward_sig_1.set.assert_called_once_with(queue='forward_q')
-        forward_sig_2.set.assert_called_once_with(queue='forward_q')
-
-    @patch('backend.services.data_process_service.chain')
-    @patch('backend.services.data_process_service.forward')
-    @patch('backend.services.data_process_service.process')
+        actual_calls = [kwargs for args, kwargs in mock_submit_chain.call_args_list]
+        self.assertEqual(actual_calls, expected_calls)
+
+    @patch('backend.services.data_process_service.submit_process_forward_chain')
     @pytest.mark.asyncio
-    async def async_test_create_batch_tasks_impl_missing_source(self, mock_process, mock_forward, mock_chain):
+    async def async_test_create_batch_tasks_impl_missing_source(self, mock_submit_chain):
         """
         Async implementation for testing batch task creation with missing source field.
 
@@ -1727,18 +1675,8 @@ async def async_test_create_batch_tasks_impl_missing_source(self, mock_process,
         3. Only valid source configurations are processed
         4. The method continues processing other sources
         """
-        # Setup signature mocks
-        process_sig = MagicMock()
-        process_sig.set.return_value = process_sig
-        forward_sig = MagicMock()
-        forward_sig.set.return_value = forward_sig
-        mock_process.s.return_value = process_sig
-        mock_forward.s.return_value = forward_sig
-        chain_inst = MagicMock()
-        chain_inst.apply_async.return_value = MagicMock(id="task_id_1")
-        mock_chain.return_value = chain_inst
-
-        # Create test request with missing source
+        mock_submit_chain.return_value = "task_id_1"
+
         from consts.model import BatchTaskRequest
         request = BatchTaskRequest(
             sources=[
@@ -1759,27 +1697,19 @@ async def async_test_create_batch_tasks_impl_missing_source(self, mock_process,
             ]
         )
 
-        # Create batch tasks
         result = await self.service.create_batch_tasks_impl("Bearer test_token", request)
 
-        # Verify result - only one task should be created
         self.assertEqual(len(result), 1)
         self.assertEqual(result[0], "task_id_1")
-
-        # Verify chain called once with built signatures
-        mock_chain.assert_called_once()
-        mock_process.s.assert_called_once()
-        mock_forward.s.assert_called_once()
+        mock_submit_chain.assert_called_once()
         self.assertEqual(
-            mock_process.s.call_args[1]['source'], 'http://example.com/doc2.pdf')
+            mock_submit_chain.call_args[1]['source'], 'http://example.com/doc2.pdf')
         self.assertEqual(
-            mock_process.s.call_args[1]['index_name'], 'test_index_2')
+            mock_submit_chain.call_args[1]['index_name'], 'test_index_2')
 
-    @patch('backend.services.data_process_service.chain')
-    @patch('backend.services.data_process_service.forward')
-    @patch('backend.services.data_process_service.process')
+    @patch('backend.services.data_process_service.submit_process_forward_chain')
     @pytest.mark.asyncio
-    async def async_test_create_batch_tasks_impl_missing_index_name(self, mock_process, mock_forward, mock_chain):
+    async def async_test_create_batch_tasks_impl_missing_index_name(self, mock_submit_chain):
         """
         Async implementation for testing batch task creation with missing index_name field.
 
@@ -1790,18 +1720,8 @@ async def async_test_create_batch_tasks_impl_missing_index_name(self, mock_proce
         3. Only valid source configurations are processed
         4. The method continues processing other sources
         """
-        # Setup signature mocks
-        process_sig = MagicMock()
-        process_sig.set.return_value = process_sig
-        forward_sig = MagicMock()
-        forward_sig.set.return_value = forward_sig
-        mock_process.s.return_value = process_sig
-        mock_forward.s.return_value = forward_sig
-        chain_inst = MagicMock()
-        chain_inst.apply_async.return_value = MagicMock(id="task_id_1")
-        mock_chain.return_value = chain_inst
-
-        # Create test request with missing index_name
+        mock_submit_chain.return_value = "task_id_1"
+
         from consts.model import BatchTaskRequest
         request = BatchTaskRequest(
             sources=[
@@ -1822,27 +1742,19 @@ async def async_test_create_batch_tasks_impl_missing_index_name(self, mock_proce
             ]
         )
 
-        # Create batch tasks
         result = await self.service.create_batch_tasks_impl("Bearer test_token", request)
 
-        # Verify result - only one task should be created
         self.assertEqual(len(result), 1)
         self.assertEqual(result[0], "task_id_1")
-
-        # Verify chain called once with built signatures
-        mock_chain.assert_called_once()
-        mock_process.s.assert_called_once()
-        mock_forward.s.assert_called_once()
+        mock_submit_chain.assert_called_once()
         self.assertEqual(
-            mock_process.s.call_args[1]['source'], 'http://example.com/doc2.pdf')
+            mock_submit_chain.call_args[1]['source'], 'http://example.com/doc2.pdf')
         self.assertEqual(
-            mock_process.s.call_args[1]['index_name'], 'test_index_2')
+            mock_submit_chain.call_args[1]['index_name'], 'test_index_2')
 
-    @patch('backend.services.data_process_service.chain')
-    @patch('backend.services.data_process_service.forward')
-    @patch('backend.services.data_process_service.process')
+    @patch('backend.services.data_process_service.submit_process_forward_chain')
     @pytest.mark.asyncio
-    async def async_test_create_batch_tasks_impl_missing_both_required_fields(self, mock_process, mock_forward, mock_chain):
+    async def async_test_create_batch_tasks_impl_missing_both_required_fields(self, mock_submit_chain):
         """
         Async implementation for testing batch task creation with both required fields missing.
 
@@ -1853,7 +1765,6 @@ async def async_test_create_batch_tasks_impl_missing_both_required_fields(self,
         3. No tasks are created when all sources are invalid
         4. The method returns an empty list
         """
-        # Create test request with all sources missing required fields
         from consts.model import BatchTaskRequest
         request = BatchTaskRequest(
             sources=[
@@ -1872,22 +1783,14 @@ async def async_test_create_batch_tasks_impl_missing_both_required_fields(self,
             ]
         )
 
-        # Create batch tasks
         result = await self.service.create_batch_tasks_impl("Bearer test_token", request)
 
-        # Verify result - no tasks should be created
         self.assertEqual(len(result), 0)
+        mock_submit_chain.assert_not_called()
 
-        # Verify no chain created
-        mock_chain.assert_not_called()
-        mock_process.s.assert_not_called()
-        mock_forward.s.assert_not_called()
-
-    @patch('backend.services.data_process_service.chain')
-    @patch('backend.services.data_process_service.forward')
-    @patch('backend.services.data_process_service.process')
+    @patch('backend.services.data_process_service.submit_process_forward_chain')
     @pytest.mark.asyncio
-    async def async_test_create_batch_tasks_impl_empty_sources(self, mock_process, mock_forward, mock_chain):
+    async def async_test_create_batch_tasks_impl_empty_sources(self, mock_submit_chain):
         """
         Async implementation for testing batch task creation with empty sources list.
 
@@ -1897,26 +1800,17 @@ async def async_test_create_batch_tasks_impl_empty_sources(self, mock_process, m
         2. The method returns an empty list
         3. No errors occur during processing
         """
-        # Create test request with empty sources
         from consts.model import BatchTaskRequest
         request = BatchTaskRequest(sources=[])
 
-        # Create batch tasks
         result = await self.service.create_batch_tasks_impl("Bearer test_token", request)
 
-        # Verify result - no tasks should be created
         self.assertEqual(len(result), 0)
+        mock_submit_chain.assert_not_called()
 
-        # Verify no chain created
-        mock_chain.assert_not_called()
-        mock_process.s.assert_not_called()
-        mock_forward.s.assert_not_called()
-
-    @patch('backend.services.data_process_service.chain')
-    @patch('backend.services.data_process_service.forward')
-    @patch('backend.services.data_process_service.process')
+    @patch('backend.services.data_process_service.submit_process_forward_chain')
     @pytest.mark.asyncio
-    async def async_test_create_batch_tasks_impl_optional_fields(self, mock_process, mock_forward, mock_chain):
+    async def async_test_create_batch_tasks_impl_optional_fields(self, mock_submit_chain):
         """
         Async implementation for testing batch task creation with optional fields.
 
@@ -1926,18 +1820,8 @@ async def async_test_create_batch_tasks_impl_optional_fields(self, mock_process,
         2. Optional fields are passed as None when not provided
         3. The method processes all valid sources regardless of optional field presence
         """
-        # Setup signature mocks
-        process_sig = MagicMock()
-        process_sig.set.return_value = process_sig
-        forward_sig = MagicMock()
-        forward_sig.set.return_value = forward_sig
-        mock_process.s.return_value = process_sig
-        mock_forward.s.return_value = forward_sig
-        chain_inst = MagicMock()
-        chain_inst.apply_async.return_value = MagicMock(id="task_id_1")
-        mock_chain.return_value = chain_inst
-
-        # Create test request with minimal required fields only
+        mock_submit_chain.return_value = "task_id_1"
+
         from consts.model import BatchTaskRequest
         request = BatchTaskRequest(
             sources=[
@@ -1949,31 +1833,22 @@ async def async_test_create_batch_tasks_impl_optional_fields(self, mock_process,
             ]
         )
 
-        # Create batch tasks
         result = await self.service.create_batch_tasks_impl("Bearer test_token", request)
 
-        # Verify result
         self.assertEqual(len(result), 1)
         self.assertEqual(result[0], "task_id_1")
-
-        # Verify signatures built with None optional fields for process, and authorization on forward
-        mock_process.s.assert_called_once()
-        proc_kwargs = mock_process.s.call_args[1]
-        self.assertEqual(proc_kwargs['source'], 'http://example.com/doc1.pdf')
-        self.assertEqual(proc_kwargs['index_name'], 'test_index_1')
-        self.assertIsNone(proc_kwargs['source_type'])
-        self.assertIsNone(proc_kwargs['chunking_strategy'])
-        self.assertIsNone(proc_kwargs['original_filename'])
-
-        mock_forward.s.assert_called_once()
-        fwd_kwargs = mock_forward.s.call_args[1]
-        self.assertEqual(fwd_kwargs['authorization'], 'Bearer test_token')
-
-    @patch('backend.services.data_process_service.chain')
-    @patch('backend.services.data_process_service.forward')
-    @patch('backend.services.data_process_service.process')
+        mock_submit_chain.assert_called_once()
+        kwargs = mock_submit_chain.call_args[1]
+        self.assertEqual(kwargs['source'], 'http://example.com/doc1.pdf')
+        self.assertEqual(kwargs['index_name'], 'test_index_1')
+        self.assertIsNone(kwargs['source_type'])
+        self.assertIsNone(kwargs['chunking_strategy'])
+        self.assertIsNone(kwargs['original_filename'])
+        self.assertEqual(kwargs['authorization'], 'Bearer test_token')
+
+    @patch('backend.services.data_process_service.submit_process_forward_chain')
     @pytest.mark.asyncio
-    async def async_test_create_batch_tasks_impl_no_authorization(self, mock_process, mock_forward, mock_chain):
+    async def async_test_create_batch_tasks_impl_no_authorization(self, mock_submit_chain):
         """
         Async implementation for testing batch task creation without authorization.
 
@@ -1983,18 +1858,8 @@ async def async_test_create_batch_tasks_impl_no_authorization(self, mock_process
         2. None is passed as authorization parameter
         3. The method processes all valid sources
         """
-        # Setup signature mocks
-        process_sig = MagicMock()
-        process_sig.set.return_value = process_sig
-        forward_sig = MagicMock()
-        forward_sig.set.return_value = forward_sig
-        mock_process.s.return_value = process_sig
-        mock_forward.s.return_value = forward_sig
-        chain_inst = MagicMock()
-        chain_inst.apply_async.return_value = MagicMock(id="task_id_1")
-        mock_chain.return_value = chain_inst
-
-        # Create test request
+        mock_submit_chain.return_value = "task_id_1"
+
         from consts.model import BatchTaskRequest
         request = BatchTaskRequest(
             sources=[
@@ -2008,19 +1873,15 @@ async def async_test_create_batch_tasks_impl_no_authorization(self, mock_process
             ]
         )
 
-        # Create batch tasks without authorization
         result = await self.service.create_batch_tasks_impl(None, request)
 
-        # Verify result
         self.assertEqual(len(result), 1)
         self.assertEqual(result[0], "task_id_1")
-
-        # Verify forward.s called with None authorization
-        mock_forward.s.assert_called_once()
-        fwd_kwargs = mock_forward.s.call_args[1]
-        self.assertEqual(fwd_kwargs['source'], 'http://example.com/doc1.pdf')
-        self.assertEqual(fwd_kwargs['index_name'], 'test_index_1')
-        self.assertIsNone(fwd_kwargs['authorization'])
+        mock_submit_chain.assert_called_once()
+        kwargs = mock_submit_chain.call_args[1]
+        self.assertEqual(kwargs['source'], 'http://example.com/doc1.pdf')
+        self.assertEqual(kwargs['index_name'], 'test_index_1')
+        self.assertIsNone(kwargs['authorization'])
 
     def test_create_batch_tasks_impl(self):
         """
@@ -2057,11 +1918,14 @@ async def async_test_process_uploaded_text_file(self, mock_data_process_core):
         """
         # Arrange: mock DataProcessCore.file_process to return mixed chunks
         mock_instance = MagicMock()
-        mock_instance.file_process.return_value = [
-            {"content": "First chunk"},
-            {"no_content": True},
-            {"content": "Second chunk"},
-        ]
+        mock_instance.file_process.return_value = (
+            [
+                {"content": "First chunk"},
+                {"no_content": True},
+                {"content": "Second chunk"},
+            ],
+            []  # images_info
+        )
         mock_data_process_core.return_value = mock_instance
 
         filename = "test.txt"
diff --git a/test/backend/services/test_mcp_service.py b/test/backend/services/test_mcp_service.py
index f5443bac7..280e96954 100644
--- a/test/backend/services/test_mcp_service.py
+++ b/test/backend/services/test_mcp_service.py
@@ -432,6 +432,10 @@ def test_mixed_special_chars(self):
 class TestRegisterOpenapiService:
     """Test register_openapi_service function"""
 
+    @staticmethod
+    def _headers_template():
+        return {}
+
     def test_register_service_success(self):
         """Test successful OpenAPI service registration"""
         service_name = "test_service"
@@ -442,7 +446,12 @@ def test_register_service_success(self):
         }
         server_url = "https://api.example.com"
 
-        result = mcp_service.register_openapi_service(service_name, openapi_json, server_url)
+        result = mcp_service.register_openapi_service(
+            service_name,
+            openapi_json,
+            server_url,
+            self._headers_template()
+        )
 
         assert result is True
         assert service_name in mcp_service._openapi_mcp_services
@@ -450,12 +459,12 @@ def test_register_service_success(self):
 
     def test_register_service_empty_name(self):
         """Test registration with empty service name"""
-        result = mcp_service.register_openapi_service("", {}, "https://api.example.com")
+        result = mcp_service.register_openapi_service("", {}, "https://api.example.com", self._headers_template())
         assert result is False
 
     def test_register_service_none_name(self):
         """Test registration with None service name"""
-        result = mcp_service.register_openapi_service(None, {}, "https://api.example.com")
+        result = mcp_service.register_openapi_service(None, {}, "https://api.example.com", self._headers_template())
         assert result is False
 
     def test_register_duplicate_service(self):
@@ -464,11 +473,21 @@ def test_register_duplicate_service(self):
         openapi_json = {"openapi": "3.0.0", "info": {}, "paths": {}}
 
         # First registration
-        result1 = mcp_service.register_openapi_service(service_name, openapi_json, "https://api.example.com")
+        result1 = mcp_service.register_openapi_service(
+            service_name,
+            openapi_json,
+            "https://api.example.com",
+            self._headers_template()
+        )
         assert result1 is True
 
         # Second registration should fail
-        result2 = mcp_service.register_openapi_service(service_name, openapi_json, "https://api.example.com")
+        result2 = mcp_service.register_openapi_service(
+            service_name,
+            openapi_json,
+            "https://api.example.com",
+            self._headers_template()
+        )
         assert result2 is False
 
     def test_register_service_without_server_url(self):
@@ -476,7 +495,7 @@ def test_register_service_without_server_url(self):
         service_name = "no_url_service"
         openapi_json = {"openapi": "3.0.0", "info": {}, "paths": {}}
 
-        result = mcp_service.register_openapi_service(service_name, openapi_json, "")
+        result = mcp_service.register_openapi_service(service_name, openapi_json, "", self._headers_template())
 
         assert result is True
 
@@ -487,12 +506,46 @@ def test_register_service_copies_openapi_spec(self):
 
         original_json = openapi_json.copy()
 
-        mcp_service.register_openapi_service(service_name, openapi_json, "https://api.example.com")
+        mcp_service.register_openapi_service(
+            service_name,
+            openapi_json,
+            "https://api.example.com",
+            self._headers_template()
+        )
 
         # Verify original was not modified
         assert openapi_json == original_json
         assert "servers" not in openapi_json
 
+    @patch.object(mcp_service, 'FastMCP')
+    @patch.object(mcp_service.httpx, 'AsyncClient')
+    def test_register_service_passes_headers_template_to_async_client(
+        self, mock_async_client, mock_fastmcp
+    ):
+        """Test registration passes headers_template to HTTP client."""
+        mock_client = MagicMock()
+        mock_async_client.return_value = mock_client
+        mock_fastmcp.from_openapi.return_value = MagicMock()
+        headers_template = {
+            "Authorization": "Bearer {{token}}",
+            "X-Tenant-ID": "{{tenant_id}}"
+        }
+
+        result = mcp_service.register_openapi_service(
+            "headers_service",
+            {"openapi": "3.0.0", "info": {}, "paths": {}},
+            "https://api.example.com",
+            headers_template
+        )
+
+        assert result is True
+        mock_async_client.assert_called_once_with(
+            base_url="https://api.example.com",
+            timeout=120.0,
+            headers=headers_template
+        )
+        mock_fastmcp.from_openapi.assert_called_once()
+
     @patch.object(mcp_service, 'FastMCP')
     def test_register_service_from_openapi_failure(self, mock_fastmcp):
         """Test handling of FastMCP.from_openapi failure"""
@@ -501,7 +554,8 @@ def test_register_service_from_openapi_failure(self, mock_fastmcp):
         result = mcp_service.register_openapi_service(
             "fail_service",
             {"openapi": "3.0.0", "info": {}, "paths": {}},
-            "https://api.example.com"
+            "https://api.example.com",
+            self._headers_template()
         )
 
         assert result is False
@@ -515,7 +569,8 @@ def test_register_service_returns_none(self, mock_fastmcp):
         result = mcp_service.register_openapi_service(
             "none_service",
             {"openapi": "3.0.0", "info": {}, "paths": {}},
-            "https://api.example.com"
+            "https://api.example.com",
+            self._headers_template()
         )
 
         assert result is False
@@ -652,6 +707,38 @@ def test_refresh_clears_existing_services(self):
         assert "old_service" not in mcp_service._openapi_mcp_services
         assert "new_service" in mcp_service._openapi_mcp_services
 
+    @patch.object(mcp_service, 'register_openapi_service')
+    def test_refresh_passes_headers_template_to_register(self, mock_register):
+        """Test refresh passes headers_template to register_openapi_service."""
+        services_data = [
+            {
+                "mcp_service_name": "api_service_1",
+                "openapi_json": {"openapi": "3.0.0", "info": {}, "paths": {}},
+                "server_url": "https://api1.example.com",
+                "headers_template": {
+                    "Authorization": "Bearer {{token}}",
+                    "X-Tenant-ID": "{{tenant_id}}"
+                }
+            }
+        ]
+        mcp_service.query_available_openapi_services.return_value = services_data
+        mock_register.return_value = True
+
+        result = mcp_service.refresh_openapi_services_by_tenant("tenant1")
+
+        assert result["registered"] == 1
+        assert result["skipped"] == 0
+        assert result["total"] == 1
+        mock_register.assert_called_once_with(
+            "api_service_1",
+            {"openapi": "3.0.0", "info": {}, "paths": {}},
+            "https://api1.example.com",
+            {
+                "Authorization": "Bearer {{token}}",
+                "X-Tenant-ID": "{{tenant_id}}"
+            }
+        )
+
     def test_refresh_remounts_local_service(self):
         """Test that refresh re-mounts local MCP service"""
         mcp_service.query_available_openapi_services.return_value = []
@@ -672,13 +759,21 @@ def test_refresh_remounts_local_service(self):
 class TestRefreshSingleOpenapiService:
     """Test refresh_single_openapi_service function"""
 
+    @staticmethod
+    def _headers_template():
+        return {
+            "Authorization": "Bearer {{token}}",
+            "X-Tenant-ID": "{{tenant_id}}"
+        }
+
     def test_refresh_existing_service(self):
         """Test refreshing an existing service"""
         services_data = [
             {
                 "mcp_service_name": "target_service",
                 "openapi_json": {"openapi": "3.0.0", "info": {}, "paths": {}},
-                "server_url": "https://api.example.com"
+                "server_url": "https://api.example.com",
+                "headers_template": self._headers_template()
             }
         ]
         mcp_service.query_available_openapi_services.return_value = services_data
@@ -737,7 +832,8 @@ def test_refresh_removes_old_instance(self):
             {
                 "mcp_service_name": "old_service",
                 "openapi_json": {"openapi": "3.0.0", "info": {}, "paths": {}},
-                "server_url": "https://api.example.com"
+                "server_url": "https://api.example.com",
+                "headers_template": self._headers_template()
             }
         ]
         mcp_service.query_available_openapi_services.return_value = services_data
@@ -746,6 +842,30 @@ def test_refresh_removes_old_instance(self):
 
         assert result["status"] == "refreshed"
 
+    @patch.object(mcp_service, 'register_openapi_service')
+    def test_refresh_existing_service_passes_headers_template(self, mock_register):
+        """Test refreshing a service passes headers_template to register_openapi_service."""
+        services_data = [
+            {
+                "mcp_service_name": "target_service",
+                "openapi_json": {"openapi": "3.0.0", "info": {}, "paths": {}},
+                "server_url": "https://api.example.com",
+                "headers_template": self._headers_template()
+            }
+        ]
+        mcp_service.query_available_openapi_services.return_value = services_data
+        mock_register.return_value = True
+
+        result = mcp_service.refresh_single_openapi_service("target_service", "tenant1")
+
+        assert result["status"] == "refreshed"
+        mock_register.assert_called_once_with(
+            "target_service",
+            {"openapi": "3.0.0", "info": {}, "paths": {}},
+            "https://api.example.com",
+            self._headers_template()
+        )
+
     def test_refresh_deleted_service_removes_from_mounted_servers(self):
         """Test that deleting a service removes it from mounted_servers"""
         service_name = "mounted_delete_test"
@@ -834,14 +954,13 @@ def test_app_creates_once(self):
     def test_app_has_routes(self):
         """Test that app has expected routes"""
         app = mcp_service.get_mcp_management_app()
+        paths = app.openapi()["paths"]
 
-        routes = [route.path for route in app.routes]
-
-        assert "/tools/outer_api/refresh" in routes
-        assert "/tools/openapi_service/refresh" in routes
-        assert "/tools/openapi_service" in routes
-        assert "/tools/openapi_service/{service_name}/refresh" in routes
-        assert "/tools/outer_api" in routes
+        assert "/tools/outer_api/refresh" in paths
+        assert "/tools/openapi_service/refresh" in paths
+        assert "/tools/openapi_service" in paths
+        assert "/tools/openapi_service/{service_name}/refresh" in paths
+        assert "/tools/outer_api" in paths
 
 
 # ---------------------------------------------------------------------------
@@ -1006,7 +1125,11 @@ async def test_refresh_single_service_success(self):
             {
                 "mcp_service_name": "target_service",
                 "openapi_json": {"openapi": "3.0.0", "info": {}, "paths": {}},
-                "server_url": "https://api.example.com"
+                "server_url": "https://api.example.com",
+                "headers_template": {
+                    "Authorization": "Bearer {{token}}",
+                    "X-Tenant-ID": "{{tenant_id}}"
+                }
             }
         ]
 
diff --git a/test/backend/services/test_northbound_service.py b/test/backend/services/test_northbound_service.py
index 0d658e198..e98fc4ca1 100644
--- a/test/backend/services/test_northbound_service.py
+++ b/test/backend/services/test_northbound_service.py
@@ -1,93 +1,148 @@
+"""
+Tests for backend.services.northbound_service module.
+
+This module tests the northbound-facing service layer functions including:
+- Streaming chat (start/stop)
+- Conversation management (list, history, title update)
+- Agent info listing
+- Rate limiting and idempotency
+"""
 import sys
 import os
-sys.path.insert(0, os.path.join(os.path.dirname(__file__), "../../.."))
+import types
+from unittest.mock import MagicMock, AsyncMock, patch
 
 import pytest
-from unittest.mock import MagicMock, AsyncMock, patch
 
+# Add project root to path
+sys.path.insert(0, os.path.join(os.path.dirname(__file__), "../../.."))
+
+# =============================================================================
+# Mock all required modules BEFORE importing northbound_service
+# =============================================================================
 
-# First mock the consts module to avoid ModuleNotFoundError
-consts_mock = MagicMock()
-consts_mock.const = MagicMock()
-consts_mock.const.MINIO_ENDPOINT = "http://localhost:9000"
-consts_mock.const.MINIO_ACCESS_KEY = "test_access_key"
-consts_mock.const.MINIO_SECRET_KEY = "test_secret_key"
-consts_mock.const.MINIO_REGION = "us-east-1"
-consts_mock.const.MINIO_DEFAULT_BUCKET = "test-bucket"
-consts_mock.const.POSTGRES_HOST = "localhost"
-consts_mock.const.POSTGRES_USER = "test_user"
-consts_mock.const.NEXENT_POSTGRES_PASSWORD = "test_password"
-consts_mock.const.POSTGRES_DB = "test_db"
-consts_mock.const.POSTGRES_PORT = 5432
-consts_mock.const.DEFAULT_TENANT_ID = "default_tenant"
-
-sys.modules['consts'] = consts_mock
-sys.modules['consts.const'] = consts_mock.const
-
-# Mock exceptions module
+# Mock consts.exceptions
 class LimitExceededError(Exception):
     pass
 
 class UnauthorizedError(Exception):
     pass
 
-exceptions_mock = MagicMock()
-exceptions_mock.LimitExceededError = LimitExceededError
-exceptions_mock.UnauthorizedError = UnauthorizedError
-sys.modules['consts.exceptions'] = exceptions_mock
-sys.modules['backend.consts.exceptions'] = exceptions_mock
-
-# Mock database client
-client_mock = MagicMock()
-client_mock.MinioClient = MagicMock()
-client_mock.get_db_session = MagicMock()
-sys.modules['database.client'] = client_mock
-sys.modules['backend.database.client'] = client_mock
-
-# Mock token_db module
-token_db_mock = MagicMock()
-token_db_mock.log_token_usage = MagicMock(return_value=1)
-token_db_mock.get_latest_usage_metadata = MagicMock(return_value={"query": "test"})
-sys.modules['database.token_db'] = token_db_mock
-sys.modules['backend.database.token_db'] = token_db_mock
-
-# Mock conversation_db module
-conversation_db_mock = MagicMock()
-conversation_db_mock.get_conversation_messages = MagicMock(return_value=[
+class ConversationNotFoundError(Exception):
+    pass
+
+consts_exceptions_mod = types.ModuleType("consts.exceptions")
+consts_exceptions_mod.LimitExceededError = LimitExceededError
+consts_exceptions_mod.UnauthorizedError = UnauthorizedError
+consts_exceptions_mod.ConversationNotFoundError = ConversationNotFoundError
+sys.modules["consts.exceptions"] = consts_exceptions_mod
+sys.modules["backend.consts.exceptions"] = consts_exceptions_mod
+
+# Mock consts.const
+consts_const_mod = types.ModuleType("consts.const")
+consts_const_mod.ASSET_OWNER_TENANT_ID = "asset-owner-tenant"
+sys.modules["consts.const"] = consts_const_mod
+
+# Mock consts package
+consts_package = types.ModuleType("consts")
+consts_package.exceptions = consts_exceptions_mod
+consts_package.const = consts_const_mod
+sys.modules["consts"] = consts_package
+
+# Mock database modules
+db_client_mod = types.ModuleType("database.client")
+db_client_mod.get_db_session = MagicMock()
+db_client_mod.as_dict = MagicMock()
+sys.modules["database.client"] = db_client_mod
+sys.modules["backend.database.client"] = db_client_mod
+
+db_package = types.ModuleType("database")
+db_package.client = db_client_mod
+sys.modules["database"] = db_package
+
+# Mock token_db
+token_db_mod = types.ModuleType("database.token_db")
+token_db_mod.log_token_usage = MagicMock(return_value=1)
+token_db_mod.get_latest_usage_metadata = MagicMock(return_value={"query": "test"})
+sys.modules["database.token_db"] = token_db_mod
+
+# Mock conversation_db
+conversation_db_mod = types.ModuleType("database.conversation_db")
+conversation_db_mod.get_conversation_messages = MagicMock(return_value=[
     {"message_role": "user", "message_content": "Hello"}
 ])
-sys.modules['database.conversation_db'] = conversation_db_mock
-sys.modules['backend.database.conversation_db'] = conversation_db_mock
-
-# Mock agent_service module
-agent_service_mock = MagicMock()
-agent_service_mock.run_agent_stream = AsyncMock()
-agent_service_mock.stop_agent_tasks = MagicMock(return_value={"message": "stopped"})
-agent_service_mock.list_all_agent_info_impl = AsyncMock(return_value=[{"agent_id": 1, "name": "test_agent"}])
-agent_service_mock.get_agent_id_by_name = AsyncMock(return_value=1)
-sys.modules['services.agent_service'] = agent_service_mock
-sys.modules['backend.services.agent_service'] = agent_service_mock
-
-# Mock conversation_management_service module
-conv_mgmt_mock = MagicMock()
-conv_mgmt_mock.save_conversation_user = MagicMock()
-conv_mgmt_mock.get_conversation_list_service = MagicMock(return_value=[
+conversation_db_mod.get_source_searches_by_message = MagicMock(return_value=[])
+sys.modules["database.conversation_db"] = conversation_db_mod
+
+# Mock attachment_db
+attachment_db_mod = types.ModuleType("database.attachment_db")
+attachment_db_mod.build_s3_url = MagicMock(return_value="s3://bucket/file")
+attachment_db_mod.get_file_url = MagicMock(return_value={"success": True, "url": "https://proxy.example/file"})
+attachment_db_mod.get_file_size_from_minio = MagicMock(return_value=0)
+attachment_db_mod._build_mcp_presigned_url = MagicMock(side_effect=lambda url: url)
+sys.modules["database.attachment_db"] = attachment_db_mod
+
+# Mock nexent.multi_modal.utils
+nexent_utils_mod = types.ModuleType("nexent.multi_modal.utils")
+nexent_utils_mod.parse_s3_url = MagicMock(return_value=("bucket", "path/file.txt"))
+sys.modules["nexent"] = types.ModuleType("nexent")
+sys.modules["nexent.multi_modal"] = types.ModuleType("nexent.multi_modal")
+sys.modules["nexent.multi_modal.utils"] = nexent_utils_mod
+
+# Mock services modules
+services_package = types.ModuleType("services")
+
+# Mock agent_service
+agent_service_mod = types.ModuleType("services.agent_service")
+agent_service_mod.run_agent_stream = AsyncMock()
+agent_service_mod.stop_agent_tasks = MagicMock(return_value={"message": "stopped"})
+agent_service_mod.get_agent_id_by_name = AsyncMock(return_value=1)
+sys.modules["services.agent_service"] = agent_service_mod
+
+# Mock conversation_management_service
+conv_mgmt_mod = types.ModuleType("services.conversation_management_service")
+conv_mgmt_mod.save_conversation_user = MagicMock()
+conv_mgmt_mod.get_conversation_list_service = MagicMock(return_value=[
     {"conversation_id": "1", "title": "Test"}
 ])
-conv_mgmt_mock.create_new_conversation = MagicMock(return_value={"conversation_id": 123})
-conv_mgmt_mock.update_conversation_title_service = MagicMock()
-sys.modules['services.conversation_management_service'] = conv_mgmt_mock
-sys.modules['backend.services.conversation_management_service'] = conv_mgmt_mock
-
-# Mock consts.model
-consts_model_mock = MagicMock()
-AgentRequest_mock = MagicMock()
-consts_model_mock.AgentRequest = AgentRequest_mock
-sys.modules['consts.model'] = consts_model_mock
+conv_mgmt_mod.create_new_conversation = MagicMock(return_value={"conversation_id": 123})
+conv_mgmt_mod.update_conversation_title = MagicMock()
+sys.modules["services.conversation_management_service"] = conv_mgmt_mod
+
+# Mock agent_version_service
+agent_version_mod = types.ModuleType("services.agent_version_service")
+agent_version_mod.list_published_agents_impl = AsyncMock(return_value=[
+    {"agent_id": 1, "name": "test_agent", "description": "Test agent"}
+])
+sys.modules["services.agent_version_service"] = agent_version_mod
+
+# Mock file_management_service
+file_mgmt_mod = types.ModuleType("services.file_management_service")
+file_mgmt_mod.upload_to_minio = AsyncMock(return_value=[])
+file_mgmt_mod.resolve_minio_upload_folder = MagicMock(return_value="attachments/user")
+file_mgmt_mod.validate_urls_access = MagicMock()
+sys.modules["services.file_management_service"] = file_mgmt_mod
+
+# Add to services package
+services_package.agent_service = agent_service_mod
+services_package.agent_version_service = agent_version_mod
+services_package.conversation_management_service = conv_mgmt_mod
+services_package.file_management_service = file_mgmt_mod
+sys.modules["services"] = services_package
+
+# Mock consts.model - create stub classes
+class AgentRequestStub:
+    def __init__(self, **kwargs):
+        for k, v in kwargs.items():
+            setattr(self, k, v)
+
+class ToolParamsRequestStub:
+    pass
 
-# Mock database.db_models
-db_models_mock = MagicMock()
-sys.modules['database.db_models'] = db_models_mock
+consts_model_mod = types.ModuleType("consts.model")
+consts_model_mod.AgentRequest = AgentRequestStub
+consts_model_mod.ToolParamsRequest = ToolParamsRequestStub
+sys.modules["consts.model"] = consts_model_mod
 
 # Now import the module under test
 from backend.services import northbound_service as ns
@@ -107,13 +162,12 @@ def __init__(self, request_id="req-123", tenant_id="tenant-1", user_id="user-1",
 @pytest.fixture(autouse=True)
 def reset_test_isolation():
     """Reset test isolation state before each test."""
-    # Clear idempotency state
     ns._IDEMPOTENCY_RUNNING.clear()
-    # Reset mock call counts
-    token_db_mock.log_token_usage.reset_mock()
+    ns._RATE_STATE.clear()
+    token_db_mod.log_token_usage.reset_mock()
     yield
-    # Cleanup after test
     ns._IDEMPOTENCY_RUNNING.clear()
+    ns._RATE_STATE.clear()
 
 
 class TestNorthboundContext:
@@ -149,23 +203,155 @@ def test_build_idempotency_key_normal(self):
         key = ns._build_idempotency_key("tenant1", "123", "agent1", "query")
         assert "tenant1" in key
         assert "123" in key
+        assert key.count(":") == 3
 
     def test_build_idempotency_key_with_none(self):
-        """Test with None values."""
+        """Test with None values are converted to empty string."""
         key = ns._build_idempotency_key("tenant1", None, "query")
         assert "tenant1" in key
-        # None values are converted to empty string
         assert "None" not in key
-        # Should contain the empty string from None conversion
-        assert "tenant1::" in key or ":query" in key
 
-    def test_build_idempotency_key_long_string(self):
+    def test_build_idempotency_key_long_string_hashed(self):
         """Test with long string gets hashed."""
         long_string = "a" * 100
         key = ns._build_idempotency_key(long_string)
-        # Should be hashed (not the full string)
         assert len(key) < 100
 
+    def test_build_idempotency_key_mixed_long_short(self):
+        """Test with mixed long and short values."""
+        long_val = "x" * 100
+        key = ns._build_idempotency_key("short", long_val, "another_short")
+        assert len(key) < 200
+
+    def test_build_idempotency_key_empty(self):
+        """Test with all empty values."""
+        key = ns._build_idempotency_key()
+        assert key == ""
+
+    def test_build_idempotency_key_single_value(self):
+        """Test with single value."""
+        key = ns._build_idempotency_key("only")
+        assert key == "only"
+
+
+class TestBuildTitleUpdateIdempotencyKey:
+    """Tests for _build_title_update_idempotency_key function."""
+
+    def test_title_update_key_format(self):
+        """Test that title is hashed in the key."""
+        key = ns._build_title_update_idempotency_key("tenant1", 123, "My Title")
+        assert "tenant1" in key
+        assert "123" in key
+        # Title should be hashed (SHA256 hex = 64 chars)
+        parts = key.split(":")
+        assert len(parts) == 3
+        assert len(parts[2]) == 64  # SHA256 hex digest
+
+    def test_title_update_key_different_titles_different_keys(self):
+        """Test that different titles produce different keys."""
+        key1 = ns._build_title_update_idempotency_key("tenant", 1, "Title A")
+        key2 = ns._build_title_update_idempotency_key("tenant", 1, "Title B")
+        assert key1 != key2
+
+    def test_title_update_key_same_inputs_same_key(self):
+        """Test that same inputs produce same key."""
+        key1 = ns._build_title_update_idempotency_key("tenant", 1, "Same Title")
+        key2 = ns._build_title_update_idempotency_key("tenant", 1, "Same Title")
+        assert key1 == key2
+
+
+class TestIdempotencyStartEnd:
+    """Tests for idempotency_start and idempotency_end functions."""
+
+    @pytest.mark.asyncio
+    async def test_idempotency_start_new_key(self):
+        """Test starting idempotency with new key succeeds."""
+        await ns.idempotency_start("new-key")
+        assert "new-key" in ns._IDEMPOTENCY_RUNNING
+
+    @pytest.mark.asyncio
+    async def test_idempotency_start_duplicate_key_raises(self):
+        """Test that duplicate key raises LimitExceededError."""
+        await ns.idempotency_start("duplicate-key")
+        with pytest.raises(LimitExceededError):
+            await ns.idempotency_start("duplicate-key")
+
+    @pytest.mark.asyncio
+    async def test_idempotency_end_removes_key(self):
+        """Test that idempotency_end removes the key."""
+        await ns.idempotency_start("end-key")
+        assert "end-key" in ns._IDEMPOTENCY_RUNNING
+        await ns.idempotency_end("end-key")
+        assert "end-key" not in ns._IDEMPOTENCY_RUNNING
+
+    @pytest.mark.asyncio
+    async def test_idempotency_end_nonexistent_key(self):
+        """Test that ending nonexistent key does not raise."""
+        await ns.idempotency_end("nonexistent-key")  # Should not raise
+
+    @pytest.mark.asyncio
+    async def test_idempotency_expired_key_can_be_reused(self, reset_test_isolation):
+        """Test that expired keys can be reused after TTL."""
+        # Use a very short TTL
+        await ns.idempotency_start("expire-key", ttl_seconds=1)
+        assert "expire-key" in ns._IDEMPOTENCY_RUNNING
+        # Wait for expiration
+        import asyncio
+        await asyncio.sleep(1.1)
+        # Should be able to start again with same key
+        await ns.idempotency_start("expire-key", ttl_seconds=1)
+
+
+class TestRateLimiting:
+    """Tests for rate limiting functionality."""
+
+    @pytest.mark.asyncio
+    async def test_rate_limit_first_request_allowed(self):
+        """Test first request under limit is allowed."""
+        await ns.check_and_consume_rate_limit("tenant-rate")
+        assert ns._RATE_STATE["tenant-rate"].get(ns._minute_bucket(), 0) == 1
+
+    @pytest.mark.asyncio
+    async def test_rate_limit_multiple_requests(self):
+        """Test multiple requests increment counter."""
+        for _ in range(5):
+            await ns.check_and_consume_rate_limit("tenant-multi")
+        assert ns._RATE_STATE["tenant-multi"].get(ns._minute_bucket(), 0) == 5
+
+    @pytest.mark.asyncio
+    async def test_rate_limit_exceeded_raises(self):
+        """Test that exceeding limit raises LimitExceededError."""
+        # Fill up to limit
+        for _ in range(ns._RATE_LIMIT_PER_MINUTE):
+            await ns.check_and_consume_rate_limit("tenant-limit")
+        with pytest.raises(LimitExceededError):
+            await ns.check_and_consume_rate_limit("tenant-limit")
+
+    @pytest.mark.asyncio
+    async def test_rate_limit_different_tenants(self):
+        """Test that different tenants have separate limits."""
+        for _ in range(10):
+            await ns.check_and_consume_rate_limit("tenant-a")
+        for _ in range(5):
+            await ns.check_and_consume_rate_limit("tenant-b")
+        assert ns._RATE_STATE["tenant-a"].get(ns._minute_bucket(), 0) == 10
+        assert ns._RATE_STATE["tenant-b"].get(ns._minute_bucket(), 0) == 5
+
+    @pytest.mark.asyncio
+    async def test_rate_limit_cleanup_old_buckets(self):
+        """Test that old minute buckets are cleaned up."""
+        # First, add a request to create an old bucket
+        old_bucket = str(int(ns._now_seconds() // 60) - 1)
+        ns._RATE_STATE["tenant-cleanup"] = {old_bucket: 50}
+        
+        # Make a new request - should trigger cleanup of old bucket
+        await ns.check_and_consume_rate_limit("tenant-cleanup")
+        
+        # Old bucket should be cleaned up, new bucket should have 1 request
+        current_bucket = ns._minute_bucket()
+        assert old_bucket not in ns._RATE_STATE["tenant-cleanup"]
+        assert ns._RATE_STATE["tenant-cleanup"].get(current_bucket, 0) == 1
+
 
 @pytest.mark.asyncio
 class TestStartStreamingChat:
@@ -173,30 +359,25 @@ class TestStartStreamingChat:
 
     async def test_start_streaming_chat_creates_conversation(self):
         """Test that new conversation is created when conversation_id is None."""
-        ctx = MockNorthboundContext(token_id=1)
+        ctx = MockNorthboundContext(token_id=0)
 
-        # Mock response
         mock_response = MagicMock()
         mock_response.headers = {}
-        agent_service_mock.run_agent_stream.return_value = mock_response
-
-        with patch.object(ns, 'check_and_consume_rate_limit', new_callable=AsyncMock):
-            with patch.object(ns, 'idempotency_start', new_callable=AsyncMock):
-                with patch.object(ns, 'get_conversation_history_internal', new_callable=AsyncMock) as mock_history:
-                    mock_history.return_value = {"data": {"history": []}}
-
-                    try:
-                        result = await ns.start_streaming_chat(
-                            ctx=ctx,
-                            conversation_id=None,
-                            agent_name="test_agent",
-                            query="test query"
-                        )
-                    except Exception:
-                        pass  # May fail due to other mocks
-
-                    # Verify create_new_conversation was called
-                    conv_mgmt_mock.create_new_conversation.assert_called()
+        agent_service_mod.run_agent_stream.return_value = mock_response
+
+        with patch.object(ns, 'check_and_consume_rate_limit', new_callable=AsyncMock), \
+                patch.object(ns, 'idempotency_start', new_callable=AsyncMock), \
+                patch.object(ns, 'get_conversation_history_internal', new_callable=AsyncMock) as mock_history:
+            mock_history.return_value = {"data": {"history": []}}
+
+            await ns.start_streaming_chat(
+                ctx=ctx,
+                conversation_id=None,
+                agent_name="test_agent",
+                query="test query"
+            )
+
+            conv_mgmt_mod.create_new_conversation.assert_called()
 
     async def test_start_streaming_chat_logs_token_usage(self):
         """Test that token usage is logged when token_id > 0."""
@@ -204,27 +385,113 @@ async def test_start_streaming_chat_logs_token_usage(self):
 
         mock_response = MagicMock()
         mock_response.headers = {}
-        agent_service_mock.run_agent_stream.return_value = mock_response
+        agent_service_mod.run_agent_stream.return_value = mock_response
+
+        with patch.object(ns, 'check_and_consume_rate_limit', new_callable=AsyncMock), \
+                patch.object(ns, 'idempotency_start', new_callable=AsyncMock), \
+                patch.object(ns, 'idempotency_end', new_callable=AsyncMock), \
+                patch.object(ns, 'get_conversation_history_internal', new_callable=AsyncMock) as mock_history:
+            mock_history.return_value = {"data": {"history": []}}
+
+            await ns.start_streaming_chat(
+                ctx=ctx,
+                conversation_id=123,
+                agent_name="test_agent",
+                query="test query",
+                meta_data={"key": "value"}
+            )
+
+            token_db_mod.log_token_usage.assert_called()
+
+    async def test_start_streaming_chat_rate_limit_exceeded(self):
+        """Test that rate limit exceeded is properly propagated."""
+        ctx = MockNorthboundContext(token_id=0)
+
+        with patch.object(ns, 'check_and_consume_rate_limit', new_callable=AsyncMock) as mock_limit:
+            mock_limit.side_effect = LimitExceededError("Rate exceeded")
+            with pytest.raises(LimitExceededError):
+                await ns.start_streaming_chat(
+                    ctx=ctx,
+                    conversation_id=123,
+                    agent_name="test_agent",
+                    query="test query"
+                )
+
+    async def test_start_streaming_chat_uses_existing_conversation(self):
+        """Test that existing conversation_id is used without creating new one."""
+        ctx = MockNorthboundContext(token_id=0)
+        conv_mgmt_mod.create_new_conversation.reset_mock()
+
+        mock_response = MagicMock()
+        mock_response.headers = {}
+        agent_service_mod.run_agent_stream.return_value = mock_response
+
+        async def mock_get_history(*args, **kwargs):
+            return {"data": {"history": []}}
+
+        with patch.object(ns, 'check_and_consume_rate_limit', new_callable=AsyncMock), \
+                patch.object(ns, 'idempotency_start', new_callable=AsyncMock), \
+                patch.object(ns, 'idempotency_end', new_callable=AsyncMock), \
+                patch.object(ns, 'get_conversation_history_internal', side_effect=mock_get_history):
+            await ns.start_streaming_chat(
+                ctx=ctx,
+                conversation_id=456,
+                agent_name="test_agent",
+                query="test query"
+            )
+
+            conv_mgmt_mod.create_new_conversation.assert_not_called()
+
+    async def test_start_streaming_chat_no_token_id_no_logging(self):
+        """Test that token usage is not logged when token_id is 0."""
+        ctx = MockNorthboundContext(token_id=0)
+        token_db_mod.log_token_usage.reset_mock()
+
+        mock_response = MagicMock()
+        mock_response.headers = {}
+        agent_service_mod.run_agent_stream.return_value = mock_response
+
+        async def mock_get_history(*args, **kwargs):
+            return {"data": {"history": []}}
+
+        with patch.object(ns, 'check_and_consume_rate_limit', new_callable=AsyncMock), \
+                patch.object(ns, 'idempotency_start', new_callable=AsyncMock), \
+                patch.object(ns, 'idempotency_end', new_callable=AsyncMock), \
+                patch.object(ns, 'get_conversation_history_internal', side_effect=mock_get_history):
+            await ns.start_streaming_chat(
+                ctx=ctx,
+                conversation_id=123,
+                agent_name="test_agent",
+                query="test query"
+            )
+
+            token_db_mod.log_token_usage.assert_not_called()
+
+    async def test_start_streaming_chat_with_attachments(self):
+        """Test streaming chat with attachment normalization."""
+        ctx = MockNorthboundContext(token_id=0)
+        attachments = ["s3://bucket/file.txt"]
+
+        mock_response = MagicMock()
+        mock_response.headers = {}
+        agent_service_mod.run_agent_stream.return_value = mock_response
 
-        with patch.object(ns, 'check_and_consume_rate_limit', new_callable=AsyncMock):
-            with patch.object(ns, 'idempotency_start', new_callable=AsyncMock):
-                with patch.object(ns, 'idempotency_end', new_callable=AsyncMock):
-                    with patch.object(ns, 'get_conversation_history_internal', new_callable=AsyncMock) as mock_history:
-                        mock_history.return_value = {"data": {"history": []}}
+        with patch.object(ns, 'check_and_consume_rate_limit', new_callable=AsyncMock), \
+                patch.object(ns, 'idempotency_start', new_callable=AsyncMock), \
+                patch.object(ns, 'idempotency_end', new_callable=AsyncMock), \
+                patch.object(ns, 'get_conversation_history_internal', new_callable=AsyncMock) as mock_history, \
+                patch.object(ns, '_normalize_northbound_attachments', return_value=[{"name": "file.txt"}]) as mock_norm:
+            mock_history.return_value = {"data": {"history": []}}
 
-                        try:
-                            await ns.start_streaming_chat(
-                                ctx=ctx,
-                                conversation_id=123,
-                                agent_name="test_agent",
-                                query="test query",
-                                meta_data={"key": "value"}
-                            )
-                        except Exception:
-                            pass
+            await ns.start_streaming_chat(
+                ctx=ctx,
+                conversation_id=123,
+                agent_name="test_agent",
+                query="test query",
+                attachments=attachments
+            )
 
-                        # Verify log_token_usage was called
-                        token_db_mock.log_token_usage.assert_called()
+            mock_norm.assert_called_once()
 
 
 @pytest.mark.asyncio
@@ -234,7 +501,7 @@ class TestStopChat:
     async def test_stop_chat_success(self):
         """Test successful stop chat."""
         ctx = MockNorthboundContext(token_id=1)
-        agent_service_mock.stop_agent_tasks.return_value = {"message": "stopped"}
+        agent_service_mod.stop_agent_tasks.return_value = {"message": "stopped"}
 
         result = await ns.stop_chat(ctx=ctx, conversation_id=123)
 
@@ -242,12 +509,22 @@ async def test_stop_chat_success(self):
         assert result["data"] == 123
 
     async def test_stop_chat_logs_token_usage(self):
-        """Test that token usage is logged."""
+        """Test that token usage is logged when token_id > 0."""
         ctx = MockNorthboundContext(token_id=1)
+        token_db_mod.log_token_usage.reset_mock()
 
         await ns.stop_chat(ctx=ctx, conversation_id=123, meta_data={"test": "data"})
 
-        token_db_mock.log_token_usage.assert_called()
+        token_db_mod.log_token_usage.assert_called()
+
+    async def test_stop_chat_no_token_id_no_logging(self):
+        """Test that token usage is not logged when token_id is 0."""
+        ctx = MockNorthboundContext(token_id=0)
+        token_db_mod.log_token_usage.reset_mock()
+
+        await ns.stop_chat(ctx=ctx, conversation_id=123)
+
+        token_db_mod.log_token_usage.assert_not_called()
 
 
 @pytest.mark.asyncio
@@ -256,7 +533,7 @@ class TestListConversations:
 
     async def test_list_conversations_success(self):
         """Test successful conversation listing."""
-        ctx = MockNorthboundContext(token_id=0)  # No token_id, no metadata lookup
+        ctx = MockNorthboundContext(token_id=0)
 
         result = await ns.list_conversations(ctx=ctx)
 
@@ -266,12 +543,11 @@ async def test_list_conversations_success(self):
     async def test_list_conversations_with_metadata(self):
         """Test that metadata is added when token_id > 0."""
         ctx = MockNorthboundContext(token_id=1)
-        token_db_mock.get_latest_usage_metadata.return_value = {"query": "test query"}
+        token_db_mod.get_latest_usage_metadata.return_value = {"query": "test query"}
 
         result = await ns.list_conversations(ctx=ctx)
 
-        # Should have called get_latest_usage_metadata
-        token_db_mock.get_latest_usage_metadata.assert_called()
+        token_db_mod.get_latest_usage_metadata.assert_called()
 
 
 @pytest.mark.asyncio
@@ -281,7 +557,7 @@ class TestGetConversationHistory:
     async def test_get_conversation_history_success(self):
         """Test successful history retrieval."""
         ctx = MockNorthboundContext(token_id=1)
-        conversation_db_mock.get_conversation_messages.return_value = [
+        conversation_db_mod.get_conversation_messages.return_value = [
             {"message_role": "user", "message_content": "Hello"},
             {"message_role": "assistant", "message_content": "Hi there"}
         ]
@@ -292,6 +568,19 @@ async def test_get_conversation_history_success(self):
         assert "data" in result
         assert "history" in result["data"]
 
+    async def test_get_conversation_history_fields_transformed(self):
+        """Test that message fields are properly transformed."""
+        ctx = MockNorthboundContext(token_id=0)
+        conversation_db_mod.get_conversation_messages.return_value = [
+            {"message_role": "user", "message_content": "Hello"}
+        ]
+
+        result = await ns.get_conversation_history(ctx=ctx, conversation_id=123)
+
+        history = result["data"]["history"]
+        assert history[0]["role"] == "user"
+        assert history[0]["content"] == "Hello"
+
 
 @pytest.mark.asyncio
 class TestGetConversationHistoryInternal:
@@ -300,7 +589,7 @@ class TestGetConversationHistoryInternal:
     async def test_get_conversation_history_internal_success(self):
         """Test internal history retrieval without logging."""
         ctx = MockNorthboundContext(token_id=0)
-        conversation_db_mock.get_conversation_messages.return_value = [
+        conversation_db_mod.get_conversation_messages.return_value = [
             {"message_role": "user", "message_content": "Hello"}
         ]
 
@@ -313,12 +602,12 @@ async def test_get_conversation_history_internal_success(self):
     async def test_get_conversation_history_internal_no_logging(self):
         """Test that internal function does not log token usage."""
         ctx = MockNorthboundContext(token_id=1)
-        conversation_db_mock.get_conversation_messages.return_value = []
+        conversation_db_mod.get_conversation_messages.return_value = []
+        token_db_mod.log_token_usage.reset_mock()
 
         await ns.get_conversation_history_internal(ctx=ctx, conversation_id=123)
 
-        # Should NOT call log_token_usage
-        token_db_mock.log_token_usage.assert_not_called()
+        token_db_mod.log_token_usage.assert_not_called()
 
 
 @pytest.mark.asyncio
@@ -326,9 +615,10 @@ class TestGetAgentInfoList:
     """Tests for get_agent_info_list function."""
 
     async def test_get_agent_info_list_success(self):
-        """Test successful agent info list retrieval."""
-        ctx = MockNorthboundContext(token_id=1)
-        agent_service_mock.list_all_agent_info_impl.return_value = [
+        """Test successful agent info list retrieval for asset owner tenant."""
+        # Use asset owner tenant to avoid merging asset owner agents
+        ctx = MockNorthboundContext(tenant_id="asset-owner-tenant", token_id=1)
+        agent_version_mod.list_published_agents_impl.return_value = [
             {"agent_id": 1, "name": "test_agent", "description": "Test"}
         ]
 
@@ -336,9 +626,21 @@ async def test_get_agent_info_list_success(self):
 
         assert result["message"] == "success"
         assert len(result["data"]) == 1
-        # agent_id should be removed
         assert "agent_id" not in result["data"][0]
 
+    async def test_get_agent_info_list_includes_asset_owner_agents(self):
+        """Test that asset owner agents are included for non-asset-owner tenants."""
+        ctx = MockNorthboundContext(tenant_id="other-tenant", token_id=0)
+        agent_version_mod.list_published_agents_impl.side_effect = [
+            [{"agent_id": 1, "name": "local_agent"}],
+            [{"agent_id": 2, "name": "asset_agent"}]
+        ]
+
+        result = await ns.get_agent_info_list(ctx=ctx)
+
+        assert len(result["data"]) == 2
+        agent_version_mod.list_published_agents_impl.assert_called()
+
 
 @pytest.mark.asyncio
 class TestUpdateConversationTitle:
@@ -359,8 +661,9 @@ async def test_update_conversation_title_success(self):
         assert "idempotency_key" in result
 
     async def test_update_conversation_title_logs_token_usage(self):
-        """Test that token usage is logged."""
+        """Test that token usage is logged when token_id > 0."""
         ctx = MockNorthboundContext(token_id=1)
+        token_db_mod.log_token_usage.reset_mock()
 
         await ns.update_conversation_title(
             ctx=ctx,
@@ -369,10 +672,10 @@ async def test_update_conversation_title_logs_token_usage(self):
             meta_data={"source": "api"}
         )
 
-        token_db_mock.log_token_usage.assert_called()
+        token_db_mod.log_token_usage.assert_called()
 
-    async def test_update_conversation_title_idempotency_key(self):
-        """Test that idempotency key is properly built."""
+    async def test_update_conversation_title_custom_idempotency_key(self):
+        """Test that custom idempotency key is used when provided."""
         ctx = MockNorthboundContext(tenant_id="tenant-1", token_id=1)
 
         result = await ns.update_conversation_title(
@@ -383,3 +686,726 @@ async def test_update_conversation_title_idempotency_key(self):
         )
 
         assert result["idempotency_key"] == "custom-key"
+
+    async def test_update_conversation_title_idempotency_prevents_duplicate(self):
+        """Test that duplicate requests within TTL are prevented."""
+        ctx = MockNorthboundContext(tenant_id="tenant-1", token_id=0)
+
+        # First call should succeed
+        await ns.update_conversation_title(
+            ctx=ctx,
+            conversation_id=123,
+            title="New Title"
+        )
+
+        # Second call with same params should raise LimitExceededError
+        with pytest.raises(LimitExceededError):
+            await ns.update_conversation_title(
+                ctx=ctx,
+                conversation_id=123,
+                title="New Title"
+            )
+
+
+class TestReleaseIdempotencyAfterDelay:
+    """Tests for _release_idempotency_after_delay function."""
+
+    @pytest.mark.asyncio
+    async def test_release_after_delay(self):
+        """Test that idempotency key is released after delay."""
+        import asyncio
+
+        await ns.idempotency_start("delayed-key")
+        assert "delayed-key" in ns._IDEMPOTENCY_RUNNING
+
+        asyncio.create_task(ns._release_idempotency_after_delay("delayed-key", seconds=0.1))
+        await asyncio.sleep(0.2)
+
+        assert "delayed-key" not in ns._IDEMPOTENCY_RUNNING
+
+
+class TestMinuteBucket:
+    """Tests for _minute_bucket helper function."""
+
+    def test_minute_bucket_returns_string(self):
+        """Test that minute bucket is a string."""
+        bucket = ns._minute_bucket()
+        assert isinstance(bucket, str)
+
+    def test_minute_bucket_consistent_for_same_time(self):
+        """Test that same time produces same bucket."""
+        ts = 1234567890.0
+        bucket1 = ns._minute_bucket(ts)
+        bucket2 = ns._minute_bucket(ts)
+        assert bucket1 == bucket2
+
+    def test_minute_bucket_different_for_different_minutes(self):
+        """Test that different minutes produce different buckets."""
+        ts1 = 1000000.0
+        ts2 = ts1 + 60
+        bucket1 = ns._minute_bucket(ts1)
+        bucket2 = ns._minute_bucket(ts2)
+        assert bucket1 != bucket2
+
+
+class TestStartStreamingChatErrorHandling:
+    """Tests for error handling in start_streaming_chat function."""
+
+    async def test_start_streaming_chat_unauthorized_error(self):
+        """Test that UnauthorizedError is properly propagated."""
+        ctx = MockNorthboundContext(token_id=0)
+
+        with patch.object(ns, 'check_and_consume_rate_limit', new_callable=AsyncMock) as mock_limit:
+            mock_limit.side_effect = UnauthorizedError("Unauthorized")
+            with pytest.raises(UnauthorizedError):
+                await ns.start_streaming_chat(
+                    ctx=ctx,
+                    conversation_id=123,
+                    agent_name="test_agent",
+                    query="test query"
+                )
+
+    async def test_start_streaming_chat_get_agent_id_error(self):
+        """Test that get_agent_id_by_name error is wrapped properly."""
+        ctx = MockNorthboundContext(token_id=0)
+
+        with patch.object(ns, 'check_and_consume_rate_limit', new_callable=AsyncMock), \
+                patch.object(ns, 'get_conversation_history_internal', new_callable=AsyncMock) as mock_history, \
+                patch.object(ns, 'get_agent_id_by_name', new_callable=AsyncMock) as mock_get_id:
+            mock_history.return_value = {"data": {"history": []}}
+            mock_get_id.side_effect = Exception("Agent not found")
+
+            with pytest.raises(Exception) as exc_info:
+                await ns.start_streaming_chat(
+                    ctx=ctx,
+                    conversation_id=123,
+                    agent_name="nonexistent_agent",
+                    query="test query"
+                )
+            # The exception is wrapped in the outer try/except block
+            assert "Agent not found" in str(exc_info.value)
+
+    async def test_start_streaming_chat_save_message_error(self):
+        """Test that save_conversation_user error is wrapped properly."""
+        ctx = MockNorthboundContext(token_id=0)
+
+        mock_response = MagicMock()
+        mock_response.headers = {}
+        agent_service_mod.run_agent_stream.return_value = mock_response
+
+        async def mock_get_history(*args, **kwargs):
+            return {"data": {"history": []}}
+
+        with patch.object(ns, 'check_and_consume_rate_limit', new_callable=AsyncMock), \
+                patch.object(ns, 'idempotency_start', new_callable=AsyncMock), \
+                patch.object(ns, 'idempotency_end', new_callable=AsyncMock), \
+                patch.object(ns, 'get_conversation_history_internal', side_effect=mock_get_history), \
+                patch.object(ns, 'save_conversation_user', side_effect=Exception("DB error")):
+            with pytest.raises(Exception) as exc_info:
+                await ns.start_streaming_chat(
+                    ctx=ctx,
+                    conversation_id=123,
+                    agent_name="test_agent",
+                    query="test query"
+                )
+            assert "Failed to persist user message" in str(exc_info.value)
+
+    async def test_start_streaming_chat_token_logging_failure(self):
+        """Test that token logging failure is handled gracefully."""
+        ctx = MockNorthboundContext(token_id=1)
+
+        mock_response = MagicMock()
+        mock_response.headers = {}
+        agent_service_mod.run_agent_stream.return_value = mock_response
+        token_db_mod.log_token_usage.side_effect = Exception("Logging failed")
+
+        async def mock_get_history(*args, **kwargs):
+            return {"data": {"history": []}}
+
+        with patch.object(ns, 'check_and_consume_rate_limit', new_callable=AsyncMock), \
+                patch.object(ns, 'idempotency_start', new_callable=AsyncMock), \
+                patch.object(ns, 'idempotency_end', new_callable=AsyncMock), \
+                patch.object(ns, 'get_conversation_history_internal', side_effect=mock_get_history):
+            # Should not raise even if token logging fails
+            result = await ns.start_streaming_chat(
+                ctx=ctx,
+                conversation_id=123,
+                agent_name="test_agent",
+                query="test query",
+                meta_data={"key": "value"}
+            )
+            assert result is not None
+
+
+class TestStopChatErrorHandling:
+    """Tests for error handling in stop_chat function."""
+
+    async def test_stop_chat_error(self):
+        """Test that errors in stop_chat are wrapped properly."""
+        ctx = MockNorthboundContext(token_id=0)
+        agent_service_mod.stop_agent_tasks.side_effect = Exception("Stop failed")
+
+        with pytest.raises(Exception) as exc_info:
+            await ns.stop_chat(ctx=ctx, conversation_id=123)
+        assert "Failed to stop chat" in str(exc_info.value)
+
+    async def test_stop_chat_token_logging_failure(self):
+        """Test that token logging failure is handled gracefully."""
+        ctx = MockNorthboundContext(token_id=1)
+        token_db_mod.log_token_usage.side_effect = Exception("Logging failed")
+
+        with patch("backend.services.northbound_service.stop_agent_tasks", return_value={"message": "stopped"}):
+            # Should not raise even if token logging fails
+            result = await ns.stop_chat(ctx=ctx, conversation_id=123, meta_data={"key": "value"})
+            assert result is not None
+
+
+class TestListConversationsErrorHandling:
+    """Tests for error handling in list_conversations function."""
+
+    async def test_list_conversations_with_metadata_error(self):
+        """Test that metadata fetch error is handled gracefully."""
+        ctx = MockNorthboundContext(token_id=1)
+        conv_mgmt_mod.get_conversation_list_service.return_value = [
+            {"conversation_id": "1", "title": "Test"}
+        ]
+        token_db_mod.get_latest_usage_metadata.side_effect = Exception("DB error")
+
+        # Should not raise even if metadata fetch fails
+        result = await ns.list_conversations(ctx=ctx)
+        assert result["message"] == "success"
+
+    async def test_list_conversations_empty_meta_data_removed(self):
+        """Test that empty meta_data keys are removed from items."""
+        ctx = MockNorthboundContext(token_id=1)
+        conv_mgmt_mod.get_conversation_list_service.return_value = [
+            {"conversation_id": "1", "title": "Test", "meta_data": {}}
+        ]
+
+        result = await ns.list_conversations(ctx=ctx)
+        assert "meta_data" not in result["data"][0]
+
+    async def test_list_conversations_meta_data_with_no_usage_record(self):
+        """Test that meta_data is removed when get_latest_usage_metadata returns empty."""
+        ctx = MockNorthboundContext(token_id=1)
+        conv_mgmt_mod.get_conversation_list_service.return_value = [
+            {"conversation_id": "1", "title": "Test"}
+        ]
+        token_db_mod.get_latest_usage_metadata.return_value = None
+
+        result = await ns.list_conversations(ctx=ctx)
+        assert "meta_data" not in result["data"][0]
+
+    async def test_list_conversations_meta_data_set_when_present(self):
+        """Test that meta_data is set on item when get_latest_usage_metadata returns a non-empty value."""
+        ctx = MockNorthboundContext(token_id=1)
+        conv_mgmt_mod.get_conversation_list_service.return_value = [
+            {"conversation_id": "1", "title": "Test"}
+        ]
+        # Reset side_effect and set return_value
+        token_db_mod.get_latest_usage_metadata.side_effect = None
+        token_db_mod.get_latest_usage_metadata.return_value = {"query": "test query"}
+
+        result = await ns.list_conversations(ctx=ctx)
+        assert "meta_data" in result["data"][0]
+        assert result["data"][0]["meta_data"]["query"] == "test query"
+
+    async def test_list_conversations_meta_data_empty_dict_removed(self):
+        """Test that empty meta_data (empty dict) is removed from item."""
+        ctx = MockNorthboundContext(token_id=1)
+        conv_mgmt_mod.get_conversation_list_service.return_value = [
+            {"conversation_id": "1", "title": "Test"}
+        ]
+        # Reset side_effect and set return_value to empty dict (falsy)
+        token_db_mod.get_latest_usage_metadata.side_effect = None
+        token_db_mod.get_latest_usage_metadata.return_value = {}
+
+        result = await ns.list_conversations(ctx=ctx)
+        # Empty dict is falsy, so meta_data should be popped
+        assert "meta_data" not in result["data"][0]
+
+
+class TestGetConversationHistoryErrorHandling:
+    """Tests for error handling in get_conversation_history function."""
+
+    async def test_get_conversation_history_error(self):
+        """Test that errors in get_conversation_history are wrapped properly."""
+        ctx = MockNorthboundContext(token_id=0)
+        # Mock get_conversation_messages to raise an error
+        conversation_db_mod.get_conversation_messages.side_effect = Exception("DB error")
+
+        with pytest.raises(Exception) as exc_info:
+            await ns.get_conversation_history(ctx=ctx, conversation_id=123)
+        assert "Failed to get conversation history" in str(exc_info.value)
+
+
+class TestGetAgentInfoListErrorHandling:
+    """Tests for get_agent_info_list function."""
+
+    @pytest.mark.asyncio
+    async def test_get_agent_info_by_name_success(self):
+        """Test successful agent ID retrieval."""
+        agent_service_mod.get_agent_id_by_name.return_value = 42
+        
+        result = await ns.get_agent_info_by_name("test_agent", "tenant-1")
+        assert result == 42
+
+    @pytest.mark.asyncio
+    async def test_get_agent_info_by_name_error(self):
+        """Test that errors are wrapped properly."""
+        agent_service_mod.get_agent_id_by_name.side_effect = Exception("Agent not found")
+        
+        with pytest.raises(Exception) as exc_info:
+            await ns.get_agent_info_by_name("nonexistent", "tenant-1")
+        assert "Failed to get agent id" in str(exc_info.value)
+        assert "nonexistent" in str(exc_info.value)
+        assert "tenant-1" in str(exc_info.value)
+
+    async def test_get_agent_info_list_error(self):
+        """Test that errors in get_agent_info_list are wrapped properly."""
+        ctx = MockNorthboundContext(tenant_id="asset-owner-tenant", token_id=0)
+        agent_version_mod.list_published_agents_impl.side_effect = Exception("DB error")
+
+        with pytest.raises(Exception) as exc_info:
+            await ns.get_agent_info_list(ctx=ctx)
+        assert "Failed to get agent info list" in str(exc_info.value)
+
+
+class TestUpdateConversationTitleErrorHandling:
+    """Tests for error handling in update_conversation_title function."""
+
+    async def test_update_conversation_title_error(self):
+        """Test that errors in update_conversation_title are wrapped properly."""
+        ctx = MockNorthboundContext(token_id=0)
+        conv_mgmt_mod.update_conversation_title.side_effect = Exception("DB error")
+
+        with pytest.raises(Exception) as exc_info:
+            await ns.update_conversation_title(
+                ctx=ctx,
+                conversation_id=123,
+                title="New Title"
+            )
+        assert "Failed to update conversation title" in str(exc_info.value)
+
+    async def test_update_conversation_title_token_logging_failure(self):
+        """Test that token logging failure is handled gracefully."""
+        ctx = MockNorthboundContext(token_id=1)
+        token_db_mod.log_token_usage.side_effect = Exception("Logging failed")
+        # Ensure update_conversation_title_service succeeds
+        conv_mgmt_mod.update_conversation_title.side_effect = None
+        conv_mgmt_mod.update_conversation_title.return_value = True
+
+        # Should not raise even if token logging fails
+        result = await ns.update_conversation_title(
+            ctx=ctx,
+            conversation_id=123,
+            title="New Title",
+            meta_data={"key": "value"}
+        )
+        assert result["message"] == "success"
+
+    async def test_update_conversation_title_conversation_not_found(self):
+        """Test that ConversationNotFoundError is propagated without wrapping."""
+        ctx = MockNorthboundContext(token_id=0)
+        conv_mgmt_mod.update_conversation_title.side_effect = ConversationNotFoundError("Not found")
+
+        with pytest.raises(ConversationNotFoundError):
+            await ns.update_conversation_title(
+                ctx=ctx,
+                conversation_id=123,
+                title="New Title"
+            )
+
+
+class TestNormalizeAttachmentsErrorHandling:
+    """Tests for error handling in _normalize_northbound_attachments function."""
+
+    def test_normalize_attachments_parse_s3_url_error(self):
+        """Test that parse_s3_url ValueError is converted to ValueError."""
+        with patch("backend.services.northbound_service.parse_s3_url", side_effect=ValueError("Parse error")):
+            with pytest.raises(ValueError) as exc_info:
+                ns._normalize_northbound_attachments(
+                    ["s3://bucket/file.txt"],
+                    "user123",
+                    "tenant123"
+                )
+            assert "Invalid S3 URL format" in str(exc_info.value)
+
+    def test_normalize_attachments_permission_error_invalid_url(self):
+        """Test that PermissionError with invalid URL is converted to ValueError."""
+        with patch("backend.services.northbound_service.parse_s3_url", return_value=("bucket", "path/file.txt")), \
+                patch("backend.services.northbound_service.validate_urls_access",
+                      side_effect=PermissionError("Invalid S3 URL format: bad")):
+            with pytest.raises(ValueError) as exc_info:
+                ns._normalize_northbound_attachments(
+                    ["s3://bucket/path/file.txt"],
+                    "user123",
+                    "tenant123"
+                )
+            assert "Invalid S3 URL format" in str(exc_info.value)
+
+    def test_normalize_attachments_invalid_type(self):
+        """Test that non-list attachments raise ValueError."""
+        with pytest.raises(ValueError) as exc_info:
+            ns._normalize_northbound_attachments("s3://bucket/file.txt", "user123", "tenant123")
+        assert "attachments must be an array" in str(exc_info.value)
+
+    def test_normalize_attachments_empty_list(self):
+        """Test that an empty list returns an empty list."""
+        assert ns._normalize_northbound_attachments([], "user123", "tenant123") == []
+
+    def test_normalize_attachments_invalid_url(self):
+        """Test that an unsupported URL scheme raises ValueError."""
+        with pytest.raises(ValueError) as exc_info:
+            ns._normalize_northbound_attachments(["https://example.com/file.txt"], "user123", "tenant123")
+        assert "Invalid attachment format" in str(exc_info.value) or "Invalid S3 URL format" in str(exc_info.value)
+
+    def test_normalize_attachments_empty_string(self):
+        """Test that an empty-string attachment raises ValueError."""
+        with pytest.raises(ValueError) as exc_info:
+            ns._normalize_northbound_attachments([""], "user123", "tenant123")
+        assert "non-empty" in str(exc_info.value)
+
+    def test_normalize_attachments_whitespace_string(self):
+        """Test that a whitespace-only attachment raises ValueError."""
+        with pytest.raises(ValueError) as exc_info:
+            ns._normalize_northbound_attachments(["  "], "user123", "tenant123")
+        assert "non-empty" in str(exc_info.value)
+
+    def test_normalize_attachments_permission_denied(self):
+        """Test that a generic PermissionError is re-raised as-is."""
+        with patch(
+            "backend.services.northbound_service.validate_urls_access",
+            side_effect=PermissionError("Access denied: You don't have permission to access this file")
+        ):
+            with pytest.raises(PermissionError) as exc_info:
+                ns._normalize_northbound_attachments(["s3://bucket/attachments/other/file.txt"], "user123", "tenant123")
+            assert "Access denied" in str(exc_info.value)
+
+    def test_normalize_attachments_s3_url_success(self):
+        """Test successful normalization of an s3:// URL with assertions on collaborator calls."""
+        with patch("backend.services.northbound_service.validate_urls_access") as mock_validate, \
+                patch("backend.services.northbound_service.get_file_url", return_value={
+                    "success": True,
+                    "url": "https://proxy.example/file"
+                }) as mock_get_url, \
+                patch("backend.services.northbound_service.parse_s3_url", return_value=("nexent", "attachments/user123/report.pdf")):
+            result = ns._normalize_northbound_attachments(
+                ["s3://nexent/attachments/user123/report.pdf"],
+                "user123",
+                "tenant123",
+            )
+
+        mock_validate.assert_called_once_with(
+            ["s3://nexent/attachments/user123/report.pdf"],
+            "user123",
+            "tenant123",
+        )
+        mock_get_url.assert_called_once_with(
+            object_name="attachments/user123/report.pdf",
+            expires=86400,
+        )
+        assert result == [{
+            "name": "report.pdf",
+            "object_name": "attachments/user123/report.pdf",
+            "url": "/nexent/attachments/user123/report.pdf",
+            "type": "file",
+            "size": 0,
+            "description": "",
+            "presigned_url": "https://proxy.example/file",
+        }]
+
+    def test_normalize_attachments_no_presigned_url(self):
+        """Test that presigned_url is omitted when get_file_url returns no url."""
+        with patch("backend.services.northbound_service.validate_urls_access"), \
+                patch("backend.services.northbound_service.get_file_url", return_value={
+                    "success": True,
+                    "url": None
+                }), \
+                patch("backend.services.northbound_service.parse_s3_url", return_value=("nexent", "attachments/user123/report.pdf")):
+            result = ns._normalize_northbound_attachments(
+                ["s3://nexent/attachments/user123/report.pdf"],
+                "user123",
+                "tenant123",
+            )
+        assert "presigned_url" not in result[0]
+
+    def test_normalize_attachments_relative_path(self):
+        """Test support for attachments/xxx.md relative path format."""
+        with patch("backend.services.northbound_service.validate_urls_access") as mock_validate, \
+                patch("backend.services.northbound_service.get_file_url", return_value={
+                    "success": True,
+                    "url": "https://proxy.example/file"
+                }) as mock_get_url:
+            result = ns._normalize_northbound_attachments(
+                ["attachments/user123/report.pdf"],
+                "user123",
+                "tenant123",
+            )
+
+        mock_validate.assert_called_once_with(
+            ["s3://nexent/attachments/user123/report.pdf"],
+            "user123",
+            "tenant123",
+        )
+        mock_get_url.assert_called_once_with(
+            object_name="attachments/user123/report.pdf",
+            expires=86400,
+        )
+        assert result == [{
+            "name": "report.pdf",
+            "object_name": "attachments/user123/report.pdf",
+            "url": "/nexent/attachments/user123/report.pdf",
+            "type": "file",
+            "size": 0,
+            "description": "",
+            "presigned_url": "https://proxy.example/file",
+        }]
+
+    def test_normalize_attachments_nexent_path(self):
+        """Test support for nexent/xxx.md path format."""
+        with patch("backend.services.northbound_service.validate_urls_access") as mock_validate, \
+                patch("backend.services.northbound_service.get_file_url", return_value={
+                    "success": True,
+                    "url": "https://proxy.example/file"
+                }) as mock_get_url:
+            result = ns._normalize_northbound_attachments(
+                ["nexent/attachments/user123/report.pdf"],
+                "user123",
+                "tenant123",
+            )
+
+        mock_validate.assert_called_once_with(
+            ["s3://nexent/nexent/attachments/user123/report.pdf"],
+            "user123",
+            "tenant123",
+        )
+        mock_get_url.assert_called_once_with(
+            object_name="nexent/attachments/user123/report.pdf",
+            expires=86400,
+        )
+        assert result == [{
+            "name": "report.pdf",
+            "object_name": "nexent/attachments/user123/report.pdf",
+            "url": "/nexent/nexent/attachments/user123/report.pdf",
+            "type": "file",
+            "size": 0,
+            "description": "",
+            "presigned_url": "https://proxy.example/file",
+        }]
+
+    def test_normalize_attachments_absolute_path(self):
+        """Test support for /nexent/xxx.md absolute path format."""
+        with patch("backend.services.northbound_service.validate_urls_access") as mock_validate, \
+                patch("backend.services.northbound_service.get_file_url", return_value={
+                    "success": True,
+                    "url": "https://proxy.example/file"
+                }) as mock_get_url:
+            result = ns._normalize_northbound_attachments(
+                ["/nexent/attachments/user123/report.pdf"],
+                "user123",
+                "tenant123",
+            )
+
+        mock_validate.assert_called_once_with(
+            ["s3://nexent/attachments/user123/report.pdf"],
+            "user123",
+            "tenant123",
+        )
+        mock_get_url.assert_called_once_with(
+            object_name="attachments/user123/report.pdf",
+            expires=86400,
+        )
+        assert result == [{
+            "name": "report.pdf",
+            "object_name": "attachments/user123/report.pdf",
+            "url": "/nexent/attachments/user123/report.pdf",
+            "type": "file",
+            "size": 0,
+            "description": "",
+            "presigned_url": "https://proxy.example/file",
+        }]
+
+
+class TestNorthboundFileDescriptorAndUpload:
+    """Tests for _build_northbound_file_descriptor and upload_files_for_northbound."""
+
+    def test_build_file_descriptor_defaults(self):
+        """Test that descriptor uses file_name and includes presigned_url when present."""
+        result = ns._build_northbound_file_descriptor({
+            "file_name": "report.pdf",
+            "object_name": "attachments/user123/report.pdf",
+            "presigned_url": "https://proxy.example/file",
+        })
+
+        assert result["name"] == "report.pdf"
+        assert result["object_name"] == "attachments/user123/report.pdf"
+        assert result["type"] == "file"
+        assert result["size"] == 0
+        assert result["url"] == "/nexent/attachments/user123/report.pdf"
+        assert result["description"] == ""
+        assert result["presigned_url"] == "https://proxy.example/file"
+
+    def test_build_file_descriptor_with_original_filename(self):
+        """Test that original_file_name parameter takes precedence over upload_result file_name."""
+        result = ns._build_northbound_file_descriptor({
+            "file_name": "auto_generated_name.md",
+            "object_name": "attachments/user123/20260101120000_abc123.md",
+            "file_size": 0,
+        }, original_file_name="original-document.pdf", file_size=2048)
+
+        assert result["name"] == "original-document.pdf"
+        assert result["object_name"] == "attachments/user123/20260101120000_abc123.md"
+        assert result["type"] == "file"
+        assert result["size"] == 2048
+        assert result["url"] == "/nexent/attachments/user123/20260101120000_abc123.md"
+        assert result["description"] == ""
+
+    def test_build_file_descriptor_with_type_and_size(self):
+        """Test that explicit file_type and file_size override upload_result values."""
+        result = ns._build_northbound_file_descriptor({
+            "file_name": "image.png",
+            "object_name": "attachments/user123/image.png",
+            "file_size": 1024,
+            "content_type": "image/png",
+        }, file_type="image", file_size=2048)
+
+        assert result["name"] == "image.png"
+        assert result["object_name"] == "attachments/user123/image.png"
+        assert result["type"] == "image"
+        assert result["size"] == 2048
+        assert result["url"] == "/nexent/attachments/user123/image.png"
+        assert result["description"] == ""
+
+    def test_build_file_descriptor_no_filename(self):
+        """Test that basename(object_name) is used when no filename is provided."""
+        result = ns._build_northbound_file_descriptor({
+            "object_name": "attachments/user123/report.pdf",
+        })
+        assert result["name"] == "report.pdf"
+        assert result["object_name"] == "attachments/user123/report.pdf"
+        assert result["type"] == "file"
+
+    def test_build_file_descriptor_no_presigned_url(self):
+        """Test that presigned_url is omitted when not present in upload_result."""
+        result = ns._build_northbound_file_descriptor({
+            "file_name": "report.pdf",
+            "object_name": "attachments/user123/report.pdf",
+        })
+        assert "presigned_url" not in result
+
+    @pytest.mark.asyncio
+    async def test_upload_files_for_northbound_success(self):
+        """Test successful upload returns normalized descriptors and summary counts."""
+        ctx = ns.NorthboundContext(
+            request_id="req-123",
+            tenant_id="tenant123",
+            user_id="user123",
+            authorization="Bearer token",
+            token_id=1,
+        )
+        mock_file = MagicMock()
+        mock_file.filename = "report.pdf"
+
+        with patch(
+            "backend.services.northbound_service.resolve_minio_upload_folder",
+            return_value="attachments/user123"
+        ), patch(
+            "backend.services.northbound_service.upload_to_minio",
+            AsyncMock(return_value=[{
+                "success": True,
+                "file_name": "report.pdf",
+                "object_name": "attachments/user123/report.pdf",
+                "content_type": "application/pdf",
+                "file_size": 1024,
+                "presigned_url": "https://proxy.example/file",
+            }])
+        ):
+            result = await ns.upload_files_for_northbound(ctx, [mock_file])
+
+        assert result["summary"]["uploaded"] == 1
+        assert result["summary"]["failed"] == 0
+        assert result["files"][0]["object_name"] == "attachments/user123/report.pdf"
+        assert result["files"][0]["name"] == "report.pdf"
+        assert result["files"][0]["type"] == "file"
+        assert result["files"][0]["size"] == 1024
+        assert result["files"][0]["url"] == "/nexent/attachments/user123/report.pdf"
+        assert result["files"][0]["description"] == ""
+
+    @pytest.mark.asyncio
+    async def test_upload_files_for_northbound_no_files(self):
+        """Test that uploading with no files raises ValueError."""
+        ctx = ns.NorthboundContext(
+            request_id="req-123",
+            tenant_id="tenant123",
+            user_id="user123",
+            authorization="Bearer token",
+        )
+        with pytest.raises(ValueError) as exc_info:
+            await ns.upload_files_for_northbound(ctx, [])
+        assert "No files in the request" in str(exc_info.value)
+
+    @pytest.mark.asyncio
+    async def test_upload_files_for_northbound_all_failed(self):
+        """Test that all-failed uploads raise ValueError."""
+        ctx = ns.NorthboundContext(
+            request_id="req-123",
+            tenant_id="tenant123",
+            user_id="user123",
+            authorization="Bearer token",
+        )
+        mock_file = MagicMock()
+        mock_file.filename = "report.pdf"
+
+        with patch(
+            "backend.services.northbound_service.resolve_minio_upload_folder",
+            return_value="attachments/user123"
+        ), patch(
+            "backend.services.northbound_service.upload_to_minio",
+            AsyncMock(return_value=[{
+                "success": False,
+                "file_name": "report.pdf",
+                "object_name": None,
+            }])
+        ):
+            with pytest.raises(ValueError) as exc_info:
+                await ns.upload_files_for_northbound(ctx, [mock_file])
+        assert "No valid files uploaded" in str(exc_info.value)
+
+    @pytest.mark.asyncio
+    async def test_upload_files_for_northbound_mixed_results(self):
+        """Test that mixed success/failure results are reflected in the summary counts."""
+        ctx = ns.NorthboundContext(
+            request_id="req-123",
+            tenant_id="tenant123",
+            user_id="user123",
+            authorization="Bearer token",
+        )
+        mock_file1 = MagicMock()
+        mock_file1.filename = "report.pdf"
+        mock_file2 = MagicMock()
+        mock_file2.filename = "image.png"
+
+        with patch(
+            "backend.services.northbound_service.resolve_minio_upload_folder",
+            return_value="attachments/user123"
+        ), patch(
+            "backend.services.northbound_service.upload_to_minio",
+            AsyncMock(return_value=[
+                {
+                    "success": True,
+                    "file_name": "report.pdf",
+                    "object_name": "attachments/user123/report.pdf",
+                },
+                {
+                    "success": False,
+                    "file_name": "image.png",
+                    "object_name": None,
+                },
+            ])
+        ):
+            result = await ns.upload_files_for_northbound(ctx, [mock_file1, mock_file2])
+
+        assert result["summary"]["total"] == 2
+        assert result["summary"]["uploaded"] == 1
+        assert result["summary"]["failed"] == 1
diff --git a/test/backend/services/test_prompt_service.py b/test/backend/services/test_prompt_service.py
index 51964cef6..4d8e4f3f6 100644
--- a/test/backend/services/test_prompt_service.py
+++ b/test/backend/services/test_prompt_service.py
@@ -4,12 +4,71 @@
 import unittest
 import json
 import sys
+import atexit
 from unittest.mock import patch, MagicMock
 
+_MODULE_PATCH_SENTINEL = object()
+_MODULE_PATCH_NAMES = [
+    'boto3',
+    'elasticsearch',
+    'sqlalchemy',
+    'sqlalchemy.create_engine',
+    'sqlalchemy.orm',
+    'sqlalchemy.dialects',
+    'sqlalchemy.dialects.postgresql',
+    'sqlalchemy.sql',
+    'database.agent_db',
+    'database.tool_db',
+    'database.model_management_db',
+    'database.knowledge_db',
+    'database.client',
+    'database.db_models',
+    'utils.llm_utils',
+    'utils.prompt_template_utils',
+    'services.agent_service',
+    'services.prompt_template_service',
+    'nexent',
+    'nexent.core',
+    'nexent.core.agents',
+    'nexent.core.agents.agent_model',
+    'nexent.storage',
+    'nexent.storage.storage_client_factory',
+    'nexent.storage.minio_config',
+    'nexent.vector_database',
+    'nexent.memory',
+    'nexent.monitor',
+]
+_MODULE_PATCH_ORIGINALS = {
+    name: sys.modules.get(name, _MODULE_PATCH_SENTINEL)
+    for name in _MODULE_PATCH_NAMES
+}
+
+
+def _restore_patched_modules() -> None:
+    for name, original in _MODULE_PATCH_ORIGINALS.items():
+        if original is _MODULE_PATCH_SENTINEL:
+            sys.modules.pop(name, None)
+        else:
+            sys.modules[name] = original
+
+
+atexit.register(_restore_patched_modules)
+
+
+class MockToolConfig:
+    def __init__(self, *args, **kwargs):
+        for key, value in kwargs.items():
+            setattr(self, key, value)
+
+    def model_dump(self, **kwargs):
+        return {k: v for k, v in self.__dict__.items() if not k.startswith('_')}
+
 # Mock nexent module hierarchy BEFORE any backend imports that depend on it
 nexent_mock = MagicMock()
 nexent_core_mock = MagicMock()
 nexent_core_agents_mock = MagicMock()
+nexent_agent_model_mock = MagicMock()
+nexent_agent_model_mock.ToolConfig = MockToolConfig
 nexent_storage_mock = MagicMock()
 nexent_storage_storage_client_factory_mock = MagicMock()
 nexent_storage_minio_config_mock = MagicMock()
@@ -20,6 +79,7 @@
 sys.modules['nexent'] = nexent_mock
 sys.modules['nexent.core'] = nexent_core_mock
 sys.modules['nexent.core.agents'] = nexent_core_agents_mock
+sys.modules['nexent.core.agents.agent_model'] = nexent_agent_model_mock
 sys.modules['nexent.storage'] = nexent_storage_mock
 sys.modules['nexent.storage.storage_client_factory'] = nexent_storage_storage_client_factory_mock
 sys.modules['nexent.storage.minio_config'] = nexent_storage_minio_config_mock
@@ -43,6 +103,7 @@
 
 from consts.error_code import ErrorCode
 from consts.exceptions import AppException
+from consts.const import ENABLE_JIUWEN_SDK
 
 # Mock boto3 and minio client before importing the module under test
 import sys
@@ -60,39 +121,29 @@
 # This prevents real AWS/MinIO/Elasticsearch calls during import
 patch('botocore.client.BaseClient._make_api_call', return_value={}).start()
 
-# Patch storage factory and MinIO config validation to avoid errors during initialization
-# These patches must be started before any imports that use MinioClient
-storage_client_mock = MagicMock()
 minio_client_mock = MagicMock()
 minio_client_mock._ensure_bucket_exists = MagicMock()
 minio_client_mock.client = MagicMock()
-patch('nexent.storage.storage_client_factory.create_storage_client_from_config', return_value=storage_client_mock).start()
-patch('nexent.storage.minio_config.MinIOStorageConfig.validate', lambda self: None).start()
-patch('backend.database.client.MinioClient', return_value=minio_client_mock).start()
-patch('database.client.MinioClient', return_value=minio_client_mock).start()
-patch('backend.database.client.minio_client', minio_client_mock).start()
-patch('nexent.vector_database.elasticsearch_core.ElasticSearchCore', return_value=MagicMock()).start()
-patch('nexent.vector_database.elasticsearch_core.Elasticsearch', return_value=MagicMock()).start()
-patch('elasticsearch.Elasticsearch', return_value=MagicMock()).start()
-
-from jinja2 import StrictUndefined
 
 # Mock database submodules BEFORE importing prompt_service
-sys.modules['database'] = MagicMock()
 sys.modules['database.agent_db'] = MagicMock()
 sys.modules['database.tool_db'] = MagicMock()
 sys.modules['database.model_management_db'] = MagicMock()
 sys.modules['database.knowledge_db'] = MagicMock()
-sys.modules['database.client'] = MagicMock()
+mock_database_client = MagicMock()
+mock_database_client.MinioClient.return_value = minio_client_mock
+mock_database_client.minio_client = minio_client_mock
+sys.modules['database.client'] = mock_database_client
+sys.modules['backend.database.client'] = mock_database_client
 sys.modules['database.db_models'] = MagicMock()
 
+from jinja2 import StrictUndefined
+
 # Mock utils
-sys.modules['utils'] = MagicMock()
 sys.modules['utils.llm_utils'] = MagicMock()
 sys.modules['utils.prompt_template_utils'] = MagicMock()
 
 # Mock services
-sys.modules['services'] = MagicMock()
 sys.modules['services.agent_service'] = MagicMock()
 sys.modules['services.prompt_template_service'] = MagicMock()
 
@@ -103,6 +154,9 @@
     join_info_for_generate_system_prompt,
     join_info_for_optimize_prompt_section,
     optimize_prompt_section_impl,
+    PromptOptimizationService,
+    OptimizeRequest,
+    OptimizeResult,
 )
 
 
@@ -2062,6 +2116,128 @@ def mock_llm(model_id, content, sys_prompt, callback, tenant_id):
 
         self.assertGreater(len(result_list), 0)
 
+class TestPromptOptimizationService(unittest.TestCase):
+    """Tests for PromptOptimizationService Jiuwen SDK integration"""
+
+    @patch('backend.services.prompt_service.optimize_prompt_section_impl')
+    @patch('backend.services.prompt_service.ENABLE_JIUWEN_SDK', False)
+    def test_optimize_nexent_fallback_general_mode(self, mock_impl):
+        """nexent 模式: mode=general 应该调用 optimize_prompt_section_impl"""
+        mock_impl.return_value = {
+            "section_type": "duty",
+            "section_title": "智能体角色",
+            "original_content": "old",
+            "optimized_content": "new",
+        }
+
+        service = PromptOptimizationService(model_id=1, tenant_id="t", language="zh")
+        req = OptimizeRequest(
+            agent_id=1, model_id=1, task_description="task",
+            section_type="duty", section_title="智能体角色",
+            current_content="old", feedback="improve",
+            mode="general",
+        )
+        result = service.optimize(req)
+
+        self.assertEqual(result.source, "nexent")
+        self.assertEqual(result.optimized_content, "new")
+        mock_impl.assert_called_once()
+
+    @patch('backend.services.prompt_service.ENABLE_JIUWEN_SDK', False)
+    def test_optimize_nexent_fallback_insert_mode_raises(self):
+        """nexent 模式: mode=insert 应该抛出 NexentCapabilityError"""
+        from adapters.exception import NexentCapabilityError
+
+        service = PromptOptimizationService(model_id=1, tenant_id="t", language="zh")
+        req = OptimizeRequest(
+            agent_id=1, model_id=1, task_description="task",
+            section_type="duty", section_title="title",
+            current_content="old", feedback="improve",
+            mode="insert",
+        )
+        with self.assertRaises(NexentCapabilityError) as ctx:
+            service.optimize(req)
+        self.assertIn("insert", str(ctx.exception))
+
+    @patch('backend.services.prompt_service.ENABLE_JIUWEN_SDK', False)
+    def test_optimize_nexent_fallback_select_mode_raises(self):
+        """nexent 模式: mode=select 应该抛出 NexentCapabilityError"""
+        from adapters.exception import NexentCapabilityError
+
+        service = PromptOptimizationService(model_id=1, tenant_id="t", language="zh")
+        req = OptimizeRequest(
+            agent_id=1, model_id=1, task_description="task",
+            section_type="duty", section_title="title",
+            current_content="old", feedback="improve",
+            mode="select",
+        )
+        with self.assertRaises(NexentCapabilityError):
+            service.optimize(req)
+
+    @patch('backend.services.prompt_service.ENABLE_JIUWEN_SDK', False)
+    def test_optimize_badcase_nexent_raises(self):
+        """nexent 模式: badcase 优化应该抛出 NexentCapabilityError"""
+        from adapters.exception import NexentCapabilityError
+
+        service = PromptOptimizationService(model_id=1, tenant_id="t", language="zh")
+        with self.assertRaises(NexentCapabilityError) as ctx:
+            service.optimize_badcase(
+                current_content="old",
+                bad_cases=[{"question": "Q1", "answer": "A1"}],
+                agent_id=1, section_type="duty", section_title="title",
+            )
+        self.assertIn("badcase", str(ctx.exception))
+
+    @patch('backend.services.prompt_service.ENABLE_JIUWEN_SDK', True)
+    def test_is_jiuwen_mode_available_env_disabled(self):
+        """开关关闭时 Jiuwen SDK 不可用"""
+        from consts.const import ENABLE_JIUWEN_SDK
+
+        # Patch ENABLE_JIUWEN_SDK to False
+        with patch('backend.services.prompt_service.ENABLE_JIUWEN_SDK', False):
+            service = PromptOptimizationService(model_id=1, tenant_id="t", language="zh")
+            self.assertFalse(service.is_jiuwen_mode_available())
+
+    @patch('backend.services.prompt_service.ENABLE_JIUWEN_SDK', True)
+    def test_is_jiuwen_mode_available_openjiuwen_missing(self):
+        """openjiuwen 未安装时 Jiuwen SDK 不可用"""
+        service = PromptOptimizationService(model_id=1, tenant_id="t", language="zh")
+        with patch('builtins.__import__', side_effect=ModuleNotFoundError("No module named 'openjiuwen'")):
+            self.assertFalse(service.is_jiuwen_mode_available())
+
+    def test_optimize_request_dataclass_fields(self):
+        """OptimizeRequest dataclass 所有字段正确"""
+        req = OptimizeRequest(
+            agent_id=1, model_id=2, task_description="task",
+            section_type="duty", section_title="title",
+            current_content="old", feedback="improve",
+            mode="insert", start_pos=5, end_pos=10,
+            tool_ids=[1, 2], sub_agent_ids=[3],
+            knowledge_base_display_names=["kb1"],
+        )
+        self.assertEqual(req.agent_id, 1)
+        self.assertEqual(req.model_id, 2)
+        self.assertEqual(req.mode, "insert")
+        self.assertEqual(req.start_pos, 5)
+        self.assertEqual(req.end_pos, 10)
+        self.assertEqual(req.tool_ids, [1, 2])
+        self.assertEqual(req.sub_agent_ids, [3])
+        self.assertEqual(req.knowledge_base_display_names, ["kb1"])
+
+    def test_optimize_result_dataclass_fields(self):
+        """OptimizeResult dataclass 所有字段正确"""
+        res = OptimizeResult(
+            optimized_content="new",
+            source="jiuwen",
+            section_type="duty",
+            section_title="title",
+            original_content="old",
+        )
+        self.assertEqual(res.optimized_content, "new")
+        self.assertEqual(res.source, "jiuwen")
+        self.assertEqual(res.section_type, "duty")
+        self.assertEqual(res.section_title, "title")
+        self.assertEqual(res.original_content, "old")
     @patch('backend.services.prompt_service.get_enabled_sub_agent_description_for_generate_prompt')
     @patch('backend.services.prompt_service.get_enabled_tool_description_for_generate_prompt')
     def test_generate_and_save_system_prompt_impl_auto_detect_no_resources(
diff --git a/test/backend/services/test_prompt_template_service.py b/test/backend/services/test_prompt_template_service.py
index 34415b203..48b27cd4c 100644
--- a/test/backend/services/test_prompt_template_service.py
+++ b/test/backend/services/test_prompt_template_service.py
@@ -16,6 +16,7 @@ def _reset_prompt_template_service_modules():
     yield
     sys.modules.pop("services.prompt_template_service", None)
     sys.modules.pop("database.prompt_template_db", None)
+    sys.modules.pop("consts.model", None)
 
 
 @pytest.fixture
@@ -23,20 +24,30 @@ def prompt_template_models(monkeypatch):
     if BACKEND_PATH not in sys.path:
         sys.path.insert(0, BACKEND_PATH)
 
-    nexent_module = types.ModuleType("nexent")
-    nexent_core_module = types.ModuleType("nexent.core")
-    nexent_agents_module = types.ModuleType("nexent.core.agents")
-    agent_model_module = types.ModuleType("nexent.core.agents.agent_model")
-    agent_model_module.ToolConfig = type("ToolConfig", (), {})
+    consts_model_module = types.ModuleType("consts.model")
 
-    monkeypatch.setitem(sys.modules, "nexent", nexent_module)
-    monkeypatch.setitem(sys.modules, "nexent.core", nexent_core_module)
-    monkeypatch.setitem(sys.modules, "nexent.core.agents", nexent_agents_module)
-    monkeypatch.setitem(sys.modules, "nexent.core.agents.agent_model", agent_model_module)
+    class PromptTemplateContentRequest:
+        def __init__(self, **kwargs):
+            for key, value in kwargs.items():
+                setattr(self, key, value)
+
+        def model_dump(self):
+            return dict(self.__dict__)
+
+    class PromptTemplateRequest:
+        def __init__(self, template_name, description, template_type, template_content_zh, template_content_en=None):
+            self.template_name = template_name
+            self.description = description
+            self.template_type = template_type
+            self.template_content_zh = template_content_zh
+            self.template_content_en = template_content_en
+
+    consts_model_module.PromptTemplateRequest = PromptTemplateRequest
+    consts_model_module.PromptTemplateContentRequest = PromptTemplateContentRequest
+    monkeypatch.setitem(sys.modules, "consts.model", consts_model_module)
 
-    consts_model = importlib.import_module("consts.model")
     consts_exceptions = importlib.import_module("consts.exceptions")
-    return consts_model, consts_exceptions
+    return consts_model_module, consts_exceptions
 
 
 @pytest.fixture
diff --git a/test/backend/services/test_tool_configuration_service.py b/test/backend/services/test_tool_configuration_service.py
index 29d2f75f6..37035b839 100644
--- a/test/backend/services/test_tool_configuration_service.py
+++ b/test/backend/services/test_tool_configuration_service.py
@@ -4720,6 +4720,37 @@ def test_import_openapi_service_extract_title_as_fallback(self, mock_logger, moc
         call_kwargs = mock_upsert.call_args.kwargs
         assert call_kwargs["description"] == "API Title Only"
 
+    @patch('backend.services.tool_configuration_service.upsert_openapi_service')
+    @patch('backend.services.tool_configuration_service.logger')
+    def test_import_openapi_service_with_headers_template(self, mock_logger, mock_upsert):
+        """Test import_openapi_service passes headers_template to upsert."""
+        mock_upsert.return_value = {"service_name": "test_service"}
+        headers_template = {
+            "Authorization": "Bearer {{token}}",
+            "X-Tenant-ID": "{{tenant_id}}"
+        }
+
+        openapi_json = {
+            "info": {"description": "Test API"},
+            "paths": {}
+        }
+
+        from backend.services.tool_configuration_service import import_openapi_service
+        result = import_openapi_service(
+            service_name="test_service",
+            openapi_json=openapi_json,
+            server_url="http://api.example.com",
+            tenant_id="tenant1",
+            user_id="user1",
+            headers_template=headers_template
+        )
+
+        assert result["service_name"] == "test_service"
+        call_kwargs = mock_upsert.call_args.kwargs
+        assert call_kwargs["headers_template"] == headers_template
+        assert call_kwargs["description"] == "Test API"
+        mock_logger.info.assert_called_once()
+
     @patch('backend.services.tool_configuration_service.upsert_openapi_service')
     @patch('backend.services.tool_configuration_service.logger')
     def test_import_openapi_service_overrides_servers_url(self, mock_logger, mock_upsert):
diff --git a/test/backend/services/test_vectordatabase_service.py b/test/backend/services/test_vectordatabase_service.py
index 952aaad79..0fcb851c4 100644
--- a/test/backend/services/test_vectordatabase_service.py
+++ b/test/backend/services/test_vectordatabase_service.py
@@ -1050,7 +1050,7 @@ def test_list_indices_with_stats(self, mock_get_knowledge, mock_get_user_tenant,
         mock_get_knowledge.return_value = [
             {"index_name": "index1",
              "embedding_model_name": "test-model", "group_ids": "1,2", "knowledge_sources": "elasticsearch",
-             "ingroup_permission": "EDIT", "tenant_id": "test_tenant"},
+             "ingroup_permission": "EDIT", "tenant_id": "test_tenant", "preserve_source_file": False},
             {"index_name": "index2", "embedding_model_name": "test-model",
              "group_ids": "", "knowledge_sources": "elasticsearch", "ingroup_permission": "READ_ONLY",
              "tenant_id": "test_tenant"}
@@ -1078,6 +1078,10 @@ def test_list_indices_with_stats(self, mock_get_knowledge, mock_get_user_tenant,
         # index2 has empty group_ids, so it gets the tenant default group [1]
         self.assertEqual(result["indices_info"][1]["group_ids"], [1])
 
+        # Verify preserve_source_file is included in indices_info
+        self.assertFalse(result["indices_info"][0]["preserve_source_file"])
+        self.assertTrue(result["indices_info"][1]["preserve_source_file"])
+
         self.mock_vdb_core.get_user_indices.assert_called_once_with("*")
         self.mock_vdb_core.get_indices_detail.assert_called_once_with(
             ["index1", "index2"])
@@ -2269,6 +2273,78 @@ def test_delete_documents(self, mock_delete_file, mock_update_last_doc):
         # Verify that delete_file was called with the correct path
         mock_delete_file.assert_called_once_with("test_path")
 
+    @patch('backend.services.vectordatabase_service.delete_file')
+    @patch('backend.services.vectordatabase_service.file_exists', return_value=False)
+    def test_delete_source_file(self, mock_file_exists, mock_delete_file):
+        mock_delete_file.return_value = {"success": True}
+        result = ElasticSearchService.delete_source_file(
+            "knowledge_base/doc.pdf"
+        )
+        self.assertTrue(result["deleted_minio"])
+        mock_delete_file.assert_called()
+
+    @patch(
+        'backend.services.vectordatabase_service.get_all_files_status',
+        new_callable=AsyncMock,
+    )
+    @patch('backend.services.vectordatabase_service.delete_file')
+    def test_delete_document_by_scope_source_only(
+        self, mock_delete_file, mock_get_status
+    ):
+        mock_get_status.return_value = {
+            "knowledge_base/doc.pdf": {"state": "COMPLETED"}
+        }
+        mock_delete_file.return_value = {"success": True}
+
+        result = asyncio.run(
+            ElasticSearchService.delete_document_by_scope(
+                "test_index",
+                "knowledge_base/doc.pdf",
+                "source_only",
+                self.mock_vdb_core,
+            )
+        )
+
+        self.assertEqual(result["scope"], "source_only")
+        self.assertEqual(result["deleted_es_count"], 0)
+        self.mock_vdb_core.delete_documents.assert_not_called()
+
+    @patch(
+        'backend.services.vectordatabase_service.get_all_files_status',
+        new_callable=AsyncMock,
+    )
+    def test_delete_document_by_scope_rejects_processing(
+        self, mock_get_status
+    ):
+        mock_get_status.return_value = {
+            "knowledge_base/doc.pdf": {"state": "PROCESSING"}
+        }
+
+        with self.assertRaises(ValueError):
+            asyncio.run(
+                ElasticSearchService.delete_document_by_scope(
+                    "test_index",
+                    "knowledge_base/doc.pdf",
+                    "source_only",
+                    self.mock_vdb_core,
+                )
+            )
+
+    @patch('backend.services.vectordatabase_service.file_exists', return_value=False)
+    def test_compute_source_available_completed_missing_minio(self, _mock_exists):
+        available = ElasticSearchService._compute_source_available({
+            "path_or_url": "knowledge_base/doc.pdf",
+            "status": "COMPLETED",
+        })
+        self.assertFalse(available)
+
+    def test_compute_source_available_processing_defaults_true(self):
+        available = ElasticSearchService._compute_source_available({
+            "path_or_url": "knowledge_base/doc.pdf",
+            "status": "PROCESSING",
+        })
+        self.assertTrue(available)
+
     @patch('backend.services.vectordatabase_service.update_last_doc_update_time')
     @patch('backend.services.vectordatabase_service.get_redis_service')
     def test_index_documents_respects_cancellation_flag(self, mock_get_redis_service, mock_update_last_doc):
@@ -4177,73 +4253,172 @@ def test_get_embedding_model_multi_embedding_type(self, mock_get_model_by_displa
             # Restart the mock for other tests
             self.get_embedding_model_patcher.start()
 
-    def test_get_embedding_model_unknown_type(self):
+    @patch('backend.services.vectordatabase_service.get_model_records')
+    def test_get_embedding_model_no_model_name_no_records(self, mock_get_model_records):
         """
-        Test get_embedding_model when no model_name is provided.
+        Test get_embedding_model when no model_name is provided and no records exist.
 
         This test verifies that:
-        1. When no model_name is provided, the function returns (None, None)
-        2. The function handles missing model_name gracefully
+        1. When no model_name is provided and no model records exist, returns (None, None)
+        2. Embedding models are queried before multi_embedding models
         """
-        # Stop the mock from setUp to test the real function
+        mock_get_model_records.side_effect = [
+            [],
+            [],
+        ]
+
         self.get_embedding_model_patcher.stop()
 
         try:
-            # Execute - now we can call the real function
             from backend.services.vectordatabase_service import get_embedding_model
             result, model_id = get_embedding_model("test_tenant")
 
-            # Assert
             self.assertIsNone(result)
             self.assertIsNone(model_id)
+            mock_get_model_records.assert_any_call({"model_type": "embedding"}, "test_tenant")
+            mock_get_model_records.assert_any_call({"model_type": "multi_embedding"}, "test_tenant")
         finally:
-            # Restart the mock for other tests
             self.get_embedding_model_patcher.start()
 
-    def test_get_embedding_model_empty_type(self):
+    @patch('backend.services.vectordatabase_service.get_model_records')
+    def test_get_embedding_model_default_embedding_record(self, mock_get_model_records):
+        """
+        Test get_embedding_model falls back to the newest embedding model when model_name is omitted.
         """
-        Test get_embedding_model when no model_name is provided.
+        mock_get_model_records.return_value = [{
+            "model_id": 101,
+            "model_type": "embedding",
+            "model_name": "default-embedding",
+            "model_repo": "openai",
+            "api_key": "test_api_key",
+            "base_url": "https://test.api.com",
+            "max_tokens": 1024,
+            "ssl_verify": True,
+        }]
 
-        This test verifies that:
-        1. When no model_name is provided, the function returns (None, None)
-        2. The function handles missing model_name gracefully
+        self.get_embedding_model_patcher.stop()
+
+        try:
+            with patch('backend.services.vectordatabase_service.OpenAICompatibleEmbedding') as mock_embedding_class, \
+                    patch('backend.services.vectordatabase_service.get_model_name_from_config') as mock_get_model_name:
+                mock_embedding_instance = MagicMock()
+                mock_embedding_class.return_value = mock_embedding_instance
+                mock_get_model_name.return_value = "default-embedding"
+
+                from backend.services.vectordatabase_service import get_embedding_model
+                result, model_id = get_embedding_model("test_tenant")
+
+                self.assertEqual(result, mock_embedding_instance)
+                self.assertEqual(model_id, 101)
+                mock_get_model_records.assert_called_once_with({"model_type": "embedding"}, "test_tenant")
+        finally:
+            self.get_embedding_model_patcher.start()
+
+    @patch('backend.services.vectordatabase_service.get_model_records')
+    def test_get_embedding_model_fallback_to_multi_embedding(self, mock_get_model_records):
         """
-        # Stop the mock from setUp to test the real function
+        Test get_embedding_model falls back to multi_embedding when no embedding model exists.
+        """
+        mock_get_model_records.side_effect = [
+            [],
+            [{
+                "model_id": 202,
+                "model_type": "multi_embedding",
+                "model_name": "default-multi-embedding",
+                "model_repo": "jina",
+                "api_key": "test_api_key",
+                "base_url": "https://test.api.com",
+                "max_tokens": 2048,
+                "ssl_verify": True,
+            }],
+        ]
+
         self.get_embedding_model_patcher.stop()
 
         try:
-            # Execute - now we can call the real function
-            from backend.services.vectordatabase_service import get_embedding_model
-            result, model_id = get_embedding_model("test_tenant")
+            with patch('backend.services.vectordatabase_service.JinaEmbedding') as mock_embedding_class, \
+                    patch('backend.services.vectordatabase_service.get_model_name_from_config') as mock_get_model_name:
+                mock_embedding_instance = MagicMock()
+                mock_embedding_class.return_value = mock_embedding_instance
+                mock_get_model_name.return_value = "default-multi-embedding"
 
-            # Assert
-            self.assertIsNone(result)
-            self.assertIsNone(model_id)
+                from backend.services.vectordatabase_service import get_embedding_model
+                result, model_id = get_embedding_model("test_tenant")
+
+                self.assertEqual(result, mock_embedding_instance)
+                self.assertEqual(model_id, 202)
+                self.assertEqual(mock_get_model_records.call_count, 2)
         finally:
-            # Restart the mock for other tests
             self.get_embedding_model_patcher.start()
 
-    def test_get_embedding_model_missing_type(self):
+    @patch('backend.services.vectordatabase_service.get_model_records')
+    def test_get_embedding_model_default_with_model_type_embedding(self, mock_get_model_records):
+        """
+        Test get_embedding_model queries by the provided model_type when model_name is omitted.
         """
-        Test get_embedding_model when no model_name is provided.
+        mock_get_model_records.return_value = [{
+            "model_id": 303,
+            "model_type": "embedding",
+            "model_name": "typed-embedding",
+            "model_repo": "openai",
+            "api_key": "test_api_key",
+            "base_url": "https://test.api.com",
+            "max_tokens": 1024,
+            "ssl_verify": True,
+        }]
 
-        This test verifies that:
-        1. When no model_name is provided, the function returns (None, None)
-        2. The function handles missing model_name gracefully
+        self.get_embedding_model_patcher.stop()
+
+        try:
+            with patch('backend.services.vectordatabase_service.OpenAICompatibleEmbedding') as mock_embedding_class, \
+                    patch('backend.services.vectordatabase_service.get_model_name_from_config') as mock_get_model_name:
+                mock_embedding_instance = MagicMock()
+                mock_embedding_class.return_value = mock_embedding_instance
+                mock_get_model_name.return_value = "typed-embedding"
+
+                from backend.services.vectordatabase_service import get_embedding_model
+                result, model_id = get_embedding_model("test_tenant", model_type="embedding")
+
+                self.assertEqual(result, mock_embedding_instance)
+                self.assertEqual(model_id, 303)
+                mock_get_model_records.assert_called_once_with({"model_type": "embedding"}, "test_tenant")
+        finally:
+            self.get_embedding_model_patcher.start()
+
+    @patch('backend.services.vectordatabase_service.get_model_records')
+    def test_get_embedding_model_default_with_model_type_multi_embedding(self, mock_get_model_records):
         """
-        # Stop the mock from setUp to test the real function
+        Test get_embedding_model queries multi_embedding records when model_type is specified.
+        """
+        mock_get_model_records.return_value = [{
+            "model_id": 404,
+            "model_type": "multi_embedding",
+            "model_name": "typed-multi-embedding",
+            "model_repo": "jina",
+            "api_key": "test_api_key",
+            "base_url": "https://test.api.com",
+            "max_tokens": 2048,
+            "ssl_verify": True,
+        }]
+
         self.get_embedding_model_patcher.stop()
 
         try:
-            # Execute - now we can call the real function
-            from backend.services.vectordatabase_service import get_embedding_model
-            result, model_id = get_embedding_model("test_tenant")
+            with patch('backend.services.vectordatabase_service.JinaEmbedding') as mock_embedding_class, \
+                    patch('backend.services.vectordatabase_service.get_model_name_from_config') as mock_get_model_name:
+                mock_embedding_instance = MagicMock()
+                mock_embedding_class.return_value = mock_embedding_instance
+                mock_get_model_name.return_value = "typed-multi-embedding"
 
-            # Assert
-            self.assertIsNone(result)
-            self.assertIsNone(model_id)
+                from backend.services.vectordatabase_service import get_embedding_model
+                result, model_id = get_embedding_model("test_tenant", model_type="multi_embedding")
+
+                self.assertEqual(result, mock_embedding_instance)
+                self.assertEqual(model_id, 404)
+                mock_get_model_records.assert_called_once_with(
+                    {"model_type": "multi_embedding"}, "test_tenant"
+                )
         finally:
-            # Restart the mock for other tests
             self.get_embedding_model_patcher.start()
 
     @patch('backend.services.vectordatabase_service.get_model_by_display_name')
diff --git a/test/backend/utils/test_auth_utils.py b/test/backend/utils/test_auth_utils.py
index af7fe0e1c..83b31a6ee 100644
--- a/test/backend/utils/test_auth_utils.py
+++ b/test/backend/utils/test_auth_utils.py
@@ -323,6 +323,22 @@ def test_get_current_user_id_with_mapping(monkeypatch):
     assert uid == "user-a" and tid == "tenant-a"
 
 
+def test_get_current_user_id_rejects_revoked_cas_session(monkeypatch):
+    monkeypatch.setattr(au, "IS_SPEED_MODE", False)
+    monkeypatch.setattr(au, "SUPABASE_JWT_SECRET", au.MOCK_JWT_SECRET_KEY)
+    monkeypatch.setattr(au, "SUPABASE_URL", "http://localhost:54321")
+    monkeypatch.setattr(au, "get_user_tenant_by_user_id",
+                        lambda u: {"tenant_id": "tenant-a"})
+    sys.modules["database.cas_session_db"] = MagicMock(
+        is_cas_session_active=MagicMock(return_value=False)
+    )
+
+    token = au.generate_session_jwt("user-a", 1000, session_id="cas-session-1")
+
+    with pytest.raises(UnauthorizedError, match="CAS session"):
+        au.get_current_user_id(token)
+
+
 def test_get_user_language_from_cookie():
     class Req:
         cookies = {"NEXT_LOCALE": "en"}
diff --git a/test/backend/utils/test_context_utils.py b/test/backend/utils/test_context_utils.py
index 66e789477..b58c46040 100644
--- a/test/backend/utils/test_context_utils.py
+++ b/test/backend/utils/test_context_utils.py
@@ -162,7 +162,6 @@ def test_empty_inputs_produces_skeleton(self):
             few_shots="Q: hi?\nA: Hello!",
             app_name="Test",
             app_description="Test",
-            time_str="2026-01-01",
             user_id="test",
             language="zh",
             is_manager=False,
@@ -184,7 +183,6 @@ class MockTool:
             few_shots="Q?",
             app_name="Test",
             app_description="Test",
-            time_str="2026-01-01",
             user_id="test",
             language="zh",
             is_manager=False,
@@ -207,7 +205,6 @@ class MockTool:
             few_shots="Q?",
             app_name="Test",
             app_description="Test",
-            time_str="2026-01-01",
             user_id="test",
             language="zh",
             is_manager=False,
diff --git a/test/backend/utils/test_memory_utils.py b/test/backend/utils/test_memory_utils.py
index 134c38923..b887ab79f 100644
--- a/test/backend/utils/test_memory_utils.py
+++ b/test/backend/utils/test_memory_utils.py
@@ -1,415 +1,352 @@
-import pytest
 import sys
-from unittest.mock import patch, MagicMock
+from types import SimpleNamespace
+from unittest.mock import MagicMock
+
+import pytest
 
 # Setup common mocks
-from test.common.test_mocks import setup_common_mocks, patch_minio_client_initialization, mock_constants
+from test.common.test_mocks import patch_minio_client_initialization, setup_common_mocks
 
 # Initialize common mocks
 mocks = setup_common_mocks()
 
 # Patch storage factory before importing
 with patch_minio_client_initialization():
-    from backend.utils.memory_utils import build_memory_config
+    from backend.utils.memory_utils import _sanitize_index_component, build_memory_config
 
 
 @pytest.fixture
 def mock_model_configs():
-    """Fixture to provide mock model configurations"""
+    """Fixture to provide mock model configurations."""
     llm_config = {
         "model_name": "gpt-4",
         "model_repo": "openai",
         "base_url": "https://api.openai.com/v1",
-        "api_key": "test-llm-key"
+        "api_key": "test-llm-key",
     }
     embedding_config = {
         "model_name": "text-embedding-ada-002",
         "model_repo": "openai",
         "base_url": "https://api.openai.com/v1",
         "api_key": "test-embed-key",
-        "max_tokens": 1536
+        "max_tokens": 1536,
     }
     return {
         "llm_config": llm_config,
-        "embedding_config": embedding_config
+        "embedding_config": embedding_config,
     }
 
 
 @pytest.fixture
 def mock_tenant_config_manager():
-    """Fixture to provide mock tenant config manager"""
+    """Fixture to provide mock tenant config manager."""
     return MagicMock()
 
 
-class TestMemoryUtils:
-    """Tests for backend.utils.memory_utils functions"""
+@pytest.fixture
+def model_mapping():
+    """Fixture to provide deterministic model config mapping."""
+    return {"llm": "llm", "embedding": "embedding"}
 
-    def test_build_memory_config_success(self, mocker, mock_constants, mock_model_configs, mock_tenant_config_manager):
-        """Builds a complete configuration successfully"""
-        # Use global fixtures for common mocks
-        mock_llm_config = mock_model_configs['llm_config']
-        mock_embed_config = mock_model_configs['embedding_config']
 
-        # Mock get_model_config return sequence
-        mock_tenant_config_manager.get_model_config.side_effect = [
-            mock_llm_config,  # LLM
-            mock_embed_config  # embedding
-        ]
+@pytest.fixture
+def mock_constants():
+    """Fixture to provide Elasticsearch-related constants."""
+    return SimpleNamespace(
+        ES_HOST="http://localhost:9200",
+        ES_API_KEY="test-es-key",
+        ES_USERNAME="elastic",
+        ES_PASSWORD="test-password",
+    )
 
-        # Mock get_model_name_from_config
-        mock_get_model_name = MagicMock()
-        mock_get_model_name.side_effect = [
-            "openai/gpt-4", "openai/text-embedding-ada-002"]
 
-        # Provide deterministic mapping for model config keys
-        model_mapping = {"llm": "llm", "embedding": "embedding"}
+@pytest.fixture
+def patch_memory_dependencies(mocker, mock_tenant_config_manager, mock_constants, model_mapping):
+    """Patch shared dependencies used by build_memory_config."""
+    mocker.patch("backend.utils.memory_utils.tenant_config_manager", mock_tenant_config_manager)
+    mocker.patch("backend.utils.memory_utils._c", mock_constants)
+    mocker.patch("backend.utils.memory_utils.MODEL_CONFIG_MAPPING", model_mapping)
+    return mock_tenant_config_manager, mock_constants
+
+
+class TestSanitizeIndexComponent:
+    """Tests for the index component sanitizer."""
+
+    @pytest.mark.parametrize(
+        ("value", "expected"),
+        [
+            ("OpenAI", "openai"),
+            ("azure/openai", "azure_openai"),
+            ("Model Name", "model_name"),
+            ("repo.name-1", "repo.name-1"),
+            ("MIXED/Chars@Here", "mixed_chars_here"),
+            ("", ""),
+        ],
+    )
+    def test_sanitize_index_component(self, value, expected):
+        """Sanitizer lowercases input and replaces unsupported characters."""
+        assert _sanitize_index_component(value) == expected
 
-        mocker.patch('backend.utils.memory_utils.tenant_config_manager',
-                     mock_tenant_config_manager)
-        mocker.patch('backend.utils.memory_utils._c', mock_constants)
-        mocker.patch(
-            'backend.utils.memory_utils.get_model_name_from_config', mock_get_model_name)
-        mocker.patch(
-            'backend.utils.memory_utils.MODEL_CONFIG_MAPPING', model_mapping)
 
-        # Execute
+class TestMemoryUtils:
+    """Tests for backend.utils.memory_utils functions."""
+
+    def test_build_memory_config_success(
+        self,
+        mocker,
+        mock_model_configs,
+        patch_memory_dependencies,
+        mock_tenant_config_manager,
+        mock_constants,
+    ):
+        """Builds a complete configuration successfully."""
+        mock_llm_config = mock_model_configs["llm_config"]
+        mock_embed_config = mock_model_configs["embedding_config"]
+        mock_tenant_config_manager.get_model_config.side_effect = [mock_llm_config, mock_embed_config]
+
+        mock_get_model_name = mocker.patch(
+            "backend.utils.memory_utils.get_model_name_from_config",
+            side_effect=["openai/gpt-4", "openai/text-embedding-ada-002"],
+        )
+
         result = build_memory_config("test-tenant-id")
 
-        # Structure
         assert isinstance(result, dict)
-        assert "llm" in result
-        assert "embedder" in result
-        assert "vector_store" in result
-        assert "telemetry" in result
-
-        # LLM
-        assert result["llm"]["provider"] == "openai"
-        assert result["llm"]["config"]["model"] == "openai/gpt-4"
-        assert result["llm"]["config"]["openai_base_url"] == "https://api.openai.com/v1"
-        assert result["llm"]["config"]["api_key"] == "test-llm-key"
-
-        # Embedder
-        assert result["embedder"]["provider"] == "openai"
-        assert result["embedder"]["config"]["model"] == "openai/text-embedding-ada-002"
-        assert result["embedder"]["config"]["openai_base_url"] == "https://api.openai.com/v1"
-        assert result["embedder"]["config"]["embedding_dims"] == 1536
-        assert result["embedder"]["config"]["api_key"] == "test-embed-key"
-
-        # Vector store
-        assert result["vector_store"]["provider"] == "elasticsearch"
-        assert result["vector_store"]["config"]["collection_name"] == "mem0_openai_text-embedding-ada-002_1536"
-        assert result["vector_store"]["config"]["host"] == "http://localhost"
-        assert result["vector_store"]["config"]["port"] == 9200
-        assert result["vector_store"]["config"]["embedding_model_dims"] == 1536
-        assert result["vector_store"]["config"]["verify_certs"] is False
-        assert result["vector_store"]["config"]["api_key"] == "test-es-key"
-        assert result["vector_store"]["config"]["user"] == "elastic"
-        assert result["vector_store"]["config"]["password"] == "test-password"
+        assert result["llm"] == {
+            "provider": "openai",
+            "config": {
+                "model": "openai/gpt-4",
+                "openai_base_url": "https://api.openai.com/v1",
+                "api_key": "test-llm-key",
+            },
+        }
+        assert result["embedder"] == {
+            "provider": "openai",
+            "config": {
+                "model": "openai/text-embedding-ada-002",
+                "openai_base_url": "https://api.openai.com/v1",
+                "embedding_dims": 1536,
+                "api_key": "test-embed-key",
+            },
+        }
+        assert result["vector_store"] == {
+            "provider": "elasticsearch",
+            "config": {
+                "collection_name": "mem0_openai_text-embedding-ada-002_1536",
+                "host": "http://localhost",
+                "port": 9200,
+                "embedding_model_dims": 1536,
+                "verify_certs": False,
+                "api_key": mock_constants.ES_API_KEY,
+                "user": mock_constants.ES_USERNAME,
+                "password": mock_constants.ES_PASSWORD,
+            },
+        }
+        assert result["telemetry"] == {"enabled": False}
 
-        # Telemetry
-        assert result["telemetry"]["enabled"] is False
-
-        # Called for both models
         assert mock_get_model_name.call_count == 2
         mock_get_model_name.assert_any_call(mock_llm_config)
         mock_get_model_name.assert_any_call(mock_embed_config)
-
-    def test_build_memory_config_missing_llm_config(self, mocker, mock_tenant_config_manager):
-        """Raises when LLM config is missing"""
-        mock_tenant_config_manager.get_model_config.side_effect = [
-            None,  # LLM is None
-            {"model_name": "test-embed", "max_tokens": 1536}  # embedding present
-        ]
-
-        mocker.patch('backend.utils.memory_utils.tenant_config_manager',
-                     mock_tenant_config_manager)
-
-        # Should raise
-        with pytest.raises(ValueError) as exc_info:
-            build_memory_config("test-tenant-id")
-
-        assert "Missing LLM configuration for tenant" in str(exc_info.value)
-
-    def test_build_memory_config_llm_config_missing_model_name(self, mocker):
-        """Raises when LLM config lacks model_name"""
-        mock_tenant_config_manager = MagicMock()
-        mock_tenant_config_manager.get_model_config.side_effect = [
-            {"api_key": "test-key"},  # LLM missing model_name
-            {"model_name": "test-embed", "max_tokens": 1536}  # embedding present
-        ]
-
-        mocker.patch('backend.utils.memory_utils.tenant_config_manager',
-                     mock_tenant_config_manager)
-
-        # Should raise
-        with pytest.raises(ValueError) as exc_info:
-            build_memory_config("test-tenant-id")
-
-        assert "Missing LLM configuration for tenant" in str(exc_info.value)
-
-    def test_build_memory_config_missing_embedding_config(self, mocker, mock_tenant_config_manager):
-        """Raises when embedding config is missing"""
-        mock_tenant_config_manager.get_model_config.side_effect = [
-            {"model_name": "test-llm"},  # LLM present
-            None  # embedding is None
-        ]
-
-        mocker.patch('backend.utils.memory_utils.tenant_config_manager',
-                     mock_tenant_config_manager)
-
-        # Should raise
-        with pytest.raises(ValueError) as exc_info:
-            build_memory_config("test-tenant-id")
-
-        assert "Missing embedding-model configuration for tenant" in str(
-            exc_info.value)
-
-    def test_build_memory_config_embedding_config_missing_max_tokens(self, mocker):
-        """Raises when embedding config lacks max_tokens"""
-        mock_tenant_config_manager = MagicMock()
-        mock_tenant_config_manager.get_model_config.side_effect = [
-            {"model_name": "test-llm"},  # LLM present
-            {"model_name": "test-embed"}  # embedding missing max_tokens
-        ]
-
-        mocker.patch('backend.utils.memory_utils.tenant_config_manager',
-                     mock_tenant_config_manager)
-
-        # Should raise
-        with pytest.raises(ValueError) as exc_info:
-            build_memory_config("test-tenant-id")
-
-        assert "Missing embedding-model configuration for tenant" in str(
-            exc_info.value)
-
-    def test_build_memory_config_missing_es_host(self, mocker):
-        """Raises when ES_HOST is missing"""
-        mock_tenant_config_manager = MagicMock()
+        assert mock_tenant_config_manager.get_model_config.call_count == 2
+
+    @pytest.mark.parametrize(
+        "llm_raw",
+        [None, {}, {"api_key": "test-key"}, {"model_name": ""}],
+    )
+    def test_build_memory_config_missing_llm_config(self, llm_raw, patch_memory_dependencies, mock_tenant_config_manager):
+        """Raises when LLM config is missing or incomplete."""
         mock_tenant_config_manager.get_model_config.side_effect = [
-            {"model_name": "test-llm"},
-            {"model_name": "test-embed", "max_tokens": 1536}
+            llm_raw,
+            {"model_name": "test-embed", "max_tokens": 1536},
         ]
 
-        mock_const = MagicMock()
-        mock_const.ES_HOST = None  # ES_HOST is None
-
-        mocker.patch('backend.utils.memory_utils.tenant_config_manager',
-                     mock_tenant_config_manager)
-        mocker.patch('backend.utils.memory_utils._c', mock_const)
-
-        # Should raise
-        with pytest.raises(ValueError) as exc_info:
+        with pytest.raises(ValueError, match="Missing LLM configuration for tenant"):
             build_memory_config("test-tenant-id")
 
-        assert "ES_HOST is not configured" in str(exc_info.value)
-
-    def test_build_memory_config_invalid_es_host_format(self, mocker):
-        """Raises when ES_HOST format is invalid"""
-        mock_tenant_config_manager = MagicMock()
+    @pytest.mark.parametrize(
+        "embed_raw",
+        [None, {}, {"model_name": "test-embed"}, {"model_name": "test-embed", "max_tokens": 0}],
+    )
+    def test_build_memory_config_missing_embedding_config(
+        self,
+        embed_raw,
+        patch_memory_dependencies,
+        mock_tenant_config_manager,
+    ):
+        """Raises when embedding config is missing or incomplete."""
         mock_tenant_config_manager.get_model_config.side_effect = [
             {"model_name": "test-llm"},
-            {"model_name": "test-embed", "max_tokens": 1536}
+            embed_raw,
         ]
 
-        mock_const = MagicMock()
-        mock_const.ES_HOST = "invalid-host"  # invalid format
-
-        mocker.patch('backend.utils.memory_utils.tenant_config_manager',
-                     mock_tenant_config_manager)
-        mocker.patch('backend.utils.memory_utils._c', mock_const)
-
-        # Should raise
-        with pytest.raises(ValueError) as exc_info:
+        with pytest.raises(ValueError, match="Missing embedding-model configuration for tenant"):
             build_memory_config("test-tenant-id")
 
-        assert "ES_HOST must include scheme, host and port" in str(
-            exc_info.value)
-
-    def test_build_memory_config_es_host_missing_scheme(self, mocker):
-        """Raises when ES_HOST is missing scheme"""
-        mock_tenant_config_manager = MagicMock()
-        mock_tenant_config_manager.get_model_config.side_effect = [
-            {"model_name": "test-llm"},
-            {"model_name": "test-embed", "max_tokens": 1536}
-        ]
-
-        mock_const = MagicMock()
-        mock_const.ES_HOST = "localhost:9200"  # missing scheme
-
-        mocker.patch('backend.utils.memory_utils.tenant_config_manager',
-                     mock_tenant_config_manager)
-        mocker.patch('backend.utils.memory_utils._c', mock_const)
+    @pytest.mark.parametrize("es_host", [None, ""])
+    def test_build_memory_config_missing_es_host(self, es_host, patch_memory_dependencies, mock_constants):
+        """Raises when ES_HOST is not configured."""
+        mock_constants.ES_HOST = es_host
 
-        # Should raise
-        with pytest.raises(ValueError) as exc_info:
+        with pytest.raises(ValueError, match="ES_HOST is not configured"):
             build_memory_config("test-tenant-id")
 
-        assert "ES_HOST must include scheme, host and port" in str(
-            exc_info.value)
-
-    def test_build_memory_config_es_host_missing_port(self, mocker):
-        """Raises when ES_HOST is missing port"""
-        mock_tenant_config_manager = MagicMock()
+    @pytest.mark.parametrize(
+        "es_host",
+        [
+            "invalid-host",
+            "localhost:9200",
+            "http://localhost",
+            "http://:9200",
+        ],
+    )
+    def test_build_memory_config_invalid_es_host_format(self, es_host, patch_memory_dependencies, mock_tenant_config_manager, mock_constants):
+        """Raises when ES_HOST is missing required URL parts."""
         mock_tenant_config_manager.get_model_config.side_effect = [
             {"model_name": "test-llm"},
-            {"model_name": "test-embed", "max_tokens": 1536}
+            {"model_name": "test-embed", "max_tokens": 1536},
         ]
+        mock_constants.ES_HOST = es_host
 
-        mock_const = MagicMock()
-        mock_const.ES_HOST = "http://localhost"  # missing port
-
-        mocker.patch('backend.utils.memory_utils.tenant_config_manager',
-                     mock_tenant_config_manager)
-        mocker.patch('backend.utils.memory_utils._c', mock_const)
-
-        # Should raise
-        with pytest.raises(ValueError) as exc_info:
+        with pytest.raises(
+            ValueError,
+            match="ES_HOST must include scheme, host and port, e.g. http://host:9200",
+        ):
             build_memory_config("test-tenant-id")
 
-        assert "ES_HOST must include scheme, host and port" in str(
-            exc_info.value)
-
-    def test_build_memory_config_with_https_es_host(self, mocker):
-        """HTTPS ES_HOST is parsed correctly and collection name composes"""
-        mock_tenant_config_manager = MagicMock()
+    def test_build_memory_config_with_https_es_host(
+        self,
+        mocker,
+        patch_memory_dependencies,
+        mock_tenant_config_manager,
+        mock_constants,
+    ):
+        """HTTPS ES host is parsed correctly."""
         mock_tenant_config_manager.get_model_config.side_effect = [
-            {"model_name": "test-llm", "model_repo": "openai",
-                "base_url": "https://api.openai.com/v1", "api_key": "test-llm-key"},
-            {"model_name": "test-embed", "model_repo": "openai",
-                "base_url": "https://api.openai.com/v1", "api_key": "test-embed-key", "max_tokens": 1536}
+            {
+                "model_name": "test-llm",
+                "model_repo": "openai",
+                "base_url": "https://api.openai.com/v1",
+                "api_key": "test-llm-key",
+            },
+            {
+                "model_name": "test-embed",
+                "model_repo": "openai",
+                "base_url": "https://api.openai.com/v1",
+                "api_key": "test-embed-key",
+                "max_tokens": 1536,
+            },
         ]
-
-        mock_const = MagicMock()
-        mock_const.ES_HOST = "https://elastic.example.com:9200"
-        mock_const.ES_API_KEY = "test-es-key"
-        mock_const.ES_USERNAME = "elastic"
-        mock_const.ES_PASSWORD = "test-password"
-
-        mock_get_model_name = MagicMock()
-        mock_get_model_name.side_effect = [
-            "openai/test-llm", "openai/test-embed"]
-
-        model_mapping = {"llm": "llm", "embedding": "embedding"}
-        mocker.patch('backend.utils.memory_utils.tenant_config_manager',
-                     mock_tenant_config_manager)
-        mocker.patch('backend.utils.memory_utils._c', mock_const)
-        mocker.patch(
-            'backend.utils.memory_utils.get_model_name_from_config', mock_get_model_name)
+        mock_constants.ES_HOST = "https://elastic.example.com:9200"
         mocker.patch(
-            'backend.utils.memory_utils.MODEL_CONFIG_MAPPING', model_mapping)
+            "backend.utils.memory_utils.get_model_name_from_config",
+            side_effect=["openai/test-llm", "openai/test-embed"],
+        )
 
-        # Execute
         result = build_memory_config("test-tenant-id")
 
-        # ES fields
         assert result["vector_store"]["config"]["host"] == "https://elastic.example.com"
         assert result["vector_store"]["config"]["port"] == 9200
         assert result["vector_store"]["config"]["collection_name"] == "mem0_openai_test-embed_1536"
 
-    def test_build_memory_config_with_custom_port(self, mocker):
-        """Custom ES port is parsed and applied; collection name composed"""
-        mock_tenant_config_manager = MagicMock()
+    def test_build_memory_config_with_custom_port(
+        self,
+        mocker,
+        patch_memory_dependencies,
+        mock_tenant_config_manager,
+        mock_constants,
+    ):
+        """Custom ES port is parsed and applied."""
         mock_tenant_config_manager.get_model_config.side_effect = [
-            {"model_name": "test-llm", "model_repo": "openai",
-                "base_url": "https://api.openai.com/v1", "api_key": "test-llm-key"},
-            {"model_name": "test-embed", "model_repo": "openai",
-                "base_url": "https://api.openai.com/v1", "api_key": "test-embed-key", "max_tokens": 1536}
+            {
+                "model_name": "test-llm",
+                "model_repo": "openai",
+                "base_url": "https://api.openai.com/v1",
+                "api_key": "test-llm-key",
+            },
+            {
+                "model_name": "test-embed",
+                "model_repo": "openai",
+                "base_url": "https://api.openai.com/v1",
+                "api_key": "test-embed-key",
+                "max_tokens": 1536,
+            },
         ]
-
-        mock_const = MagicMock()
-        mock_const.ES_HOST = "http://localhost:9300"  # custom port
-        mock_const.ES_API_KEY = "test-es-key"
-        mock_const.ES_USERNAME = "elastic"
-        mock_const.ES_PASSWORD = "test-password"
-
-        mock_get_model_name = MagicMock()
-        mock_get_model_name.side_effect = [
-            "openai/test-llm", "openai/test-embed"]
-
-        model_mapping = {"llm": "llm", "embedding": "embedding"}
-        mocker.patch('backend.utils.memory_utils.tenant_config_manager',
-                     mock_tenant_config_manager)
-        mocker.patch('backend.utils.memory_utils._c', mock_const)
+        mock_constants.ES_HOST = "http://localhost:9300"
         mocker.patch(
-            'backend.utils.memory_utils.get_model_name_from_config', mock_get_model_name)
-        mocker.patch(
-            'backend.utils.memory_utils.MODEL_CONFIG_MAPPING', model_mapping)
+            "backend.utils.memory_utils.get_model_name_from_config",
+            side_effect=["openai/test-llm", "openai/test-embed"],
+        )
 
-        # Execute
         result = build_memory_config("test-tenant-id")
 
-        # ES fields
         assert result["vector_store"]["config"]["host"] == "http://localhost"
         assert result["vector_store"]["config"]["port"] == 9300
         assert result["vector_store"]["config"]["collection_name"] == "mem0_openai_test-embed_1536"
 
-    def test_build_memory_config_sanitizes_slashes_in_repo_and_name(self, mocker):
-        """Slash characters in repo/name are replaced with underscores in collection name"""
-        mock_tenant_config_manager = MagicMock()
+    def test_build_memory_config_sanitizes_repo_and_name(
+        self,
+        mocker,
+        patch_memory_dependencies,
+        mock_tenant_config_manager,
+    ):
+        """Collection name sanitizes repo and model name through the helper."""
         mock_tenant_config_manager.get_model_config.side_effect = [
-            {"model_name": "gpt-4", "model_repo": "azure/openai",
-                "base_url": "https://api.example.com/v1", "api_key": "llm-key"},
-            {"model_name": "text-embed/ada-002", "model_repo": "azure/openai",
-                "base_url": "https://api.example.com/v1", "api_key": "embed-key", "max_tokens": 1536}
+            {
+                "model_name": "gpt-4",
+                "model_repo": "Azure/OpenAI Repo",
+                "base_url": "https://api.example.com/v1",
+                "api_key": "llm-key",
+            },
+            {
+                "model_name": "Text Embed@Ada/002",
+                "model_repo": "Azure/OpenAI Repo",
+                "base_url": "https://api.example.com/v1",
+                "api_key": "embed-key",
+                "max_tokens": 1536,
+            },
         ]
-
-        mock_const = MagicMock()
-        mock_const.ES_HOST = "http://localhost:9200"
-        mock_const.ES_API_KEY = "test-es-key"
-        mock_const.ES_USERNAME = "elastic"
-        mock_const.ES_PASSWORD = "test-password"
-
-        model_mapping = {"llm": "llm", "embedding": "embedding"}
-        mock_get_model_name = MagicMock()
-        mock_get_model_name.side_effect = [
-            "azure/openai/gpt-4", "azure/openai/text-embed/ada-002"]
-
-        mocker.patch('backend.utils.memory_utils.tenant_config_manager',
-                     mock_tenant_config_manager)
-        mocker.patch('backend.utils.memory_utils._c', mock_const)
-        mocker.patch(
-            'backend.utils.memory_utils.get_model_name_from_config', mock_get_model_name)
         mocker.patch(
-            'backend.utils.memory_utils.MODEL_CONFIG_MAPPING', model_mapping)
-
-        result = build_memory_config("tenant-with-slash")
-
-        assert result["vector_store"]["config"]["collection_name"] == "mem0_azure_openai_text-embed_ada-002_1536"
-
-    def test_build_memory_config_with_empty_model_repo(self, mocker):
-        """Empty model_repo yields collection name without repo segment"""
-        mock_tenant_config_manager = MagicMock()
+            "backend.utils.memory_utils.get_model_name_from_config",
+            side_effect=["azure/openai/gpt-4", "azure/openai/Text Embed@Ada/002"],
+        )
+
+        result = build_memory_config("tenant-with-special-chars")
+
+        assert result["vector_store"]["config"]["collection_name"] == (
+            "mem0_azure_openai_repo_text_embed_ada_002_1536"
+        )
+
+    @pytest.mark.parametrize("repo_value", ["", None])
+    def test_build_memory_config_without_repo_segment(
+        self,
+        repo_value,
+        mocker,
+        patch_memory_dependencies,
+        mock_tenant_config_manager,
+    ):
+        """Falsy model_repo omits the repo segment from the collection name."""
         mock_tenant_config_manager.get_model_config.side_effect = [
-            {"model_name": "gpt-4", "model_repo": "",
-                "base_url": "https://api.openai.com/v1", "api_key": "test-llm-key"},
-            {"model_name": "text-embedding-ada-002", "model_repo": "",
-                "base_url": "https://api.openai.com/v1", "api_key": "test-embed-key", "max_tokens": 1536}
+            {
+                "model_name": "gpt-4",
+                "model_repo": repo_value,
+                "base_url": "https://api.openai.com/v1",
+                "api_key": "test-llm-key",
+            },
+            {
+                "model_name": "Text Embedding/ADA 002",
+                "model_repo": repo_value,
+                "base_url": "https://api.openai.com/v1",
+                "api_key": "test-embed-key",
+                "max_tokens": 1536,
+            },
         ]
-
-        mock_const = MagicMock()
-        mock_const.ES_HOST = "http://localhost:9200"
-        mock_const.ES_API_KEY = "test-es-key"
-        mock_const.ES_USERNAME = "elastic"
-        mock_const.ES_PASSWORD = "test-password"
-
-        mock_get_model_name = MagicMock()
-        mock_get_model_name.side_effect = [
-            "gpt-4", "text-embedding-ada-002"]  # no repo prefix
-
-        model_mapping = {"llm": "llm", "embedding": "embedding"}
-        mocker.patch('backend.utils.memory_utils.tenant_config_manager',
-                     mock_tenant_config_manager)
-        mocker.patch('backend.utils.memory_utils._c', mock_const)
-        mocker.patch(
-            'backend.utils.memory_utils.get_model_name_from_config', mock_get_model_name)
         mocker.patch(
-            'backend.utils.memory_utils.MODEL_CONFIG_MAPPING', model_mapping)
+            "backend.utils.memory_utils.get_model_name_from_config",
+            side_effect=["gpt-4", "Text Embedding/ADA 002"],
+        )
 
-        # Execute
         result = build_memory_config("test-tenant-id")
 
-        # Model names
         assert result["llm"]["config"]["model"] == "gpt-4"
-        assert result["embedder"]["config"]["model"] == "text-embedding-ada-002"
-        # Collection name omits empty repo segment
-        assert result["vector_store"]["config"]["collection_name"] == "mem0_text-embedding-ada-002_1536"
+        assert result["embedder"]["config"]["model"] == "Text Embedding/ADA 002"
+        assert result["vector_store"]["config"]["collection_name"] == "mem0_text_embedding_ada_002_1536"
diff --git a/test/conftest.py b/test/conftest.py
index 4acb6aded..246d784a5 100644
--- a/test/conftest.py
+++ b/test/conftest.py
@@ -26,6 +26,8 @@
     "mem0.configs.embeddings.base": MagicMock(),
 }
 
+_optional_sdk_stubs = {}
+
 # Add backend and sdk directories to sys.path so that modules can be imported
 # as `from backend.xxx import ...` and `from sdk.xxx import ...`
 _test_root = os.path.dirname(os.path.abspath(__file__))
@@ -37,6 +39,9 @@
 if _sdk_dir not in sys.path:
     sys.path.insert(0, _sdk_dir)
 
+sys.modules.update({k: v for k, v in _mem0_stubs.items() if k not in sys.modules})
+sys.modules.update({k: v for k, v in _optional_sdk_stubs.items() if k not in sys.modules})
+
 _tmp_root = os.path.abspath(os.path.join(_test_root, "..", ".pytest-tmp"))
 os.makedirs(_tmp_root, exist_ok=True)
 os.environ.setdefault("TMP", _tmp_root)
diff --git a/test/sdk/container/test_docker_client.py b/test/sdk/container/test_docker_client.py
index e30f6bfdc..816159a00 100644
--- a/test/sdk/container/test_docker_client.py
+++ b/test/sdk/container/test_docker_client.py
@@ -1627,10 +1627,10 @@ def test_ensure_network_exists(self, docker_container_client):
         mock_network = MagicMock()
         docker_container_client.client.networks.get.return_value = mock_network
 
-        docker_container_client._ensure_network("nexent_nexent")
+        docker_container_client._ensure_network("nexent_network")
 
         docker_container_client.client.networks.get.assert_called_once_with(
-            "nexent_nexent")
+            "nexent_network")
         docker_container_client.client.networks.create.assert_not_called()
 
     def test_ensure_network_create_new(self, docker_container_client):
@@ -1640,12 +1640,12 @@ def test_ensure_network_create_new(self, docker_container_client):
         mock_network = MagicMock()
         docker_container_client.client.networks.create.return_value = mock_network
 
-        docker_container_client._ensure_network("nexent_nexent")
+        docker_container_client._ensure_network("nexent_network")
 
         docker_container_client.client.networks.get.assert_called_once_with(
-            "nexent_nexent")
+            "nexent_network")
         docker_container_client.client.networks.create.assert_called_once_with(
-            "nexent_nexent")
+            "nexent_network")
 
     def test_ensure_network_race_condition(self, docker_container_client):
         """Test ensuring network when race condition occurs (another process creates it)"""
@@ -1657,7 +1657,7 @@ def test_ensure_network_race_condition(self, docker_container_client):
         docker_container_client.client.networks.create.side_effect = APIError(
             "Network already exists")
 
-        docker_container_client._ensure_network("nexent_nexent")
+        docker_container_client._ensure_network("nexent_network")
 
         assert docker_container_client.client.networks.get.call_count == 2
         docker_container_client.client.networks.create.assert_called_once()
@@ -1672,7 +1672,7 @@ def test_ensure_network_create_fails_then_get_fails(self, docker_container_clien
             "Create failed")
 
         with pytest.raises(ContainerError, match="Failed to create or get Docker network"):
-            docker_container_client._ensure_network("nexent_nexent")
+            docker_container_client._ensure_network("nexent_network")
 
     def test_ensure_network_get_api_error(self, docker_container_client):
         """Test ensuring network when get raises APIError"""
@@ -1680,7 +1680,7 @@ def test_ensure_network_get_api_error(self, docker_container_client):
             "API error")
 
         with pytest.raises(ContainerError, match="Failed to get Docker network"):
-            docker_container_client._ensure_network("nexent_nexent")
+            docker_container_client._ensure_network("nexent_network")
 
 
 # ---------------------------------------------------------------------------
diff --git a/test/sdk/container/test_k8s_client.py b/test/sdk/container/test_k8s_client.py
index 42db8c58c..84e0bc557 100644
--- a/test/sdk/container/test_k8s_client.py
+++ b/test/sdk/container/test_k8s_client.py
@@ -11,6 +11,7 @@
     KubernetesContainerClient,
     ContainerError,
     ContainerConnectionError,
+    _sanitize_k8s_name,
 )
 from nexent.container.k8s_config import KubernetesContainerConfig
 
@@ -90,6 +91,79 @@ def mock_pod():
     return pod
 
 
+# ---------------------------------------------------------------------------
+# Test _sanitize_k8s_name
+# ---------------------------------------------------------------------------
+
+
+class TestSanitizeK8sName:
+    """Test _sanitize_k8s_name helper function"""
+
+    def test_sanitize_basic_alphanumeric(self):
+        """Test basic alphanumeric string passes through"""
+        assert _sanitize_k8s_name("test-service") == "test-service"
+        assert _sanitize_k8s_name("abc123") == "abc123"
+
+    def test_sanitize_lowercase_conversion(self):
+        """Test uppercase letters are converted to lowercase"""
+        assert _sanitize_k8s_name("TestService") == "testservice"
+        assert _sanitize_k8s_name("UPPERCASE") == "uppercase"
+
+    def test_sanitize_special_characters_replaced(self):
+        """Test special characters are replaced with dash"""
+        assert _sanitize_k8s_name("test@service") == "test-service"
+        assert _sanitize_k8s_name("foo#bar") == "foo-bar"
+        assert _sanitize_k8s_name("test$123") == "test-123"
+
+    def test_sanitize_consecutive_special_chars(self):
+        """Test consecutive special characters are collapsed to single dash"""
+        assert _sanitize_k8s_name("foo@@bar") == "foo-bar"
+        assert _sanitize_k8s_name("test@#$service") == "test-service"
+        assert _sanitize_k8s_name("a!!b") == "a-b"
+
+    def test_sanitize_leading_special_chars(self):
+        """Test leading special characters are removed"""
+        assert _sanitize_k8s_name("@test") == "test"
+        assert _sanitize_k8s_name("#foo") == "foo"
+        assert _sanitize_k8s_name("!test@service") == "test-service"
+
+    def test_sanitize_trailing_special_chars(self):
+        """Test trailing special characters are removed"""
+        assert _sanitize_k8s_name("test@") == "test"
+        assert _sanitize_k8s_name("test-service!") == "test-service"
+
+    def test_sanitize_mixed_case_with_specials(self):
+        """Test mixed case with special characters"""
+        assert _sanitize_k8s_name("Foo@Bar!Test") == "foo-bar-test"
+
+    def test_sanitize_empty_string(self):
+        """Test empty string returns 'unknown'"""
+        assert _sanitize_k8s_name("") == "unknown"
+
+    def test_sanitize_only_special_chars(self):
+        """Test string with only special characters returns 'unknown'"""
+        assert _sanitize_k8s_name("@@@") == "unknown"
+        assert _sanitize_k8s_name("!@#") == "unknown"
+
+    def test_sanitize_none(self):
+        """Test None returns 'unknown'"""
+        assert _sanitize_k8s_name(None) == "unknown"
+
+    def test_sanitize_with_dots(self):
+        """Test dots are converted to dashes"""
+        assert _sanitize_k8s_name("foo.bar") == "foo-bar"
+        assert _sanitize_k8s_name("foo...bar") == "foo-bar"
+
+    def test_sanitize_underscore_replaced(self):
+        """Test underscores are replaced with dash"""
+        assert _sanitize_k8s_name("foo_bar") == "foo-bar"
+
+    def test_sanitize_spaces_replaced(self):
+        """Test spaces are replaced with dash"""
+        assert _sanitize_k8s_name("foo bar") == "foo-bar"
+        assert _sanitize_k8s_name("foo  bar") == "foo-bar"
+
+
 # ---------------------------------------------------------------------------
 # Test KubernetesContainerClient.__init__
 # ---------------------------------------------------------------------------
@@ -192,6 +266,72 @@ def test_generate_pod_name_with_special_chars(self, k8s_container_client):
             assert "@" not in name
             assert "#" not in name
 
+    def test_generate_pod_name_consecutive_special_chars(self, k8s_container_client):
+        """Test pod name generation with consecutive special characters"""
+        with patch("nexent.container.k8s_client.uuid.uuid4") as mock_uuid:
+            mock_uuid.return_value.hex = "a1b2c3d4"
+            name = k8s_container_client._generate_pod_name(
+                "foo@@bar", "tenant123", "user12345")
+            assert name == "mcp-foo-bar-tenant12-user1234-a1b2c3d4"
+            assert "--" not in name
+
+    def test_generate_pod_name_leading_special_chars(self, k8s_container_client):
+        """Test pod name generation with leading special characters"""
+        with patch("nexent.container.k8s_client.uuid.uuid4") as mock_uuid:
+            mock_uuid.return_value.hex = "a1b2c3d4"
+            name = k8s_container_client._generate_pod_name(
+                "@test-service", "tenant123", "user12345")
+            # "@test-service" -> "test-service" (leading @ stripped)
+            assert name.startswith("mcp-test")
+            assert not name.startswith("mcp-@")
+
+    def test_generate_pod_name_trailing_special_chars(self, k8s_container_client):
+        """Test pod name generation with trailing special characters"""
+        with patch("nexent.container.k8s_client.uuid.uuid4") as mock_uuid:
+            mock_uuid.return_value.hex = "a1b2c3d4"
+            name = k8s_container_client._generate_pod_name(
+                "test-service@", "tenant123", "user12345")
+            assert name == "mcp-test-service-tenant12-user1234-a1b2c3d4"
+            assert name.endswith("-a1b2c3d4")
+
+    def test_generate_pod_name_uppercase(self, k8s_container_client):
+        """Test pod name generation with uppercase letters"""
+        with patch("nexent.container.k8s_client.uuid.uuid4") as mock_uuid:
+            mock_uuid.return_value.hex = "a1b2c3d4"
+            name = k8s_container_client._generate_pod_name(
+                "TestService", "tenant123", "user12345")
+            assert name == "mcp-testservice-tenant12-user1234-a1b2c3d4"
+
+    def test_generate_pod_name_underscores(self, k8s_container_client):
+        """Test pod name generation with underscores"""
+        with patch("nexent.container.k8s_client.uuid.uuid4") as mock_uuid:
+            mock_uuid.return_value.hex = "a1b2c3d4"
+            name = k8s_container_client._generate_pod_name(
+                "test_service", "tenant_123", "user_12345")
+            # tenant_123 -> tenant-123 (9 chars), truncated to 8 -> tenant-1
+            # user_12345 -> user-12345 (10 chars), truncated to 8 -> user-123
+            assert name == "mcp-test-service-tenant-1-user-123-a1b2c3d4"
+
+    def test_generate_pod_name_dots(self, k8s_container_client):
+        """Test pod name generation with dots"""
+        with patch("nexent.container.k8s_client.uuid.uuid4") as mock_uuid:
+            mock_uuid.return_value.hex = "a1b2c3d4"
+            name = k8s_container_client._generate_pod_name(
+                "test.service", "tenant.123", "user.12345")
+            # tenant.123 -> tenant.123 (9 chars), truncated to 8 -> tenant.1
+            # user.12345 -> user.12345 (10 chars), truncated to 8 -> user.123
+            assert name == "mcp-test-service-tenant-1-user-123-a1b2c3d4"
+
+    def test_generate_pod_name_spaces(self, k8s_container_client):
+        """Test pod name generation with spaces"""
+        with patch("nexent.container.k8s_client.uuid.uuid4") as mock_uuid:
+            mock_uuid.return_value.hex = "a1b2c3d4"
+            name = k8s_container_client._generate_pod_name(
+                "test service", "tenant 123", "user 12345")
+            # tenant 123 -> tenant 123 (9 chars), truncated to 8 -> tenant 1
+            # user 12345 -> user 12345 (10 chars), truncated to 8 -> user 123
+            assert name == "mcp-test-service-tenant-1-user-123-a1b2c3d4"
+
     def test_generate_pod_name_long_user_id(self, k8s_container_client):
         """Test pod name generation with long user ID"""
         long_user_id = "a" * 20
@@ -216,7 +356,7 @@ def test_generate_pod_name_empty_tenant(self, k8s_container_client):
             mock_uuid.return_value.hex = "a1b2c3d4"
             name = k8s_container_client._generate_pod_name(
                 "test-service", "", "user12345")
-            assert name == "mcp-test-service--user1234-a1b2c3d4"
+            assert name == "mcp-test-service-unknown-user1234-a1b2c3d4"
 
     def test_generate_pod_name_empty_user(self, k8s_container_client):
         """Test pod name generation with empty user_id"""
@@ -224,7 +364,7 @@ def test_generate_pod_name_empty_user(self, k8s_container_client):
             mock_uuid.return_value.hex = "a1b2c3d4"
             name = k8s_container_client._generate_pod_name(
                 "test-service", "tenant123", "")
-            assert name == "mcp-test-service-tenant12--a1b2c3d4"
+            assert name == "mcp-test-service-tenant12-unknown-a1b2c3d4"
 
     def test_generate_pod_name_none_tenant(self, k8s_container_client):
         """Test pod name generation with None tenant_id"""
@@ -232,7 +372,7 @@ def test_generate_pod_name_none_tenant(self, k8s_container_client):
             mock_uuid.return_value.hex = "a1b2c3d4"
             name = k8s_container_client._generate_pod_name(
                 "test-service", None, "user12345")
-            assert name == "mcp-test-service--user1234-a1b2c3d4"
+            assert name == "mcp-test-service-unknown-user1234-a1b2c3d4"
 
     def test_generate_pod_name_none_user(self, k8s_container_client):
         """Test pod name generation with None user_id"""
@@ -240,7 +380,7 @@ def test_generate_pod_name_none_user(self, k8s_container_client):
             mock_uuid.return_value.hex = "a1b2c3d4"
             name = k8s_container_client._generate_pod_name(
                 "test-service", "tenant123", None)
-            assert name == "mcp-test-service-tenant12--a1b2c3d4"
+            assert name == "mcp-test-service-tenant12-unknown-a1b2c3d4"
 
 
 # ---------------------------------------------------------------------------
@@ -1265,6 +1405,26 @@ def test_list_containers_service_filter_special_chars(self, k8s_container_client
 
         assert len(result) == 0
 
+    def test_list_containers_service_filter_consecutive_special_chars(self, k8s_container_client, mock_pod):
+        """Test listing containers with service filter containing consecutive special characters"""
+        k8s_container_client.core_v1.list_namespaced_pod.return_value = MagicMock(items=[mock_pod])
+
+        # The sanitized version of "test@@service" is "test-service"
+        # Since mock_pod's component is "test-service", it should match
+        result = k8s_container_client.list_containers(service_name="test@@service")
+
+        assert len(result) == 1
+
+    def test_list_containers_service_filter_leading_special_chars(self, k8s_container_client, mock_pod):
+        """Test listing containers with service filter containing leading special characters"""
+        k8s_container_client.core_v1.list_namespaced_pod.return_value = MagicMock(items=[mock_pod])
+
+        # The sanitized version of "@test-service" is "test-service" (leading @ stripped)
+        # Since mock_pod's component is "test-service", it should match
+        result = k8s_container_client.list_containers(service_name="@test-service")
+
+        assert len(result) == 1
+
     def test_list_containers_pod_no_ports(self, k8s_container_client):
         """Test listing containers when pod has no ports configured"""
         mock_pod_no_ports = MagicMock()
diff --git a/test/sdk/core/agents/test_agent_model.py b/test/sdk/core/agents/test_agent_model.py
index 19963d7b4..66856fda1 100644
--- a/test/sdk/core/agents/test_agent_model.py
+++ b/test/sdk/core/agents/test_agent_model.py
@@ -1259,6 +1259,34 @@ def test_agent_config_max_steps_rejects_out_of_bounds(self):
             )
 
 
+class TestAgentVerificationConfig:
+    """Tests for layered ReAct verification configuration."""
+
+    def test_default_verification_config_is_enabled(self):
+        config = agent_model_module.AgentVerificationConfig()
+
+        assert config.enabled is True
+        assert config.step_verification_enabled is True
+        assert config.final_verification_enabled is True
+        assert config.max_final_rounds == 2
+        assert "final_answer" in config.critical_events
+
+    def test_agent_config_has_default_verification_config(self):
+        config = agent_model_module.AgentConfig(
+            name="verified_agent",
+            description="Agent with default verification",
+            tools=[],
+            model_name="test",
+        )
+
+        assert config.verification_config.enabled is True
+        assert config.verification_config.strictness == "balanced"
+
+    def test_verification_config_rejects_invalid_rounds(self):
+        with pytest.raises(Exception):
+            agent_model_module.AgentVerificationConfig(max_final_rounds=0)
+
+
 # ----------------------------------------------------------------------------
 # Tests for model_rebuild
 # ----------------------------------------------------------------------------
diff --git a/test/sdk/core/agents/test_core_agent.py b/test/sdk/core/agents/test_core_agent.py
index 8f4f00ec6..3dd4f649e 100644
--- a/test/sdk/core/agents/test_core_agent.py
+++ b/test/sdk/core/agents/test_core_agent.py
@@ -279,6 +279,121 @@ def test_parse_code_blobs_run_format():
     assert result == expected
 
 
+# ----------------------------------------------------------------------------
+# Tests for layered final-answer verification policy
+# ----------------------------------------------------------------------------
+
+def _make_verification_controller(**config_overrides):
+    config = core_agent_module.AgentVerificationConfig(
+        enabled=True,
+        step_verification_enabled=True,
+        final_verification_enabled=True,
+        llm_verification_enabled=True,
+        **config_overrides,
+    )
+    observer = MagicMock()
+    observer.add_message = MagicMock()
+    model = MagicMock()
+    logger = MagicMock()
+    logger.log = MagicMock()
+    return core_agent_module.VerificationController(
+        config=config,
+        observer=observer,
+        agent_name="test-agent",
+        model=model,
+        logger=logger,
+    ), model
+
+
+def test_final_verification_skips_llm_for_greeting():
+    """Simple greetings should not require external evidence or tool output."""
+    controller, model = _make_verification_controller()
+
+    result = controller.verify_final_answer(
+        task="你好",
+        candidate="你好！有什么我可以帮你的吗？",
+        memory_summary="Step 1:\nCode:\nObservation:\nOutput:",
+        round_number=1,
+    )
+
+    assert result.passed is True
+    assert result.phase == "final_pass"
+    model.assert_not_called()
+
+
+def test_final_verification_pass_message_explains_reason():
+    """Passed verification events should tell users what was checked."""
+    controller, _ = _make_verification_controller()
+
+    controller.verify_final_answer(
+        task="你好",
+        candidate="你好！有什么我可以帮你的吗？",
+        memory_summary="Step 1:\nCode:\nObservation:\nOutput:",
+        round_number=1,
+    )
+
+    messages = [
+        json.loads(call.args[2])["message"]
+        for call in controller.observer.add_message.call_args_list
+    ]
+
+    assert any("基础自检通过" in message and "答案非空" in message for message in messages)
+    assert any("最终自检通过" in message and "轻量对话无需外部证据" in message for message in messages)
+
+
+def test_verification_feedback_does_not_count_as_tool_error():
+    """Self-verification feedback should not poison the next final-answer check."""
+    controller, _ = _make_verification_controller()
+    memory_summary = """
+Step 1:
+Observation:
+Verification feedback:
+- Event: final_answer
+- Severity: blocking
+- Failed criteria: evidence_grounding, tool_error_handling
+- Repair instruction: Provide more evidence.
+"""
+
+    result = controller.verify_before_final_answer(
+        candidate="你好！有什么我可以帮你的吗？",
+        observation=memory_summary,
+        step_number=2,
+    )
+
+    assert result.passed is True
+    assert "previous_errors_acknowledged" not in result.failed_criteria
+
+
+def test_llm_verifier_ignores_non_required_evidence_and_tool_error_failures():
+    """Verifier output is normalized when failed criteria are not required by policy."""
+    controller, _ = _make_verification_controller()
+    verifier_payload = json.dumps({
+        "passed": False,
+        "score": 0.5,
+        "status": "revise",
+        "failed_criteria": ["evidence_grounding", "tool_error_handling"],
+        "checks": [
+            {"name": "evidence_grounding", "passed": False},
+            {"name": "tool_error_handling", "passed": False},
+        ],
+        "revision_instruction": "Find evidence.",
+        "user_visible_note": "Missing evidence.",
+    })
+
+    result = controller._parse_llm_verifier_result(
+        verifier_payload,
+        {
+            "task_profile": "lightweight_conversation",
+            "evidence_required": False,
+            "tool_error_check_required": False,
+        },
+    )
+
+    assert result.passed is True
+    assert result.failed_criteria == []
+    assert result.score >= controller.config.pass_score
+
+
 def test_parse_code_blobs_run_format_with_newline():
     """Test parse_code_blobs with <code>\\ncontent\\n</code> pattern."""
     text = """Here is some code:
@@ -2372,13 +2487,13 @@ def test_handle_max_steps_reached_model_error_fallback(self):
         # Should return error message
         assert "Error in generating final LLM output" in result
 
-        # Verify logger was called with warning
+        # Verify logger was called with error
         agent.logger.log.assert_called()
-        warning_calls = [
+        error_calls = [
             call for call in agent.logger.log.call_args_list
-            if call[1].get("level") and "WARNING" in str(call[1].get("level"))
+            if call[1].get("level") and "ERROR" in str(call[1].get("level"))
         ]
-        assert len(warning_calls) >= 1
+        assert len(error_calls) >= 1
 
     def test_handle_max_steps_reached_creates_memory_step_with_error(self):
         """Test that a memory step with AgentMaxStepsError is created."""
@@ -2609,4 +2724,3 @@ def failing_truncate(content, max_length=1000):
         # Verify warning was logged via the except block
         # The exception handler logs via self.logger.log()
         agent.logger.log.assert_called()
-
diff --git a/test/sdk/core/agents/test_nexent_agent.py b/test/sdk/core/agents/test_nexent_agent.py
index ff8da11f8..882e28514 100644
--- a/test/sdk/core/agents/test_nexent_agent.py
+++ b/test/sdk/core/agents/test_nexent_agent.py
@@ -939,6 +939,88 @@ def test_create_local_tool_knowledge_base_with_display_name_map(nexent_agent_ins
     assert result.rerank_model == "mock_rerank_model"
 
 
+def test_create_local_tool_knowledge_base_with_document_paths_from_metadata(nexent_agent_instance):
+    """KnowledgeBaseSearchTool should receive document_paths from metadata via set_document_paths.
+
+    The `document_paths` parameter is declared with `exclude=True` so it must not
+    be passed to __init__. Instead it must be forwarded to `set_document_paths`
+    on the instance, sourced from `tool_config.metadata`. This guards against
+    the FieldInfo-iteration regression reported when document_paths is unset.
+    """
+    mock_kb_tool_class = MagicMock()
+    mock_kb_tool_instance = MagicMock()
+    mock_kb_tool_class.return_value = mock_kb_tool_instance
+
+    document_paths = ["s3://bucket/doc1.txt", "s3://bucket/doc2.txt"]
+
+    tool_config = ToolConfig(
+        class_name="KnowledgeBaseSearchTool",
+        name="knowledge_base_search",
+        description="desc",
+        inputs="{}",
+        output_type="string",
+        params={"top_k": 5, "index_names": ["kb1"]},
+        source="local",
+        metadata={
+            "vdb_core": "mock_vdb_core",
+            "embedding_model": "mock_embedding_model",
+            "document_paths": document_paths,
+        },
+    )
+
+    original_value = nexent_agent.__dict__.get("KnowledgeBaseSearchTool")
+    nexent_agent.__dict__["KnowledgeBaseSearchTool"] = mock_kb_tool_class
+
+    try:
+        nexent_agent_instance.create_local_tool(tool_config)
+    finally:
+        if original_value is not None:
+            nexent_agent.__dict__["KnowledgeBaseSearchTool"] = original_value
+        elif "KnowledgeBaseSearchTool" in nexent_agent.__dict__:
+            del nexent_agent.__dict__["KnowledgeBaseSearchTool"]
+
+    # document_paths is excluded and must not be forwarded to __init__.
+    init_kwargs = mock_kb_tool_class.call_args.kwargs
+    assert "document_paths" not in init_kwargs
+    # It must instead be applied via set_document_paths on the instance.
+    mock_kb_tool_instance.set_document_paths.assert_called_once_with(document_paths)
+
+
+def test_create_local_tool_knowledge_base_without_metadata_calls_set_document_paths_none(nexent_agent_instance):
+    """When metadata lacks document_paths, set_document_paths(None) must still be invoked.
+
+    Ensures the tool's internal filter is explicitly reset to None rather than
+    left as a stale FieldInfo default from the smolagents wrapper.
+    """
+    mock_kb_tool_class = MagicMock()
+    mock_kb_tool_instance = MagicMock()
+    mock_kb_tool_class.return_value = mock_kb_tool_instance
+
+    tool_config = ToolConfig(
+        class_name="KnowledgeBaseSearchTool",
+        name="knowledge_base_search",
+        description="desc",
+        inputs="{}",
+        output_type="string",
+        params={"top_k": 5, "index_names": ["kb1"]},
+        source="local",
+        metadata=None,
+    )
+
+    original_value = nexent_agent.__dict__.get("KnowledgeBaseSearchTool")
+    nexent_agent.__dict__["KnowledgeBaseSearchTool"] = mock_kb_tool_class
+
+    try:
+        nexent_agent_instance.create_local_tool(tool_config)
+    finally:
+        if original_value is not None:
+            nexent_agent.__dict__["KnowledgeBaseSearchTool"] = original_value
+        elif "KnowledgeBaseSearchTool" in nexent_agent.__dict__:
+            del nexent_agent.__dict__["KnowledgeBaseSearchTool"]
+
+    mock_kb_tool_instance.set_document_paths.assert_called_once_with(None)
+
+
 def test_create_local_tool_knowledge_base_with_empty_display_name_map(nexent_agent_instance):
     """Test KnowledgeBaseSearchTool creation handles empty display_name_to_index_map."""
     mock_kb_tool_class = MagicMock()
diff --git a/test/sdk/core/tools/test_knowledge_base_search_tool.py b/test/sdk/core/tools/test_knowledge_base_search_tool.py
index 53d02206a..7a4b23ebe 100644
--- a/test/sdk/core/tools/test_knowledge_base_search_tool.py
+++ b/test/sdk/core/tools/test_knowledge_base_search_tool.py
@@ -118,9 +118,67 @@ class VectorDatabaseCore:
 smolagents_mod = types.ModuleType("smolagents")
 smolagents_tools_mod = types.ModuleType("smolagents.tools")
 
+
 class Tool:
+    """Mock Tool class that properly handles Pydantic Field definitions."""
+
     def __init__(self, *args, **kwargs):
-        pass
+        from pydantic.fields import FieldInfo
+
+        # Set all provided kwargs as instance attributes
+        for key, value in kwargs.items():
+            setattr(self, key, value)
+
+        # For any Pydantic Field attributes defined in class hierarchy that weren't provided,
+        # extract their default values
+        for cls in type(self).__mro__:
+            if cls is Tool:
+                continue
+            if hasattr(cls, '__annotations__'):
+                for name, hint in cls.__annotations__.items():
+                    # Skip if already set from kwargs
+                    if name in self.__dict__:
+                        continue
+                    # Check if there's a class attribute that's a FieldInfo
+                    if hasattr(cls, name):
+                        value = getattr(cls, name)
+                        # Unwrap FieldInfo to get the default
+                        if isinstance(value, FieldInfo):
+                            # Handle default_factory
+                            if value.default_factory is not None:
+                                value = value.default_factory()
+                            else:
+                                value = value.default
+                        setattr(self, name, value)
+
+    def __setattr__(self, name, value):
+        from pydantic.fields import FieldInfo
+        # Unwrap FieldInfo when it's set after __init__ completes (not from kwargs)
+        if isinstance(value, FieldInfo):
+            # Check if this is a class-level default by looking at the class
+            for cls in type(self).__mro__:
+                if cls is Tool:
+                    continue
+                if hasattr(cls, name):
+                    class_attr = getattr(cls, name)
+                    if class_attr is value:
+                        # This is a class-level FieldInfo default, unwrap it
+                        if value.default_factory is not None:
+                            value = value.default_factory()
+                        else:
+                            value = value.default
+                        break
+            else:
+                # Not found in class hierarchy, unwrap it anyway
+                if value.default_factory is not None:
+                    value = value.default_factory()
+                else:
+                    value = value.default
+        self.__dict__[name] = value
+
+    def __repr__(self):
+        return f"<MockTool _internal_document_paths={getattr(self, '_internal_document_paths', 'MISSING')}>"
+
 
 smolagents_tools_mod.Tool = Tool
 smolagents_mod.tools = smolagents_tools_mod
@@ -497,15 +555,10 @@ def test_init_without_rerank_params(self, mock_observer):
             observer=mock_observer,
         )
 
-        # smolagents Tool doesn't properly handle Field defaults, so we check FieldInfo.default
-        try:
-            from pydantic import FieldInfo
-        except ImportError:
-            from pydantic.fields import FieldInfo
-        assert isinstance(tool.rerank, FieldInfo)
-        assert tool.rerank.default is False
-        assert tool.rerank_model_name.default == ""
-        assert tool.rerank_model.default is None
+        # Mock Tool properly unwraps Field defaults, so we check the actual values
+        assert tool.rerank is False
+        assert tool.rerank_model_name == ""
+        assert tool.rerank_model is None
 
     def test_forward_with_rerank_enabled(self, mock_observer, mock_vdb_core, mock_embedding_model, mocker):
         """Test forward method when rerank is enabled and model is provided."""
@@ -1516,3 +1569,298 @@ def test_forward_with_fieldinfo_rerank_default_only(self, mock_observer, mock_vd
         call_kwargs = mock_vdb_core.hybrid_search.call_args[1]
         # top_k from default is 3, multiplied by RERANK_OVERSEARCH_MULTIPLIER
         assert call_kwargs["top_k"] == 3 * RERANK_OVERSEARCH_MULTIPLIER
+
+
+class TestDocumentPathsAccessControl:
+    """Tests for document_paths access control functionality."""
+
+    def _create_mock_formatted_results_with_paths(self, paths: list) -> list:
+        """Create mock search results in FORMATTED format for _filter_by_document_paths tests.
+
+        After search_hybrid processes VDB results, the path_or_url is at the top level.
+        """
+        results = []
+        for path in paths:
+            results.append({
+                "path_or_url": path,
+                "title": f"Document {path}",
+                "content": f"Content for {path}",
+                "filename": f"{path}.txt",
+                "source_type": "file",
+                "create_time": "2024-01-01T12:00:00Z",
+                "score": 0.9,
+                "index": "test_index"
+            })
+        return results
+
+    def _create_mock_vdb_results_with_paths(self, paths: list) -> list:
+        """Create mock search results in VDB format for forward() tests.
+
+        VDB returns results with a nested 'document' object.
+        """
+        results = []
+        for path in paths:
+            results.append({
+                "document": {
+                    "path_or_url": path,
+                    "title": f"Document {path}",
+                    "content": f"Content for {path}",
+                    "filename": f"{path}.txt",
+                    "source_type": "file",
+                    "create_time": "2024-01-01T12:00:00Z",
+                },
+                "score": 0.9,
+                "index": "test_index"
+            })
+        return results
+        return results
+
+    def test_filter_by_document_paths_allows_matching(self, mock_vdb_core, mock_embedding_model):
+        """Test that results with path_or_url in the allowed list are returned."""
+        tool = KnowledgeBaseSearchTool(
+            index_names=["kb1"],
+            search_mode="hybrid",
+            vdb_core=mock_vdb_core,
+            embedding_model=mock_embedding_model,
+            document_paths=["s3://bucket/doc1.txt", "s3://bucket/doc2.txt"],
+        )
+
+        results = self._create_mock_formatted_results_with_paths(["s3://bucket/doc1.txt", "s3://bucket/doc2.txt", "s3://bucket/doc3.txt"])
+        filtered = tool._filter_by_document_paths(results)
+
+        # Only doc1 and doc2 should be returned
+        assert len(filtered) == 2
+        assert all(r.get("path_or_url") in ["s3://bucket/doc1.txt", "s3://bucket/doc2.txt"] for r in filtered)
+
+    def test_filter_by_document_paths_rejects_non_matching(self, mock_vdb_core, mock_embedding_model):
+        """Test that results with path_or_url NOT in the allowed list are filtered out."""
+        tool = KnowledgeBaseSearchTool(
+            index_names=["kb1"],
+            search_mode="hybrid",
+            vdb_core=mock_vdb_core,
+            embedding_model=mock_embedding_model,
+            document_paths=["s3://bucket/doc1.txt"],
+        )
+
+        results = self._create_mock_formatted_results_with_paths(["s3://bucket/doc1.txt", "s3://bucket/doc2.txt", "s3://bucket/doc3.txt"])
+        filtered = tool._filter_by_document_paths(results)
+
+        # Only doc1 should be returned
+        assert len(filtered) == 1
+        assert filtered[0].get("path_or_url") == "s3://bucket/doc1.txt"
+
+    def test_filter_by_document_paths_empty_list_returns_all(self, mock_vdb_core, mock_embedding_model):
+        """Test that empty document_paths list returns all results."""
+        tool = KnowledgeBaseSearchTool(
+            index_names=["kb1"],
+            search_mode="hybrid",
+            vdb_core=mock_vdb_core,
+            embedding_model=mock_embedding_model,
+            document_paths=[],
+        )
+
+        results = self._create_mock_formatted_results_with_paths(["s3://bucket/doc1.txt", "s3://bucket/doc2.txt", "s3://bucket/doc3.txt"])
+        filtered = tool._filter_by_document_paths(results)
+
+        # All results should be returned
+        assert len(filtered) == 3
+
+    def test_filter_by_document_paths_none_returns_all(self, mock_vdb_core, mock_embedding_model):
+        """Test that None document_paths (no filter) returns all results."""
+        tool = KnowledgeBaseSearchTool(
+            index_names=["kb1"],
+            search_mode="hybrid",
+            vdb_core=mock_vdb_core,
+            embedding_model=mock_embedding_model,
+            document_paths=None,
+        )
+
+        results = self._create_mock_formatted_results_with_paths(["s3://bucket/doc1.txt", "s3://bucket/doc2.txt", "s3://bucket/doc3.txt"])
+        filtered = tool._filter_by_document_paths(results)
+
+        # All results should be returned
+        assert len(filtered) == 3
+
+    def test_filter_by_document_paths_results_missing_path(self, mock_vdb_core, mock_embedding_model):
+        """Test that results without path_or_url field are filtered out when filter is active."""
+        tool = KnowledgeBaseSearchTool(
+            index_names=["kb1"],
+            search_mode="hybrid",
+            vdb_core=mock_vdb_core,
+            embedding_model=mock_embedding_model,
+            document_paths=["s3://bucket/doc1.txt"],
+        )
+
+        results = self._create_mock_formatted_results_with_paths(["s3://bucket/doc1.txt"])
+        # Add a result without path_or_url (flat format, no nested document)
+        results.append({
+            "title": "No Path",
+            "content": "This document has no path_or_url",
+            "filename": "no_path.txt",
+            "source_type": "file",
+            "score": 0.8,
+            "index": "test_index"
+        })
+
+        filtered = tool._filter_by_document_paths(results)
+
+        # Only doc1 should be returned
+        assert len(filtered) == 1
+        assert filtered[0].get("path_or_url") == "s3://bucket/doc1.txt"
+
+    def test_set_document_paths_method(self, mock_vdb_core, mock_embedding_model):
+        """Test the set_document_paths method updates the internal filter."""
+        tool = KnowledgeBaseSearchTool(
+            index_names=["kb1"],
+            search_mode="hybrid",
+            vdb_core=mock_vdb_core,
+            embedding_model=mock_embedding_model,
+            document_paths=None,
+        )
+
+        # Initially no filter
+        results = self._create_mock_formatted_results_with_paths(["s3://bucket/doc1.txt", "s3://bucket/doc2.txt"])
+        assert len(tool._filter_by_document_paths(results)) == 2
+
+        # Set document_paths filter
+        tool.set_document_paths(["s3://bucket/doc1.txt"])
+        filtered = tool._filter_by_document_paths(results)
+
+        # Only doc1 should be returned
+        assert len(filtered) == 1
+        assert filtered[0].get("path_or_url") == "s3://bucket/doc1.txt"
+
+    def test_forward_with_document_paths_filter(self, mock_vdb_core, mock_embedding_model, mock_observer):
+        """Test that forward method applies document_paths filter to search results."""
+        tool = KnowledgeBaseSearchTool(
+            index_names=["kb1"],
+            search_mode="hybrid",
+            vdb_core=mock_vdb_core,
+            embedding_model=mock_embedding_model,
+            observer=mock_observer,
+            document_paths=["s3://bucket/doc1.txt"],
+            top_k=5,
+        )
+
+        # Mock VDB returns 3 results, but only 1 matches the filter
+        # VDB returns nested 'document' format
+        mock_results = self._create_mock_vdb_results_with_paths(["s3://bucket/doc1.txt", "s3://bucket/doc2.txt", "s3://bucket/doc3.txt"])
+        mock_vdb_core.hybrid_search.return_value = mock_results
+
+        result = tool.forward("test query")
+        search_results = json.loads(result)
+
+        # Only doc1 should be in the result
+        assert len(search_results) == 1
+        assert search_results[0].get("url") == "s3://bucket/doc1.txt"
+
+    def test_forward_with_document_paths_filter_no_results_after_filter(self, mock_vdb_core, mock_embedding_model, mock_observer):
+        """Test that forward raises exception when all results are filtered out."""
+        tool = KnowledgeBaseSearchTool(
+            index_names=["kb1"],
+            search_mode="hybrid",
+            vdb_core=mock_vdb_core,
+            embedding_model=mock_embedding_model,
+            observer=mock_observer,
+            document_paths=["s3://bucket/nonexistent.txt"],
+            top_k=5,
+        )
+
+        # Mock VDB returns 3 results, none match the filter
+        mock_results = self._create_mock_vdb_results_with_paths(["s3://bucket/doc1.txt", "s3://bucket/doc2.txt", "s3://bucket/doc3.txt"])
+        mock_vdb_core.hybrid_search.return_value = mock_results
+
+        # Should raise exception because after filtering, no results remain
+        with pytest.raises(Exception) as excinfo:
+            tool.forward("test query")
+
+        assert "No results found" in str(excinfo.value)
+
+    def test_filter_by_document_paths_unwraps_fieldinfo_default(self, mock_vdb_core, mock_embedding_model):
+        """Filter should tolerate a FieldInfo default instead of a concrete list.
+
+        Regression: smolagents' Tool wrapper does not expand FieldInfo defaults for
+        parameters declared with `exclude=True`, so `self._internal_document_paths`
+        may arrive as a FieldInfo. The filter must unwrap it instead of failing with
+        `TypeError: argument of type 'FieldInfo' is not iterable`.
+        """
+        try:
+            from pydantic import FieldInfo
+        except ImportError:
+            from pydantic.fields import FieldInfo
+
+        field_info_default = FieldInfo(default=["s3://bucket/doc1.txt"])
+
+        tool = KnowledgeBaseSearchTool(
+            index_names=["kb1"],
+            search_mode="hybrid",
+            vdb_core=mock_vdb_core,
+            embedding_model=mock_embedding_model,
+            document_paths=None,
+        )
+        # Simulate a FieldInfo being assigned directly (e.g. from smolagents wrapper).
+        tool._internal_document_paths = field_info_default
+
+        results = self._create_mock_formatted_results_with_paths(
+            ["s3://bucket/doc1.txt", "s3://bucket/doc2.txt"]
+        )
+        filtered = tool._filter_by_document_paths(results)
+
+        assert len(filtered) == 1
+        assert filtered[0]["path_or_url"] == "s3://bucket/doc1.txt"
+
+    def test_filter_by_document_paths_unwraps_fieldinfo_default_factory(self, mock_vdb_core, mock_embedding_model):
+        """Filter should tolerate a FieldInfo with default_factory."""
+        try:
+            from pydantic import FieldInfo
+        except ImportError:
+            from pydantic.fields import FieldInfo
+
+        field_info_factory = FieldInfo(
+            default_factory=lambda: ["s3://bucket/doc2.txt"]
+        )
+
+        tool = KnowledgeBaseSearchTool(
+            index_names=["kb1"],
+            search_mode="hybrid",
+            vdb_core=mock_vdb_core,
+            embedding_model=mock_embedding_model,
+            document_paths=None,
+        )
+        tool._internal_document_paths = field_info_factory
+
+        results = self._create_mock_formatted_results_with_paths(
+            ["s3://bucket/doc1.txt", "s3://bucket/doc2.txt"]
+        )
+        filtered = tool._filter_by_document_paths(results)
+
+        assert len(filtered) == 1
+        assert filtered[0]["path_or_url"] == "s3://bucket/doc2.txt"
+
+    def test_set_document_paths_unwraps_fieldinfo(self, mock_vdb_core, mock_embedding_model):
+        """set_document_paths should also accept FieldInfo input defensively."""
+        try:
+            from pydantic import FieldInfo
+        except ImportError:
+            from pydantic.fields import FieldInfo
+
+        tool = KnowledgeBaseSearchTool(
+            index_names=["kb1"],
+            search_mode="hybrid",
+            vdb_core=mock_vdb_core,
+            embedding_model=mock_embedding_model,
+            document_paths=None,
+        )
+
+        field_info = FieldInfo(default=["s3://bucket/doc1.txt"])
+        tool.set_document_paths(field_info)
+
+        results = self._create_mock_formatted_results_with_paths(
+            ["s3://bucket/doc1.txt", "s3://bucket/doc2.txt"]
+        )
+        filtered = tool._filter_by_document_paths(results)
+
+        assert len(filtered) == 1
+        assert filtered[0]["path_or_url"] == "s3://bucket/doc1.txt"
+
+
diff --git a/test/sdk/core/tools/test_search_memory_tool.py b/test/sdk/core/tools/test_search_memory_tool.py
new file mode 100644
index 000000000..c17f2f14d
--- /dev/null
+++ b/test/sdk/core/tools/test_search_memory_tool.py
@@ -0,0 +1,209 @@
+import pytest
+from unittest.mock import MagicMock, patch, AsyncMock
+
+from sdk.nexent.core.utils.observer import MessageObserver, ProcessType
+from sdk.nexent.core.tools.search_memory_tool import SearchMemoryTool
+
+
+@pytest.fixture
+def mock_observer():
+    observer = MagicMock(spec=MessageObserver)
+    observer.lang = "en"
+    return observer
+
+
+@pytest.fixture
+def mock_user_config():
+    config = MagicMock()
+    config.agent_share_option = "always"
+    config.disable_agent_ids = []
+    config.disable_user_agent_ids = []
+    return config
+
+
+@pytest.fixture
+def search_memory_tool(mock_observer, mock_user_config):
+    return SearchMemoryTool(
+        memory_config={"test": "config"},
+        tenant_id="tenant_1",
+        user_id="user_1",
+        agent_id="agent_1",
+        memory_user_config=mock_user_config,
+        observer=mock_observer,
+    )
+
+
+def test_observer_english_message(search_memory_tool, mock_observer):
+    mock_observer.lang = "en"
+    with patch(
+        "sdk.nexent.memory.memory_service.search_memory_in_levels",
+        new_callable=AsyncMock,
+        return_value={"results": []},
+    ):
+        search_memory_tool.forward("some query")
+
+    mock_observer.add_message.assert_any_call("", ProcessType.TOOL, "Searching memory...")
+
+
+def test_observer_chinese_message(search_memory_tool, mock_observer):
+    mock_observer.lang = "zh"
+    with patch(
+        "sdk.nexent.memory.memory_service.search_memory_in_levels",
+        new_callable=AsyncMock,
+        return_value={"results": []},
+    ):
+        search_memory_tool.forward("some query")
+
+    mock_observer.add_message.assert_any_call("", ProcessType.TOOL, "搜索记忆中...")
+
+
+def test_no_observer(search_memory_tool):
+    search_memory_tool.observer = None
+    with patch(
+        "sdk.nexent.memory.memory_service.search_memory_in_levels",
+        new_callable=AsyncMock,
+        return_value={"results": [{"memory": "fact", "score": 0.9, "memory_level": "user"}]},
+    ):
+        result = search_memory_tool.forward("some query")
+
+    assert "Found 1 relevant memories" in result
+
+
+def test_forward_with_results(search_memory_tool):
+    with patch(
+        "sdk.nexent.memory.memory_service.search_memory_in_levels",
+        new_callable=AsyncMock,
+        return_value={
+            "results": [
+                {"memory": "User prefers dark mode", "score": 0.92, "memory_level": "user_agent"},
+                {"memory": "User timezone is UTC+8", "score": 0.85, "memory_level": "user"},
+                {"memory": "Agent should confirm before executing", "score": 0.71, "memory_level": "agent"},
+            ]
+        },
+    ) as mock_search:
+        result = search_memory_tool.forward("user preferences", top_k=3)
+
+    assert "Found 3 relevant memories" in result
+    assert "(score: 0.92, level: user_agent) User prefers dark mode" in result
+    assert "(score: 0.85, level: user) User timezone is UTC+8" in result
+    assert "(score: 0.71, level: agent) Agent should confirm before executing" in result
+
+    mock_search.assert_called_once_with(
+        query_text="user preferences",
+        memory_config={"test": "config"},
+        tenant_id="tenant_1",
+        user_id="user_1",
+        agent_id="agent_1",
+        top_k=3,
+        memory_levels=["tenant", "user", "agent", "user_agent"],
+    )
+
+
+def test_forward_no_results(search_memory_tool):
+    with patch(
+        "sdk.nexent.memory.memory_service.search_memory_in_levels",
+        new_callable=AsyncMock,
+        return_value={"results": []},
+    ):
+        result = search_memory_tool.forward("nonexistent topic")
+
+    assert result == "No relevant memories found."
+
+
+def test_forward_default_top_k(search_memory_tool):
+    with patch(
+        "sdk.nexent.memory.memory_service.search_memory_in_levels",
+        new_callable=AsyncMock,
+        return_value={"results": []},
+    ) as mock_search:
+        search_memory_tool.forward("some query")
+
+    call_kwargs = mock_search.call_args[1]
+    assert call_kwargs["top_k"] == 5
+
+
+def test_forward_custom_top_k(search_memory_tool):
+    with patch(
+        "sdk.nexent.memory.memory_service.search_memory_in_levels",
+        new_callable=AsyncMock,
+        return_value={"results": []},
+    ) as mock_search:
+        search_memory_tool.forward("some query", top_k=10)
+
+    call_kwargs = mock_search.call_args[1]
+    assert call_kwargs["top_k"] == 10
+
+
+def test_forward_uses_content_field_fallback(search_memory_tool):
+    with patch(
+        "sdk.nexent.memory.memory_service.search_memory_in_levels",
+        new_callable=AsyncMock,
+        return_value={
+            "results": [
+                {"content": "Fallback content field", "score": 0.8, "memory_level": "user"},
+            ]
+        },
+    ):
+        result = search_memory_tool.forward("query")
+
+    assert "Fallback content field" in result
+
+
+def test_levels_agent_share_never(search_memory_tool, mock_user_config):
+    mock_user_config.agent_share_option = "never"
+
+    with patch(
+        "sdk.nexent.memory.memory_service.search_memory_in_levels",
+        new_callable=AsyncMock,
+        return_value={"results": []},
+    ) as mock_search:
+        search_memory_tool.forward("query")
+
+    call_kwargs = mock_search.call_args[1]
+    assert "agent" not in call_kwargs["memory_levels"]
+    assert "tenant" in call_kwargs["memory_levels"]
+    assert "user" in call_kwargs["memory_levels"]
+    assert "user_agent" in call_kwargs["memory_levels"]
+
+
+def test_levels_disable_agent_ids(search_memory_tool, mock_user_config):
+    mock_user_config.disable_agent_ids = ["agent_1"]
+
+    with patch(
+        "sdk.nexent.memory.memory_service.search_memory_in_levels",
+        new_callable=AsyncMock,
+        return_value={"results": []},
+    ) as mock_search:
+        search_memory_tool.forward("query")
+
+    call_kwargs = mock_search.call_args[1]
+    assert "agent" not in call_kwargs["memory_levels"]
+    assert "tenant" in call_kwargs["memory_levels"]
+
+
+def test_levels_disable_user_agent_ids(search_memory_tool, mock_user_config):
+    mock_user_config.disable_user_agent_ids = ["agent_1"]
+
+    with patch(
+        "sdk.nexent.memory.memory_service.search_memory_in_levels",
+        new_callable=AsyncMock,
+        return_value={"results": []},
+    ) as mock_search:
+        search_memory_tool.forward("query")
+
+    call_kwargs = mock_search.call_args[1]
+    assert "user_agent" not in call_kwargs["memory_levels"]
+    assert "agent" in call_kwargs["memory_levels"]
+
+
+def test_forward_exception_returns_friendly_error(search_memory_tool):
+    with patch(
+        "sdk.nexent.memory.memory_service.search_memory_in_levels",
+        new_callable=AsyncMock,
+        side_effect=Exception("Elasticsearch timeout"),
+    ):
+        result = search_memory_tool.forward("query")
+
+    assert "Memory search failed" in result
+    assert "Elasticsearch timeout" in result
+    assert "Continuing without memory results" in result
diff --git a/test/sdk/core/tools/test_store_memory_tool.py b/test/sdk/core/tools/test_store_memory_tool.py
new file mode 100644
index 000000000..a3cfde9ef
--- /dev/null
+++ b/test/sdk/core/tools/test_store_memory_tool.py
@@ -0,0 +1,285 @@
+import pytest
+from unittest.mock import MagicMock, patch, AsyncMock
+
+from sdk.nexent.core.utils.observer import MessageObserver, ProcessType
+from sdk.nexent.core.tools.store_memory_tool import StoreMemoryTool
+
+
+@pytest.fixture
+def mock_observer():
+    observer = MagicMock(spec=MessageObserver)
+    observer.lang = "en"
+    return observer
+
+
+@pytest.fixture
+def mock_user_config():
+    config = MagicMock()
+    config.agent_share_option = "always"
+    config.disable_agent_ids = []
+    config.disable_user_agent_ids = []
+    return config
+
+
+@pytest.fixture
+def store_memory_tool(mock_observer, mock_user_config):
+    return StoreMemoryTool(
+        memory_config={"test": "config"},
+        tenant_id="tenant_1",
+        user_id="user_1",
+        agent_id="agent_1",
+        memory_user_config=mock_user_config,
+        observer=mock_observer,
+    )
+
+
+def test_observer_english_message(store_memory_tool, mock_observer):
+    mock_observer.lang = "en"
+    with patch(
+        "sdk.nexent.memory.memory_service.add_memory_in_levels",
+        new_callable=AsyncMock,
+        return_value={"results": []},
+    ):
+        store_memory_tool.forward("some content")
+
+    mock_observer.add_message.assert_any_call("", ProcessType.TOOL, "Saving to memory...")
+
+
+def test_observer_chinese_message(store_memory_tool, mock_observer):
+    mock_observer.lang = "zh"
+    with patch(
+        "sdk.nexent.memory.memory_service.add_memory_in_levels",
+        new_callable=AsyncMock,
+        return_value={"results": []},
+    ):
+        store_memory_tool.forward("some content")
+
+    mock_observer.add_message.assert_any_call("", ProcessType.TOOL, "保存到记忆中...")
+
+
+def test_no_observer(store_memory_tool):
+    store_memory_tool.observer = None
+    with patch(
+        "sdk.nexent.memory.memory_service.add_memory_in_levels",
+        new_callable=AsyncMock,
+        return_value={"results": [{"event": "ADD", "memory": "fact"}]},
+    ):
+        result = store_memory_tool.forward("some content")
+
+    assert "Stored successfully" in result
+
+
+def test_forward_add_event(store_memory_tool):
+    with patch(
+        "sdk.nexent.memory.memory_service.add_memory_in_levels",
+        new_callable=AsyncMock,
+        return_value={
+            "results": [
+                {"event": "ADD", "memory": "User prefers dark mode"},
+                {"event": "ADD", "memory": "User works on Project X"},
+            ]
+        },
+    ) as mock_add:
+        result = store_memory_tool.forward("I prefer dark mode and work on Project X")
+
+    assert "Stored successfully" in result
+    assert "[ADD] User prefers dark mode" in result
+    assert "[ADD] User works on Project X" in result
+    assert store_memory_tool.store_count == 1
+
+    mock_add.assert_called_once_with(
+        messages=[{"role": "user", "content": "I prefer dark mode and work on Project X"}],
+        memory_config={"test": "config"},
+        tenant_id="tenant_1",
+        user_id="user_1",
+        agent_id="agent_1",
+        memory_levels=["user_agent", "agent"],
+    )
+
+
+def test_forward_update_event(store_memory_tool):
+    with patch(
+        "sdk.nexent.memory.memory_service.add_memory_in_levels",
+        new_callable=AsyncMock,
+        return_value={
+            "results": [
+                {"event": "UPDATE", "memory": "User prefers dark mode and high contrast"},
+            ]
+        },
+    ):
+        result = store_memory_tool.forward("I also like high contrast")
+
+    assert "Stored successfully" in result
+    assert "[UPDATE] User prefers dark mode and high contrast" in result
+
+
+def test_forward_mixed_events(store_memory_tool):
+    with patch(
+        "sdk.nexent.memory.memory_service.add_memory_in_levels",
+        new_callable=AsyncMock,
+        return_value={
+            "results": [
+                {"event": "ADD", "memory": "New fact"},
+                {"event": "NONE", "memory": "Existing fact"},
+                {"event": "DELETE", "memory": "Old fact"},
+                {"event": "UPDATE", "memory": "Updated fact"},
+            ]
+        },
+    ):
+        result = store_memory_tool.forward("some content")
+
+    assert "[ADD] New fact" in result
+    assert "[UPDATE] Updated fact" in result
+    assert "NONE" not in result
+    assert "DELETE" not in result
+
+
+def test_forward_no_results(store_memory_tool):
+    with patch(
+        "sdk.nexent.memory.memory_service.add_memory_in_levels",
+        new_callable=AsyncMock,
+        return_value={"results": []},
+    ):
+        result = store_memory_tool.forward("just a greeting")
+
+    assert result == "No new facts were extracted from the content."
+
+
+def test_forward_all_none_events(store_memory_tool):
+    with patch(
+        "sdk.nexent.memory.memory_service.add_memory_in_levels",
+        new_callable=AsyncMock,
+        return_value={
+            "results": [
+                {"event": "NONE", "memory": "Already known fact"},
+            ]
+        },
+    ):
+        result = store_memory_tool.forward("already known info")
+
+    assert result == "The information was already present in memory (no changes needed)."
+
+
+def test_cost_guard_limit_reached(store_memory_tool):
+    store_memory_tool.store_count = 3
+
+    result = store_memory_tool.forward("some content")
+
+    assert "Memory storage limit reached" in result
+
+
+def test_cost_guard_increments_counter(store_memory_tool):
+    with patch(
+        "sdk.nexent.memory.memory_service.add_memory_in_levels",
+        new_callable=AsyncMock,
+        return_value={"results": [{"event": "ADD", "memory": "fact"}]},
+    ):
+        store_memory_tool.forward("content 1")
+        store_memory_tool.forward("content 2")
+
+    assert store_memory_tool.store_count == 2
+
+
+def test_cost_guard_increments_even_with_no_facts(store_memory_tool):
+    with patch(
+        "sdk.nexent.memory.memory_service.add_memory_in_levels",
+        new_callable=AsyncMock,
+        return_value={"results": []},
+    ):
+        store_memory_tool.forward("nothing useful")
+
+    # store_count increments after asyncio.run succeeds, regardless of results
+    assert store_memory_tool.store_count == 1
+
+
+def test_levels_agent_share_never(store_memory_tool, mock_user_config):
+    mock_user_config.agent_share_option = "never"
+
+    with patch(
+        "sdk.nexent.memory.memory_service.add_memory_in_levels",
+        new_callable=AsyncMock,
+        return_value={"results": [{"event": "ADD", "memory": "fact"}]},
+    ) as mock_add:
+        store_memory_tool.forward("some content")
+
+    call_kwargs = mock_add.call_args[1]
+    assert call_kwargs["memory_levels"] == ["user_agent"]
+    assert "agent" not in call_kwargs["memory_levels"]
+
+
+def test_levels_agent_share_always(store_memory_tool, mock_user_config):
+    mock_user_config.agent_share_option = "always"
+
+    with patch(
+        "sdk.nexent.memory.memory_service.add_memory_in_levels",
+        new_callable=AsyncMock,
+        return_value={"results": [{"event": "ADD", "memory": "fact"}]},
+    ) as mock_add:
+        store_memory_tool.forward("some content")
+
+    call_kwargs = mock_add.call_args[1]
+    assert "user_agent" in call_kwargs["memory_levels"]
+    assert "agent" in call_kwargs["memory_levels"]
+
+
+def test_levels_disable_agent_ids(store_memory_tool, mock_user_config):
+    mock_user_config.disable_agent_ids = ["agent_1"]
+
+    with patch(
+        "sdk.nexent.memory.memory_service.add_memory_in_levels",
+        new_callable=AsyncMock,
+        return_value={"results": [{"event": "ADD", "memory": "fact"}]},
+    ) as mock_add:
+        store_memory_tool.forward("some content")
+
+    call_kwargs = mock_add.call_args[1]
+    assert "agent" not in call_kwargs["memory_levels"]
+    assert "user_agent" in call_kwargs["memory_levels"]
+
+
+def test_levels_disable_user_agent_ids(store_memory_tool, mock_user_config):
+    mock_user_config.disable_user_agent_ids = ["agent_1"]
+
+    with patch(
+        "sdk.nexent.memory.memory_service.add_memory_in_levels",
+        new_callable=AsyncMock,
+        return_value={"results": [{"event": "ADD", "memory": "fact"}]},
+    ) as mock_add:
+        store_memory_tool.forward("some content")
+
+    call_kwargs = mock_add.call_args[1]
+    assert "user_agent" not in call_kwargs["memory_levels"]
+    assert "agent" in call_kwargs["memory_levels"]
+
+
+def test_levels_all_disabled(store_memory_tool, mock_user_config):
+    mock_user_config.disable_agent_ids = ["agent_1"]
+    mock_user_config.disable_user_agent_ids = ["agent_1"]
+
+    result = store_memory_tool.forward("some content")
+
+    assert result == "No memory levels available (all disabled by user preferences)."
+
+
+def test_forward_exception_returns_friendly_error(store_memory_tool):
+    with patch(
+        "sdk.nexent.memory.memory_service.add_memory_in_levels",
+        new_callable=AsyncMock,
+        side_effect=Exception("Elasticsearch connection refused"),
+    ):
+        result = store_memory_tool.forward("some content")
+
+    assert "Failed to store memory" in result
+    assert "Elasticsearch connection refused" in result
+    assert "Continuing without saving" in result
+
+
+def test_forward_exception_does_not_increment_counter(store_memory_tool):
+    with patch(
+        "sdk.nexent.memory.memory_service.add_memory_in_levels",
+        new_callable=AsyncMock,
+        side_effect=Exception("connection error"),
+    ):
+        store_memory_tool.forward("some content")
+
+    assert store_memory_tool.store_count == 0
diff --git a/test/sdk/data_process/test_core.py b/test/sdk/data_process/test_core.py
index 6c47c3732..e0edced14 100644
--- a/test/sdk/data_process/test_core.py
+++ b/test/sdk/data_process/test_core.py
@@ -2,6 +2,22 @@
 from pytest_mock import MockFixture
 from unittest.mock import Mock, MagicMock
 from io import BytesIO
+import sys
+import types
+
+
+fake_unstructured = types.ModuleType("unstructured_inference")
+fake_models = types.ModuleType("unstructured_inference.models")
+fake_tables = types.ModuleType("unstructured_inference.models.tables")
+fake_tables.tables_agent = types.SimpleNamespace(model=None)
+fake_logger = types.ModuleType("unstructured_inference.logger")
+fake_logger.logger = types.SimpleNamespace(info=lambda *a, **k: None, warning=lambda *a, **k: None, error=lambda *a, **k: None)
+fake_models.tables = fake_tables
+fake_unstructured.models = fake_models
+sys.modules.setdefault("unstructured_inference", fake_unstructured)
+sys.modules.setdefault("unstructured_inference.models", fake_models)
+sys.modules.setdefault("unstructured_inference.models.tables", fake_tables)
+sys.modules.setdefault("unstructured_inference.logger", fake_logger)
 
 from sdk.nexent.data_process.core import DataProcessCore
 
diff --git a/test/sdk/data_process/test_file_splitter.py b/test/sdk/data_process/test_file_splitter.py
index 6e59d2b76..5c44131d7 100644
--- a/test/sdk/data_process/test_file_splitter.py
+++ b/test/sdk/data_process/test_file_splitter.py
@@ -1,4 +1,6 @@
 from io import BytesIO
+import sys
+import types
 
 import pytest
 
@@ -7,6 +9,19 @@
 pytest.importorskip("openpyxl")
 pytest.importorskip("pypdf")
 
+fake_unstructured = types.ModuleType("unstructured_inference")
+fake_models = types.ModuleType("unstructured_inference.models")
+fake_tables = types.ModuleType("unstructured_inference.models.tables")
+fake_tables.tables_agent = types.SimpleNamespace(model=None)
+fake_logger = types.ModuleType("unstructured_inference.logger")
+fake_logger.logger = types.SimpleNamespace(info=lambda *a, **k: None, warning=lambda *a, **k: None, error=lambda *a, **k: None)
+fake_models.tables = fake_tables
+fake_unstructured.models = fake_models
+sys.modules.setdefault("unstructured_inference", fake_unstructured)
+sys.modules.setdefault("unstructured_inference.models", fake_models)
+sys.modules.setdefault("unstructured_inference.models.tables", fake_tables)
+sys.modules.setdefault("unstructured_inference.logger", fake_logger)
+
 from sdk.nexent.data_process.file_splitter import FileSplitter
 
 
diff --git a/test/sdk/data_process/test_openpyxl_processor.py b/test/sdk/data_process/test_openpyxl_processor.py
index 91182470e..b8c5178fe 100644
--- a/test/sdk/data_process/test_openpyxl_processor.py
+++ b/test/sdk/data_process/test_openpyxl_processor.py
@@ -3,6 +3,22 @@
 from pytest_mock import MockFixture
 from unittest.mock import Mock, MagicMock, patch
 from copy import deepcopy
+import sys
+import types
+
+
+fake_unstructured = types.ModuleType("unstructured_inference")
+fake_models = types.ModuleType("unstructured_inference.models")
+fake_tables = types.ModuleType("unstructured_inference.models.tables")
+fake_tables.tables_agent = types.SimpleNamespace(model=None)
+fake_logger = types.ModuleType("unstructured_inference.logger")
+fake_logger.logger = types.SimpleNamespace(info=lambda *a, **k: None, warning=lambda *a, **k: None, error=lambda *a, **k: None)
+fake_models.tables = fake_tables
+fake_unstructured.models = fake_models
+sys.modules.setdefault("unstructured_inference", fake_unstructured)
+sys.modules.setdefault("unstructured_inference.models", fake_models)
+sys.modules.setdefault("unstructured_inference.models.tables", fake_tables)
+sys.modules.setdefault("unstructured_inference.logger", fake_logger)
 
 from sdk.nexent.data_process.openpyxl_processor import OpenPyxlProcessor
 
diff --git a/test/sdk/data_process/test_unstructured_processor.py b/test/sdk/data_process/test_unstructured_processor.py
index bfb828d10..83724e995 100644
--- a/test/sdk/data_process/test_unstructured_processor.py
+++ b/test/sdk/data_process/test_unstructured_processor.py
@@ -5,6 +5,20 @@
 from pytest_mock import MockFixture
 from unittest.mock import Mock, MagicMock, patch
 
+
+fake_unstructured = types.ModuleType("unstructured_inference")
+fake_models = types.ModuleType("unstructured_inference.models")
+fake_tables = types.ModuleType("unstructured_inference.models.tables")
+fake_tables.tables_agent = types.SimpleNamespace(model=None)
+fake_logger = types.ModuleType("unstructured_inference.logger")
+fake_logger.logger = types.SimpleNamespace(info=lambda *a, **k: None, warning=lambda *a, **k: None, error=lambda *a, **k: None)
+fake_models.tables = fake_tables
+fake_unstructured.models = fake_models
+sys.modules.setdefault("unstructured_inference", fake_unstructured)
+sys.modules.setdefault("unstructured_inference.models", fake_models)
+sys.modules.setdefault("unstructured_inference.models.tables", fake_tables)
+sys.modules.setdefault("unstructured_inference.logger", fake_logger)
+
 from sdk.nexent.data_process.unstructured_processor import UnstructuredProcessor
 
 
diff --git a/test/sdk/skills/test_skill_manager.py b/test/sdk/skills/test_skill_manager.py
index a262a4bbe..b23c0b8dd 100644
--- a/test/sdk/skills/test_skill_manager.py
+++ b/test/sdk/skills/test_skill_manager.py
@@ -1921,7 +1921,8 @@ def test_run_python_script_with_list_params(self, mocker):
 
             assert result == "ok"
             args = sp.run.call_args[0][0]
-            assert args == ["python", ANY, "-i", "a", "-i", "b", "-i", "c"]
+            assert args[0] == sys.executable
+            assert args[1:] == [ANY, "-i", "a", "-i", "b", "-i", "c"]
 
     def test_run_python_script_boolean_false_excluded(self, mocker):
         """Test boolean flags in string params are passed as-is (True)."""