diff --git a/.github/workflows/auto-unit-test.yml b/.github/workflows/auto-unit-test.yml
index dace8dab6..1595fc769 100644
--- a/.github/workflows/auto-unit-test.yml
+++ b/.github/workflows/auto-unit-test.yml
@@ -36,7 +36,7 @@ jobs:
       - name: Set up Python
         uses: actions/setup-python@v4
         with:
-          python-version: '3.11'
+          python-version: '3.10'
 
       - name: Install uv
         run: pip install --upgrade uv
diff --git a/.github/workflows/sdk_publish.yml b/.github/workflows/sdk_publish.yml
index 3cc413381..1e5759277 100644
--- a/.github/workflows/sdk_publish.yml
+++ b/.github/workflows/sdk_publish.yml
@@ -21,7 +21,7 @@ jobs:
       - name: Set up Python
         uses: actions/setup-python@v5
         with:
-          python-version: '3.11'
+          python-version: '3.10'
 
       - name: Install build dependencies
         run: |
diff --git a/.gitignore b/.gitignore
index e0bac2b47..ec5b3a3f9 100644
--- a/.gitignore
+++ b/.gitignore
@@ -61,9 +61,4 @@ data/
 sdk/benchmark/.env
 /docker/.env.bak
 
-.venv
-
-.pytest-tmp
-doc/mermaid
-
-.claude/skills/python-import-triage
\ No newline at end of file
+.venv
\ No newline at end of file
diff --git a/backend/adapters/__init__.py b/backend/adapters/__init__.py
deleted file mode 100644
index ed46fc888..000000000
--- a/backend/adapters/__init__.py
+++ /dev/null
@@ -1,13 +0,0 @@
-from adapters.exception import JiuwenSDKError, JiuwenSDKUnavailableError, NexentCapabilityError
-
-try:
-    from adapters.jiuwen_sdk_adapter import JiuwenSDKAdapter
-except ModuleNotFoundError:
-    JiuwenSDKAdapter = None  # type: ignore[assignment, misc]
-
-__all__ = [
-    "JiuwenSDKError",
-    "JiuwenSDKUnavailableError",
-    "NexentCapabilityError",
-    "JiuwenSDKAdapter",
-]
diff --git a/backend/adapters/exception.py b/backend/adapters/exception.py
deleted file mode 100644
index 63812d3af..000000000
--- a/backend/adapters/exception.py
+++ /dev/null
@@ -1,13 +0,0 @@
-class JiuwenSDKError(Exception):
-    """Jiuwen SDK 调用失败的通用异常"""
-    pass
-
-
-class JiuwenSDKUnavailableError(JiuwenSDKError):
-    """Jiuwen SDK 不可用（依赖缺失或未启用）"""
-    pass
-
-
-class NexentCapabilityError(Exception):
-    """nexent 原生模式不支持该能力"""
-    pass
diff --git a/backend/adapters/jiuwen_sdk_adapter.py b/backend/adapters/jiuwen_sdk_adapter.py
deleted file mode 100644
index f62ce9d06..000000000
--- a/backend/adapters/jiuwen_sdk_adapter.py
+++ /dev/null
@@ -1,514 +0,0 @@
-"""
-openjiuwen SDK adapter for Nexent.
-
-This module must be imported lazily (not at module load time) because
-openjiuwen 0.1.13 has circular import bugs in its __init__.py files that
-prevent the SDK from loading unless we bypass them.
-
-Import flow:
-  backend/adapters/__init__.py -> try/except -> JiuwenSDKAdapter = None
-  -> when needed: _install_jiuwen_bypasser() -> openjiuwen imports work
-"""
-import asyncio
-import importlib.abc
-import importlib.machinery
-import json
-import logging
-import os
-import sys
-import types
-from typing import Any, List, Literal, Optional
-
-logger = logging.getLogger("jiuwen_adapter")
-
-from adapters.exception import JiuwenSDKError
-
-
-# ----------------------------------------------------------------------
-# Circular import bypasser for openjiuwen 0.1.13
-#
-# openjiuwen has broken __init__.py files that create circular import chains:
-#   tune/__init__.py -> tune.optimizer -> core.operator -> agent_evolving -> ...
-# This bypasser prevents those __init__.py files from executing while still
-# allowing regular .py submodule files to load normally.
-# ----------------------------------------------------------------------
-_CIRCULAR_CHAIN = {
-    "openjiuwen.agent_evolving",
-    "openjiuwen.agent_evolving.trainer",
-    "openjiuwen.agent_evolving.trainer.trainer",
-    "openjiuwen.agent_evolving.trainer.progress",
-    "openjiuwen.core",
-    "openjiuwen.dev_tools",
-    "openjiuwen.dev_tools.tune",
-    "openjiuwen.dev_tools.tune.optimizer",
-    "openjiuwen.dev_tools.tune.optimizer.instruction_optimizer",
-    "openjiuwen.dev_tools.prompt_builder",
-    "openjiuwen.dev_tools.prompt_builder.builder",
-}
-
-
-class _JiuwenInitBypasser(importlib.abc.MetaPathFinder, importlib.abc.Loader):
-    """
-    Meta path finder that intercepts __init__.py loading within openjiuwen,
-    blocking only the packages in the circular import chain while letting
-    all other modules (including base.py files) load normally.
-    """
-
-    def find_spec(self, fullname: str, path: Any, target: Any = None) -> Any:
-        if not fullname.startswith("openjiuwen") or fullname == "openjiuwen":
-            return None
-
-        try:
-            import openjiuwen as _oj
-
-            pkg_root = _oj.__path__[0]
-        except ImportError:
-            return None
-
-        parts = fullname.split(".")[1:]
-        file_path = pkg_root
-        for p in parts:
-            file_path = os.path.join(file_path, p)
-
-        is_package = os.path.isdir(file_path)
-        if not is_package:
-            return None
-
-        init_path = os.path.join(file_path, "__init__.py")
-        if not os.path.exists(init_path):
-            return None
-
-        if fullname not in _CIRCULAR_CHAIN:
-            return None
-
-        spec = importlib.machinery.ModuleSpec(
-            fullname, self, is_package=True, origin="<init bypassed>"
-        )
-        spec.submodule_search_locations = [file_path]
-        return spec
-
-    def create_module(self, module: Any) -> None:
-        return None
-
-    def exec_module(self, module: Any) -> None:
-        import openjiuwen as _oj
-
-        pkg_root = _oj.__path__[0]
-        parts = module.__name__.split(".")[1:]
-        file_path = pkg_root
-        for p in parts:
-            file_path = os.path.join(file_path, p)
-        module.__path__ = [file_path]
-        module.__file__ = os.path.join(file_path, "__init__.py")
-
-    def __getattr__(self, name: str) -> Any:
-        """Handle special attributes like find_distributions to prevent recursion."""
-        import openjiuwen as _oj
-        import importlib
-
-        # Prevent recursion when Python scans sys.meta_path for find_distributions etc.
-        if name in (
-            "find_distributions",
-            "find_module",
-            "__path__",
-            "__name__",
-            "__file__",
-            "__loader__",
-            "__package__",
-            "__spec__",
-        ):
-            raise AttributeError(name)
-
-        pkg_root = _oj.__path__[0]
-        parts = self.__name__.split(".")[1:] + [name]
-        file_path = pkg_root
-        for p in parts:
-            file_path = os.path.join(file_path, p)
-
-        # If it's a package directory, import it as a submodule
-        if os.path.isdir(file_path) and os.path.exists(os.path.join(file_path, "__init__.py")):
-            return importlib.import_module(f"{self.__name__}.{name}")
-        # If it's a regular .py file
-        if os.path.exists(file_path + ".py"):
-            return importlib.import_module(f"{self.__name__}.{name}")
-        raise AttributeError(name)
-
-
-_bypasser_installed = False
-
-
-def _install_jiuwen_bypasser() -> bool:
-    """
-    Install the circular import bypasser for openjiuwen.
-    Returns True if installed, False if already installed or openjiuwen not available.
-    """
-    global _bypasser_installed
-    if _bypasser_installed:
-        return True
-
-    # Stub missing optional dependencies before openjiuwen import chain reaches them
-    _stubbed = [
-        ("pymilvus", {"is_successful": lambda *args, **kwargs: True}),
-        ("dashscope", {}),
-        ("pdfplumber", {}),
-    ]
-    for _name, _attrs in _stubbed:
-        if _name not in sys.modules:
-            _mod = types.ModuleType(_name)
-            for _k, _v in _attrs.items():
-                setattr(_mod, _k, _v)
-            sys.modules[_name] = _mod
-            _mod.__path__ = []
-
-    # Pre-create nested stub modules for pymilvus.client.utils chain
-    if "pymilvus.client" not in sys.modules:
-        _client_mod = types.ModuleType("pymilvus.client")
-        _client_mod.__path__ = []
-        sys.modules["pymilvus.client"] = _client_mod
-    if "pymilvus.client.utils" not in sys.modules:
-        _utils_mod = types.ModuleType("pymilvus.client.utils")
-        _utils_mod.is_successful = lambda *args, **kwargs: True
-        sys.modules["pymilvus.client.utils"] = _utils_mod
-
-    # Stub dashscope sub-modules that may be imported lazily
-    _dashscope_subs = [
-        ("dashscope.api_entities", {}),
-        ("dashscope.api_entities.data", {}),
-        ("dashscope.api_entities.dashscope_response", {"DashScopeAPIResponse": object}),
-        ("dashscope.common", {"REQUEST_TIMEOUT_KEYWORD": "timeout"}),
-        ("dashscope.common.constants", {"REQUEST_TIMEOUT_KEYWORD": "timeout"}),
-    ]
-    for _name, _attrs in _dashscope_subs:
-        if _name not in sys.modules:
-            _m = types.ModuleType(_name)
-            _m.__path__ = []
-            for _k, _v in _attrs.items():
-                setattr(_m, _k, _v)
-            sys.modules[_name] = _m
-
-    try:
-        import openjiuwen  # noqa: F401
-    except ImportError:
-        return False
-
-    for finder in sys.meta_path:
-        if isinstance(finder, _JiuwenInitBypasser):
-            _bypasser_installed = True
-            return True
-
-    sys.meta_path.insert(0, _JiuwenInitBypasser())
-    _bypasser_installed = True
-    return True
-
-
-# ----------------------------------------------------------------------
-# Language helpers
-# ----------------------------------------------------------------------
-LANGUAGE_MAP = {"zh": "zh-CN", "en": "en-US"}
-
-
-def normalize_language(language: str) -> str:
-    return LANGUAGE_MAP.get(language, "zh-CN")
-
-
-def run_async(coro):
-    """
-    Safely run async coroutine from sync context (FastAPI or Celery).
-    Handles existing event loops properly.
-    """
-    try:
-        loop = asyncio.get_running_loop()
-    except RuntimeError:
-        return asyncio.run(coro)
-
-    if loop.is_running():
-        try:
-            import nest_asyncio
-            nest_asyncio.apply()
-            return loop.run_until_complete(coro)
-        except ImportError:
-            import concurrent.futures
-
-            def run_in_thread():
-                new_loop = asyncio.new_event_loop()
-                asyncio.set_event_loop(new_loop)
-                try:
-                    return new_loop.run_until_complete(coro)
-                finally:
-                    new_loop.close()
-
-            with concurrent.futures.ThreadPoolExecutor(max_workers=1) as executor:
-                future = executor.submit(run_in_thread)
-                return future.result()
-
-    return loop.run_until_complete(coro)
-
-
-# ----------------------------------------------------------------------
-# Jiuwen SDK lazy import helpers
-# ----------------------------------------------------------------------
-def _lazy_import_jiuwen_config():
-    """Lazily import only lightweight Jiuwen config classes."""
-    _install_jiuwen_bypasser()
-
-    try:
-        import openjiuwen  # noqa: F401
-    except ImportError as e:
-        raise JiuwenSDKError(f"Jiuwen SDK 未安装: {e}") from e
-
-    from openjiuwen.core.foundation.llm.schema.config import (
-        ModelRequestConfig,
-        ModelClientConfig,
-        ProviderType,
-    )
-
-    return ModelRequestConfig, ModelClientConfig, ProviderType
-
-
-def build_jiuwen_model_configs(model_id: int, tenant_id: str):
-    """将 nexent 模型配置转换为 Jiuwen 配置对象"""
-    from database.model_management_db import get_model_by_model_id
-    from utils.config_utils import get_model_name_from_config
-
-    ModelRequestConfig, ModelClientConfig, ProviderType = _lazy_import_jiuwen_config()
-
-    model_config = get_model_by_model_id(model_id, tenant_id)
-    if not model_config:
-        raise JiuwenSDKError(f"model_id={model_id} not found")
-
-    api_base = (model_config.get("base_url", "") or "").strip()
-    if not api_base:
-        api_base = "https://api.openai.com/v1"
-
-    # Jiuwen ModelClientConfig defaults to timeout=60.0, max_retries=3.
-    # For prompt optimization calls, 60s can be too small. Reuse Nexent model config timeout_seconds.
-    timeout_seconds = model_config.get("timeout_seconds")
-    if timeout_seconds is None:
-        timeout_seconds = 120
-
-    ssl_cert = model_config.get("ssl_cert") or None
-    ssl_verify = model_config.get("ssl_verify", True)
-    if ssl_verify and not ssl_cert:
-        ssl_verify = False
-
-    client_config = ModelClientConfig(
-        client_provider=ProviderType.OpenAI,
-        api_key=model_config["api_key"],
-        api_base=api_base,
-        timeout=float(timeout_seconds),
-        verify_ssl=ssl_verify,
-        ssl_cert=ssl_cert,
-    )
-
-    request_config = ModelRequestConfig(
-        model_name=get_model_name_from_config(model_config),
-        temperature=0.3,
-    )
-    return request_config, client_config
-
-
-def _lazy_import_jiuwen_builders():
-    """Lazily import prompt builders only when optimization paths need them."""
-    _install_jiuwen_bypasser()
-
-    try:
-        import openjiuwen  # noqa: F401
-    except ImportError as e:
-        raise JiuwenSDKError(f"Jiuwen SDK 未安装: {e}") from e
-
-    from openjiuwen.dev_tools.prompt_builder.builder.feedback_prompt_builder import (
-        FeedbackPromptBuilder,
-    )
-    from openjiuwen.dev_tools.prompt_builder.builder.badcase_prompt_builder import (
-        BadCasePromptBuilder,
-    )
-
-    return FeedbackPromptBuilder, BadCasePromptBuilder
-
-
-def _unwrap_prompt_response(text: str) -> str:
-    """Strip JSON wrapper or markdown fence that Jiuwen LLM sometimes generates."""
-    _logger = logging.getLogger("jiuwen_adapter")
-    _logger.debug(f"[unwrap] raw ({len(text)} chars): {text[:200]}")
-
-    # Step 1: strip markdown code fences
-    text = text.strip()
-    if text.startswith("```"):
-        for lang in ("json", ""):
-            fence = f"```{lang}\n"
-            if text.startswith(fence):
-                text = text[len(fence):]
-                if text.endswith("\n```"):
-                    text = text[:-4]
-                elif text.endswith("```"):
-                    text = text[:-3]
-                break
-        text = text.strip()
-        _logger.debug(f"[unwrap] after fence strip ({len(text)} chars)")
-
-    # Step 2: try standard JSON parse (handles format 1 and 2)
-    if text.startswith("{"):
-        try:
-            parsed = json.loads(text)
-            if isinstance(parsed, dict) and "prompt" in parsed:
-                result = parsed["prompt"].strip()
-                _logger.debug(f"[unwrap] extracted prompt ({len(result)} chars)")
-                return result
-            if isinstance(parsed, dict) and "result" in parsed:
-                result = parsed["result"].strip()
-                _logger.debug(f"[unwrap] extracted result ({len(result)} chars)")
-                return result
-        except Exception:
-            pass
-
-    # Step 3: format 3 and 4 - raw text (possibly multi-line), return as-is
-    _logger.debug(f"[unwrap] no JSON wrapper, returning raw ({len(text)} chars)")
-    return text
-
-
-def _lazy_import_jiuwen_tune_types():
-    """Lazily import Jiuwen tune types only when badcase flow needs them."""
-    _install_jiuwen_bypasser()
-    from openjiuwen.dev_tools.tune.base import Case, EvaluatedCase
-    return Case, EvaluatedCase
-
-
-def to_jiuwen_evaluated_case(bad_case) -> Any:
-    """将 nexent BadCase 转换为 Jiuwen EvaluatedCase"""
-    Case, EvaluatedCase = _lazy_import_jiuwen_tune_types()
-
-    case = Case(
-        inputs={"question": bad_case.question},
-        label={"answer": bad_case.label or ""},
-    )
-    return EvaluatedCase(
-        case=case,
-        answer={"content": bad_case.answer},
-        score=0.0,
-        reason=bad_case.reason or "",
-    )
-
-
-# ----------------------------------------------------------------------
-# Main adapter class
-# ----------------------------------------------------------------------
-class JiuwenSDKAdapter:
-    """
-    Jiuwen SDK 调用适配器
-
-    封装 Jiuwen SDK 的所有调用，内部不处理降级，
-    失败时抛出 JiuwenSDKError，由上层 PromptOptimizationService 决定是否降级
-    """
-
-    def __init__(self, model_id: int, tenant_id: str):
-        self.model_id = model_id
-        self.tenant_id = tenant_id
-        self.logger = logging.getLogger("jiuwen_adapter")
-
-    def _ensure_available(self):
-        """确保 Jiuwen SDK 可用"""
-        if not _bypasser_installed:
-            _install_jiuwen_bypasser()
-
-        try:
-            import openjiuwen  # noqa: F401
-        except ImportError as e:
-            raise JiuwenSDKError(f"Jiuwen SDK 未安装: {e}") from e
-
-    def optimize(
-        self,
-        prompt: str,
-        feedback: str,
-        mode: Literal["general", "insert", "select"] = "general",
-        start_pos: Optional[int] = None,
-        end_pos: Optional[int] = None,
-        language: str = "zh",
-    ) -> str:
-        """
-        调用 Jiuwen FeedbackPromptBuilder
-
-        Raises:
-            JiuwenSDKError: SDK 调用失败
-        """
-        self._ensure_available()
-
-        logger.info(f"[jiuwen-adapter] mode={mode}, start_pos={start_pos}, end_pos={end_pos}")
-
-        request_config, client_config = build_jiuwen_model_configs(
-            self.model_id, self.tenant_id
-        )
-        logger.info(
-            f"[jiuwen-adapter] model_id={self.model_id}, tenant_id={self.tenant_id}, "
-            f"api_base={client_config.api_base}, model={request_config.model_name}, "
-            f"timeout={getattr(client_config, 'timeout', None)}, max_retries={getattr(client_config, 'max_retries', None)}"
-        )
-        FeedbackPromptBuilder, _ = _lazy_import_jiuwen_builders()
-
-        builder = FeedbackPromptBuilder(
-            model_config=request_config,
-            model_client_config=client_config,
-        )
-
-        try:
-            result = run_async(
-                builder.build(
-                    prompt=prompt,
-                    feedback=feedback,
-                    mode=mode,
-                    start_pos=start_pos,
-                    end_pos=end_pos,
-                    language=normalize_language(language),
-                )
-            )
-            if result is None:
-                raise JiuwenSDKError("Jiuwen FeedbackPromptBuilder 返回为空")
-            return _unwrap_prompt_response(str(result))
-        except Exception as e:
-            self.logger.error(f"Jiuwen FeedbackPromptBuilder 调用失败: {e}")
-            raise JiuwenSDKError(f"优化调用失败: {e}") from e
-
-    def optimize_badcase(
-        self,
-        prompt: str,
-        bad_cases: List,
-        language: str = "zh",
-    ) -> str:
-        """
-        调用 Jiuwen BadCasePromptBuilder
-
-        Raises:
-            JiuwenSDKError: SDK 调用失败
-        """
-        self._ensure_available()
-
-        _, BadCasePromptBuilder = _lazy_import_jiuwen_builders()
-
-        request_config, client_config = build_jiuwen_model_configs(
-            self.model_id, self.tenant_id
-        )
-        builder = BadCasePromptBuilder(
-            model_config=request_config,
-            model_client_config=client_config,
-        )
-
-        jiuwen_cases = [to_jiuwen_evaluated_case(bc) for bc in bad_cases]
-
-        try:
-            result = run_async(
-                builder.build(
-                    prompt=prompt,
-                    cases=jiuwen_cases,
-                    language=normalize_language(language),
-                )
-            )
-            if result is None:
-                raise JiuwenSDKError("Jiuwen BadCasePromptBuilder 返回为空")
-            return _unwrap_prompt_response(str(result))
-        except Exception as e:
-            self.logger.error(f"Jiuwen BadCasePromptBuilder 调用失败: {e}")
-            raise JiuwenSDKError(f"BadCasePromptBuilder 调用失败: {e}") from e
-
-    def generate(self, **kwargs) -> dict:
-        """调用 Jiuwen 提示词生成能力"""
-        self._ensure_available()
-        raise JiuwenSDKError("Jiuwen 提示词生成能力尚未实现")
diff --git a/backend/agents/create_agent_info.py b/backend/agents/create_agent_info.py
index 7e3b42e28..50df7eb99 100644
--- a/backend/agents/create_agent_info.py
+++ b/backend/agents/create_agent_info.py
@@ -1,12 +1,12 @@
-﻿import json
-import threading
+﻿import threading
 import logging
-from typing import Any, Dict, List, Optional
+from typing import List, Optional
 from urllib.parse import urljoin
+from datetime import datetime
 
 from jinja2 import Template, StrictUndefined
 from nexent.core.utils.observer import MessageObserver
-from nexent.core.agents.agent_model import AgentRunInfo, ModelConfig, AgentConfig, ToolConfig, ExternalA2AAgentConfig, AgentHistory, AgentVerificationConfig
+from nexent.core.agents.agent_model import AgentRunInfo, ModelConfig, AgentConfig, ToolConfig, ExternalA2AAgentConfig, AgentHistory
 from nexent.core.agents.agent_context import ContextManagerConfig
 from nexent.memory.memory_service import search_memory_in_levels
 
@@ -22,11 +22,7 @@
 from database.a2a_agent_db import PROTOCOL_JSONRPC
 from services.memory_config_service import build_memory_context
 from services.image_service import get_video_understanding_model, get_vlm_model
-from database.agent_db import (
-    search_agent_info_by_agent_id,
-    query_sub_agent_relations,
-    resolve_sub_agent_version_no,
-)
+from database.agent_db import search_agent_info_by_agent_id, query_sub_agents_id_list
 from database.agent_version_db import query_current_version_no
 from database.tool_db import search_tools_for_sub_agent
 from database.model_management_db import get_model_records, get_model_by_model_id
@@ -37,71 +33,12 @@
 from utils.config_utils import tenant_config_manager, get_model_name_from_config
 from utils.context_utils import build_context_components
 from consts.const import LOCAL_MCP_SERVER, MODEL_CONFIG_MAPPING, LANGUAGE, DATA_PROCESS_SERVICE, MINIO_DEFAULT_BUCKET
-from consts.model import AgentToolParamsRequest, ToolParamsRequest
 from consts.exceptions import ValidationError
 
 logger = logging.getLogger("create_agent_info")
 logger.setLevel(logging.DEBUG)
 
 
-def _normalize_tool_params_request(tool_params: Optional[ToolParamsRequest | Dict[str, Any]]) -> ToolParamsRequest:
-    """Normalize request-scoped tool parameter overrides into a ToolParamsRequest."""
-    if tool_params is None:
-        return ToolParamsRequest()
-    if isinstance(tool_params, ToolParamsRequest):
-        return tool_params
-    if not isinstance(tool_params, dict):
-        raise ValidationError("tool_params must be an object.")
-    try:
-        return ToolParamsRequest.model_validate(tool_params)
-    except Exception as exc:
-        raise ValidationError(f"Invalid tool_params payload: {exc}") from exc
-
-
-def _get_agent_tool_overrides(
-    tool_params: Optional[ToolParamsRequest],
-    agent_name: Optional[str],
-) -> Dict[str, Dict[str, Any]]:
-    """Resolve tool overrides for a specific agent by its name."""
-    if tool_params is None:
-        return {}
-    if not agent_name:
-        return {}
-    agent_override = tool_params.agents.get(agent_name)
-    if agent_override is None:
-        return {}
-    return dict(agent_override.tools)
-
-
-def _merge_tool_params(
-    tool_record: Dict[str, Any],
-    override_params: Optional[Dict[str, Any]],
-    extra_params: Optional[Dict[str, Any]] = None,
-) -> Dict[str, Any]:
-    """Merge request overrides on top of tool instance defaults from DB.
-
-    Args:
-        tool_record: Tool configuration from database
-        override_params: Request-scoped overrides from tool_params
-        extra_params: Additional internal params not in DB schema (e.g., document_paths)
-
-    Returns:
-        Merged params dict with DB defaults, overrides, and extra params
-    """
-    merged_params: Dict[str, Any] = {}
-    for param in tool_record.get("params", []):
-        merged_params[param["name"]] = param.get("default")
-
-    if override_params:
-        merged_params.update(override_params)
-
-    # Extra params (e.g., internal access control params) always take precedence
-    if extra_params:
-        merged_params.update(extra_params)
-
-    return merged_params
-
-
 def _build_internal_s3_url(file: dict) -> str:
     """Build a valid S3 URL for internal tools from uploaded file metadata."""
     if not isinstance(file, dict):
@@ -373,23 +310,18 @@ async def create_agent_config(
     allow_memory_search: bool = True,
     version_no: int = 0,
     override_model_id: int | None = None,
-    tool_params: Optional[ToolParamsRequest | Dict[str, Any]] = None,
 ):
-    normalized_tool_params = _normalize_tool_params_request(tool_params)
     agent_info = search_agent_info_by_agent_id(
         agent_id=agent_id, tenant_id=tenant_id, version_no=version_no)
 
     # create sub agent
-    sub_agent_relations = query_sub_agent_relations(
+    sub_agent_id_list = query_sub_agents_id_list(
         main_agent_id=agent_id, tenant_id=tenant_id, version_no=version_no)
     managed_agents = []
-    for rel in sub_agent_relations:
-        sub_agent_id = rel['selected_agent_id']
-        sub_agent_version_no = resolve_sub_agent_version_no(
-            selected_agent_id=sub_agent_id,
-            selected_agent_version_no=rel.get('selected_agent_version_no'),
-            tenant_id=tenant_id,
-        )
+    for sub_agent_id in sub_agent_id_list:
+        # Get the current published version for this sub-agent (from draft version 0)
+        sub_agent_version_no = query_current_version_no(
+            agent_id=sub_agent_id, tenant_id=tenant_id) or 0
         sub_agent_config = await create_agent_config(
             agent_id=sub_agent_id,
             tenant_id=tenant_id,
@@ -399,20 +331,13 @@ async def create_agent_config(
             allow_memory_search=allow_memory_search,
             version_no=sub_agent_version_no,
             override_model_id=None,
-            tool_params=normalized_tool_params,
         )
         managed_agents.append(sub_agent_config)
 
     # create external A2A agents (synchronous function, no await needed)
     external_a2a_agents = _get_external_a2a_agents(agent_id, tenant_id, version_no)
 
-    tool_list = await create_tool_config_list(
-        agent_id,
-        tenant_id,
-        user_id,
-        version_no=version_no,
-        tool_params=normalized_tool_params,
-    )
+    tool_list = await create_tool_config_list(agent_id, tenant_id, user_id, version_no=version_no)
 
     # Build system prompt: prioritize segmented fields, fallback to original prompt field if not available
     duty_prompt = agent_info.get("duty_prompt", "")
@@ -458,77 +383,6 @@ async def create_agent_config(
             # Bubble up to streaming layer so it can emit <MEM_FAILED> and fall back
             raise Exception(f"Failed to retrieve memory list: {e}")
 
-    # Append active memory tools if memory is enabled
-    if memory_context.user_config.memory_switch and memory_context.memory_config:
-        try:
-            memory_metadata = {
-                "memory_config": memory_context.memory_config,
-                "memory_user_config": memory_context.user_config,
-                "tenant_id": memory_context.tenant_id,
-                "user_id": memory_context.user_id,
-                "agent_id": memory_context.agent_id,
-            }
-
-            store_tool_config = ToolConfig(
-                class_name="StoreMemoryTool",
-                name="store_memory",
-                description=(
-                    "Save important information to long-term memory for future recall. "
-                    "Use this when the user shares personal preferences, facts about themselves, "
-                    "project context, or instructions that should persist across conversations. "
-                    "Do NOT store transient information like temporary calculations, information "
-                    "already in the knowledge base, or data the user explicitly says to forget."
-                ),
-                inputs=json.dumps({
-                    "content": {
-                        "type": "string",
-                        "description": "The information to remember",
-                        "description_zh": "需要记住的信息"
-                    }
-                }, ensure_ascii=False),
-                output_type="string",
-                params={},
-                source="local",
-                usage=None,
-                metadata=memory_metadata,
-            )
-            tool_list.append(store_tool_config)
-
-            search_tool_config = ToolConfig(
-                class_name="SearchMemoryTool",
-                name="search_memory",
-                description=(
-                    "Search long-term memory for relevant information from previous interactions. "
-                    "Use this when you need context about the user's preferences, past decisions, "
-                    "or previously discussed topics that aren't in the current conversation. "
-                    "The system already provides some memory context automatically -- use this tool "
-                    "when you need to search for specific information not already available."
-                ),
-                inputs=json.dumps({
-                    "query": {
-                        "type": "string",
-                        "description": "Natural language query describing what to search for",
-                        "description_zh": "描述要搜索内容的自然语言查询"
-                    },
-                    "top_k": {
-                        "type": "integer",
-                        "description": "Maximum number of results to return",
-                        "description_zh": "返回结果的最大数量",
-                        "default": 5,
-                        "nullable": True
-                    }
-                }, ensure_ascii=False),
-                output_type="string",
-                params={},
-                source="local",
-                usage=None,
-                metadata=memory_metadata,
-            )
-            tool_list.append(search_tool_config)
-            logger.debug("Active memory tools appended to agent tool list")
-        except Exception as e:
-            logger.warning(f"Failed to append active memory tools: {e}")
-
     # Build knowledge base summary
     knowledge_base_summary = ""
     try:
@@ -559,6 +413,7 @@ async def create_agent_config(
     # Get skills list for prompt template
     skills = _get_skills_for_template(agent_id, tenant_id, version_no)
 
+    time_str = datetime.now().strftime("%Y-%m-%d %H:%M:%S")
     is_manager = len(managed_agents) > 0 or len(external_a2a_agents) > 0
 
     render_kwargs = {
@@ -573,6 +428,7 @@ async def create_agent_config(
         "APP_DESCRIPTION": app_description,
         "memory_list": memory_list,
         "knowledge_base_summary": knowledge_base_summary,
+        "time": time_str,
         "user_id": user_id,
     }
     system_prompt = Template(prompt_template["system_prompt"], undefined=StrictUndefined).render(render_kwargs)
@@ -601,6 +457,7 @@ async def create_agent_config(
             few_shots=few_shots_prompt,
             app_name=app_name,
             app_description=app_description,
+            time_str=time_str,
             user_id=user_id,
             language=language,
             is_manager=is_manager,
@@ -633,48 +490,21 @@ async def create_agent_config(
         external_a2a_agents=external_a2a_agents,
         context_manager_config=cm_config,
         context_components=context_components,
-        verification_config=AgentVerificationConfig.model_validate(agent_info.get("verification_config") or {}),
     )
     return agent_config
 
 
-async def create_tool_config_list(
-    agent_id,
-    tenant_id,
-    user_id,
-    version_no: int = 0,
-    tool_params: Optional[ToolParamsRequest | Dict[str, Any]] = None,
-):
+async def create_tool_config_list(agent_id, tenant_id, user_id, version_no: int = 0):
+    # Build one ToolConfig for each tool returned for this agent
     tool_config_list = []
     langchain_tools = await discover_langchain_tools()
-    normalized_tool_params = _normalize_tool_params_request(tool_params)
 
     # now only admin can modify the agent, user_id is not used
     tools_list = search_tools_for_sub_agent(agent_id, tenant_id, version_no=version_no)
-
-    # Look up agent name for use in error messages.
-    # Agent name is optional for tool_params matching (matching uses tool identifiers only),
-    # but we include it in error messages so callers can identify which agent/tool caused a failure.
-    agent_info = search_agent_info_by_agent_id(agent_id=agent_id, tenant_id=tenant_id, version_no=version_no)
-    agent_name = agent_info.get("name") if agent_info else None
-    agent_tool_overrides = _get_agent_tool_overrides(normalized_tool_params, agent_name)
-
-    tool_keys_seen = set()
     for tool in tools_list:
-        tool_identifier = tool.get("name") or tool.get("class_name")
-        if tool_identifier in tool_keys_seen:
-            raise ValidationError(
-                f"Duplicate tool identifier '{tool_identifier}' found in agent '{agent_name or agent_id}'."
-            )
-        tool_keys_seen.add(tool_identifier)
-
-        override_params = None
-        if tool.get("name") in agent_tool_overrides:
-            override_params = agent_tool_overrides[tool.get("name")]
-        elif tool.get("class_name") in agent_tool_overrides:
-            override_params = agent_tool_overrides[tool.get("class_name")]
-
-        param_dict = _merge_tool_params(tool, override_params)
+        param_dict = {}
+        for param in tool.get("params", []):
+            param_dict[param["name"]] = param.get("default")
         tool_config = ToolConfig(
             class_name=tool.get("class_name"),
             name=tool.get("name"),
@@ -693,21 +523,12 @@ async def create_tool_config_list(
                     tool_config.metadata = langchain_tool
                     break
 
-        # Extract document_paths for KnowledgeBaseSearchTool (internal access control, not in DB schema)
-        document_paths = None
-        if override_params and "document_paths" in override_params:
-            document_paths = override_params.get("document_paths")
-        # Also check using the tool name as key
-        if not document_paths:
-            kb_overrides = agent_tool_overrides.get("knowledge_base_search")
-            if kb_overrides and "document_paths" in kb_overrides:
-                document_paths = kb_overrides.get("document_paths")
-
         # special logic for search tools that may use reranking models
         if tool_config.class_name == "KnowledgeBaseSearchTool":
-            rerank = tool_config.params.get("rerank", False)
-            rerank_model_name = tool_config.params.get("rerank_model_name", "")
+            rerank = param_dict.get("rerank", False)
+            rerank_model_name = param_dict.get("rerank_model_name", "")
             rerank_model = None
+            is_multimodal = bool(tool_config.params.pop("multimodal", False))
             if rerank and rerank_model_name:
                 rerank_model = get_rerank_model(
                     tenant_id=tenant_id, model_name=rerank_model_name
@@ -715,7 +536,7 @@ async def create_tool_config_list(
 
             # Build display_name to index_name mapping for LLM parameter conversion
             # Also build reverse mapping (index_name -> display_name) for knowledge_base_summary
-            index_names = tool_config.params.get("index_names", [])
+            index_names = param_dict.get("index_names", [])
             display_name_to_index_map = {}
             index_name_to_display_map = {}
             if index_names:
@@ -731,14 +552,12 @@ async def create_tool_config_list(
                 "rerank_model": rerank_model,
                 "display_name_to_index_map": display_name_to_index_map,
                 "index_name_to_display_map": index_name_to_display_map,
-                # Internal access control: restrict results to specific document paths (path_or_urls)
-                "document_paths": document_paths,
             }
 
+            # index_names must be non-empty: the embedding model is looked up from index_names[0]
             if not index_names:
                 raise ValidationError(
-                    f"[{agent_name or agent_id}] knowledge_base_search tool requires index_names, "
-                    f"but it is not configured in the agent and not provided via tool_params.")
+                    "Embedding model is required for knowledge_base_search but index_names is empty")
 
             embedding_model, _, _ = get_embedding_model_by_index_name(tenant_id, index_names[0])
             if not embedding_model:
@@ -747,8 +566,8 @@ async def create_tool_config_list(
                     f"Please configure an embedding model for this knowledge base.")
             tool_config.metadata["embedding_model"] = embedding_model
         elif tool_config.class_name in ["DifySearchTool", "DataMateSearchTool"]:
-            rerank = tool_config.params.get("rerank", False)
-            rerank_model_name = tool_config.params.get("rerank_model_name", "")
+            rerank = param_dict.get("rerank", False)
+            rerank_model_name = param_dict.get("rerank_model_name", "")
             rerank_model = None
             if rerank and rerank_model_name:
                 rerank_model = get_rerank_model(
@@ -1042,7 +861,6 @@ async def create_agent_run_info(
     is_debug: bool = False,
     override_version_no: int | None = None,
     override_model_id: int | None = None,
-    tool_params: Optional[ToolParamsRequest | Dict[str, Any]] = None,
 ):
     # Determine which version_no to use based on is_debug flag
     # If is_debug=false, use the current published version (current_version_no)
@@ -1075,7 +893,7 @@ async def create_agent_run_info(
     if override_model_id is not None:
         create_config_kwargs["override_model_id"] = override_model_id
 
-    agent_config = await create_agent_config(**create_config_kwargs, tool_params=tool_params)
+    agent_config = await create_agent_config(**create_config_kwargs)
 
     remote_mcp_list = await get_remote_mcp_server_list(tenant_id=tenant_id, is_need_auth=True)
     default_mcp_url = urljoin(LOCAL_MCP_SERVER, "sse")
diff --git a/backend/apps/agent_app.py b/backend/apps/agent_app.py
index 87abbf9e8..e280ff422 100644
--- a/backend/apps/agent_app.py
+++ b/backend/apps/agent_app.py
@@ -195,6 +195,8 @@ async def export_agent_api(request: AgentIDRequest, authorization: Optional[str]
                     "Content-Disposition": f"attachment; filename=\"{result.get('filename', 'agent_export.zip')}\""
                 }
             )
+        if isinstance(result, str):
+            result = json.loads(result)
         return ConversationResponse(code=0, message="success", data=result)
     except Exception as e:
         logger.error(f"Agent export error: {str(e)}")
@@ -619,5 +621,3 @@ async def list_published_agents_api(
         raise HTTPException(
             status_code=HTTPStatus.INTERNAL_SERVER_ERROR, detail="Published agents list error."
         )
-
-
diff --git a/backend/apps/agent_repository_app.py b/backend/apps/agent_repository_app.py
deleted file mode 100644
index e9da2fde0..000000000
--- a/backend/apps/agent_repository_app.py
+++ /dev/null
@@ -1,134 +0,0 @@
-import logging
-from http import HTTPStatus
-from typing import Optional
-
-from fastapi import APIRouter, Body, Header, HTTPException, Query
-from starlette.responses import JSONResponse
-
-from consts.exceptions import SkillDuplicateError, UnauthorizedError
-from services.agent_repository_service import (
-    create_agent_repository_listing_impl,
-    import_agent_from_repository_impl,
-    list_agent_repository_listings_impl,
-    update_agent_repository_status_impl,
-)
-from utils.auth_utils import get_current_user_id
-
-agent_repository_router = APIRouter(prefix="/repository/agent")
-logger = logging.getLogger("agent_repository_app")
-
-
-@agent_repository_router.get("")
-async def list_agent_repository_listings_api(
-    status: Optional[str] = Query(None, description="Filter by listing status"),
-    authorization: str = Header(None),
-):
-    """List all marketplace repository listings with optional status filter."""
-    try:
-        get_current_user_id(authorization)
-        result = list_agent_repository_listings_impl(status=status)
-        return JSONResponse(status_code=HTTPStatus.OK, content=result)
-    except UnauthorizedError as e:
-        raise HTTPException(status_code=HTTPStatus.UNAUTHORIZED, detail=str(e))
-    except ValueError as e:
-        raise HTTPException(status_code=HTTPStatus.BAD_REQUEST, detail=str(e))
-    except Exception as e:
-        logger.error(f"List agent repository listings error: {str(e)}")
-        raise HTTPException(
-            status_code=HTTPStatus.INTERNAL_SERVER_ERROR,
-            detail="List agent repository listings error.",
-        )
-
-
-@agent_repository_router.patch("/{agent_repository_id}/status")
-async def update_agent_repository_status_api(
-    agent_repository_id: int,
-    status: str = Body(
-        ...,
-        embed=True,
-        description=(
-            "New status: NOT_SHARED (未共享) / PENDING_REVIEW (待审核) / "
-            "REJECTED (审核驳回) / SHARED (已共享)"
-        ),
-    ),
-    authorization: str = Header(None),
-):
-    """Update marketplace repository listing status (share, unshare, approve, reject)."""
-    try:
-        user_id, _ = get_current_user_id(authorization)
-        result = update_agent_repository_status_impl(
-            agent_repository_id=agent_repository_id,
-            status=status,
-            user_id=user_id,
-        )
-        return JSONResponse(status_code=HTTPStatus.OK, content=result)
-    except UnauthorizedError as e:
-        raise HTTPException(status_code=HTTPStatus.UNAUTHORIZED, detail=str(e))
-    except ValueError as e:
-        raise HTTPException(status_code=HTTPStatus.BAD_REQUEST, detail=str(e))
-    except Exception as e:
-        logger.error(f"Update agent repository status error: {str(e)}")
-        raise HTTPException(
-            status_code=HTTPStatus.INTERNAL_SERVER_ERROR,
-            detail="Update agent repository status error.",
-        )
-
-
-@agent_repository_router.post("/{agent_id}/versions/{version_no}")
-async def create_agent_repository_listing_api(
-    agent_id: int,
-    version_no: int,
-    authorization: str = Header(None),
-):
-    """Create or update a marketplace repository listing from an agent version snapshot."""
-    try:
-        user_id, tenant_id = get_current_user_id(authorization)
-        result = await create_agent_repository_listing_impl(
-            agent_id=agent_id,
-            tenant_id=tenant_id,
-            user_id=user_id,
-            version_no=version_no,
-        )
-        return JSONResponse(status_code=HTTPStatus.OK, content=result)
-    except UnauthorizedError as e:
-        raise HTTPException(status_code=HTTPStatus.UNAUTHORIZED, detail=str(e))
-    except ValueError as e:
-        raise HTTPException(status_code=HTTPStatus.BAD_REQUEST, detail=str(e))
-    except Exception as e:
-        logger.error(f"Create agent repository listing error: {str(e)}")
-        raise HTTPException(
-            status_code=HTTPStatus.INTERNAL_SERVER_ERROR,
-            detail="Create agent repository listing error.",
-        )
-
-
-@agent_repository_router.post("/{agent_repository_id}/import")
-async def import_agent_from_repository_api(
-    agent_repository_id: int,
-    authorization: Optional[str] = Header(None),
-):
-    """Import an agent tree from a marketplace repository listing into the current tenant."""
-    try:
-        await import_agent_from_repository_impl(
-            agent_repository_id=agent_repository_id,
-            authorization=authorization,
-        )
-        return JSONResponse(status_code=HTTPStatus.OK, content={})
-    except UnauthorizedError as e:
-        raise HTTPException(status_code=HTTPStatus.UNAUTHORIZED, detail=str(e))
-    except SkillDuplicateError as exc:
-        raise HTTPException(
-            status_code=HTTPStatus.CONFLICT,
-            detail={
-                "type": "skill_duplicate",
-                "duplicate_skills": exc.duplicate_names,
-            },
-        )
-    except ValueError as e:
-        raise HTTPException(status_code=HTTPStatus.NOT_FOUND, detail=str(e))
-    except Exception as e:
-        logger.error(f"Import agent from repository error: {str(e)}")
-        raise HTTPException(
-            status_code=HTTPStatus.INTERNAL_SERVER_ERROR,
-            detail="Import agent from repository error.",
-        )
diff --git a/backend/apps/app_factory.py b/backend/apps/app_factory.py
index 02816cec1..219da5b82 100644
--- a/backend/apps/app_factory.py
+++ b/backend/apps/app_factory.py
@@ -101,16 +101,6 @@ async def generic_exception_handler(request, exc):
         if isinstance(exc, AppException):
             return await app_exception_handler(request, exc)
 
-        # Handle NexentCapabilityError with a friendly message
-        from adapters.exception import NexentCapabilityError as _NCE
-
-        if isinstance(exc, _NCE):
-            logger.warning(f"NexentCapabilityError: {exc}")
-            return JSONResponse(
-                status_code=400,
-                content={"message": str(exc)},
-            )
-
         logger.error(f"Generic Exception: {exc}")
         return JSONResponse(
             status_code=500,
diff --git a/backend/apps/cas_app.py b/backend/apps/cas_app.py
deleted file mode 100644
index dbf4815f8..000000000
--- a/backend/apps/cas_app.py
+++ /dev/null
@@ -1,156 +0,0 @@
-import html
-import logging
-from http import HTTPStatus
-from typing import Optional
-from urllib.parse import parse_qs, urlsplit
-
-from fastapi import APIRouter, HTTPException, Query, Request
-from fastapi.responses import HTMLResponse, JSONResponse, RedirectResponse
-
-from services.cas_service import (
-    CAS_SERVER_URL,
-    CasAuthenticationError,
-    build_login_url,
-    build_renew_url,
-    get_cas_config,
-    login_with_ticket,
-    renew_with_ticket,
-    revoke_from_logout_request,
-)
-
-logger = logging.getLogger(__name__)
-router = APIRouter(prefix="/user/cas", tags=["cas"])
-
-
-@router.get("/config")
-async def config():
-    return JSONResponse(
-        status_code=HTTPStatus.OK,
-        content={"message": "success", "data": get_cas_config()},
-    )
-
-
-@router.get("/login")
-async def login(redirect: str = Query("/", description="URL to return to after login")):
-    try:
-        login_url = _require_cas_server_redirect(build_login_url(redirect))
-        return RedirectResponse(url=login_url, status_code=HTTPStatus.FOUND)
-    except CasAuthenticationError as exc:
-        logger.warning("CAS login rejected: %s", exc)
-        raise HTTPException(status_code=HTTPStatus.BAD_REQUEST, detail="CAS login is not available")
-
-
-@router.get("/callback")
-async def callback(ticket: str = "", redirect: str = "/"):
-    try:
-        result = await login_with_ticket(ticket, redirect)
-        return JSONResponse(
-            status_code=HTTPStatus.OK,
-            content={"message": "CAS login successful", "data": result},
-        )
-    except CasAuthenticationError as exc:
-        logger.warning("CAS callback rejected: %s", exc)
-        raise HTTPException(status_code=HTTPStatus.UNAUTHORIZED, detail="CAS authentication failed")
-    except Exception as exc:
-        logger.error(f"CAS callback failed: {exc}")
-        raise HTTPException(status_code=HTTPStatus.INTERNAL_SERVER_ERROR, detail="CAS login failed")
-
-
-@router.post("/callback")
-async def callback_logout(request: Request, logout_request: Optional[str] = None):
-    return await _handle_logout_request(request, logout_request, endpoint="callback")
-
-
-@router.get("/renew")
-async def renew():
-    try:
-        return RedirectResponse(url=build_renew_url(), status_code=HTTPStatus.FOUND)
-    except CasAuthenticationError as exc:
-        logger.warning("CAS renew rejected: %s", exc)
-        return _renew_html(False, "CAS renew failed")
-
-
-@router.get("/renew_callback")
-async def renew_callback(ticket: str = ""):
-    if not ticket:
-        return _renew_html(False, "CAS session is not active")
-    try:
-        result = await renew_with_ticket(ticket)
-        return JSONResponse(
-            status_code=HTTPStatus.OK,
-            content={"message": "CAS renew successful", "data": result},
-        )
-    except Exception as exc:
-        logger.warning(f"CAS renew failed: {exc}")
-        return _renew_html(False, "CAS renew failed")
-
-
-@router.post("/logout_callback")
-async def logout_callback(
-    request: Request,
-    logout_request: Optional[str] = None,
-):
-    return await _handle_logout_request(request, logout_request, endpoint="logout_callback")
-
-
-async def _handle_logout_request(
-    request: Request,
-    logout_request: Optional[str] = None,
-    endpoint: str = "unknown",
-):
-    logout_request = await _extract_logout_request(request, logout_request)
-    logger.info(
-        "CAS SLO %s received logoutRequest: present=%s length=%s",
-        endpoint,
-        bool(logout_request),
-        len(logout_request or ""),
-    )
-    result = revoke_from_logout_request(logout_request)
-    logger.info("CAS SLO %s revoke result: %s", endpoint, result)
-    return JSONResponse(
-        status_code=HTTPStatus.OK,
-        content={"message": "success", "data": result},
-    )
-
-
-async def _extract_logout_request(request: Request, logout_request: Optional[str] = None) -> str:
-    if logout_request:
-        return logout_request
-
-    query_logout_request = request.query_params.get("logoutRequest") or request.query_params.get("logout_request")
-    if query_logout_request:
-        return query_logout_request
-
-    body = await request.body()
-    raw_body = body.decode("utf-8") if body else ""
-    if not raw_body:
-        return ""
-
-    parsed = parse_qs(raw_body)
-    return (parsed.get("logoutRequest") or parsed.get("logout_request") or [raw_body])[0]
-
-
-def _renew_html(success: bool, reason: str = "") -> HTMLResponse:
-    status = "success" if success else "failed"
-    safe_reason = html.escape(reason)
-    return HTMLResponse(
-        status_code=HTTPStatus.OK,
-        content=f"""<!doctype html>
-<html><body><script>
-window.parent && window.parent.postMessage({{ type: "cas-renew-{status}", reason: "{safe_reason}" }}, window.location.origin);
-</script></body></html>""",
-    )
-
-
-def _require_cas_server_redirect(url: str) -> str:
-    parsed_url = urlsplit(url)
-    parsed_cas = urlsplit(CAS_SERVER_URL)
-    if (
-        parsed_url.scheme not in {"http", "https"}
-        or not parsed_url.netloc
-        or parsed_url.scheme != parsed_cas.scheme
-        or parsed_url.netloc != parsed_cas.netloc
-    ):
-        logger.warning("Blocked CAS redirect outside configured server: %s", url)
-        raise CasAuthenticationError("Invalid CAS redirect URL")
-    return url
diff --git a/backend/apps/config_app.py b/backend/apps/config_app.py
index a818ec7cb..8cb383df7 100644
--- a/backend/apps/config_app.py
+++ b/backend/apps/config_app.py
@@ -2,7 +2,6 @@
 
 from apps.app_factory import create_app
 from apps.agent_app import agent_config_router as agent_router
-from apps.agent_repository_app import agent_repository_router
 from apps.config_sync_app import router as config_sync_router
 from apps.datamate_app import router as datamate_router
 from apps.vectordatabase_app import router as vectordatabase_router
@@ -33,7 +32,6 @@
 from apps.monitoring_app import router as monitoring_router
 from apps.a2a_server_app import router as a2a_server_router
 from apps.haotian_app import router as haotian_router
-from apps.cas_app import router as cas_router
 from consts.const import IS_SPEED_MODE
 from services.prompt_template_service import sync_system_default_prompt_template
 
@@ -56,7 +54,6 @@ async def sync_default_prompt_template_on_startup():
 app.include_router(model_manager_router)
 app.include_router(config_sync_router)
 app.include_router(agent_router)
-app.include_router(agent_repository_router)
 app.include_router(vectordatabase_router)
 app.include_router(datamate_router)
 app.include_router(voice_router)
@@ -76,7 +73,6 @@ async def sync_default_prompt_template_on_startup():
     app.include_router(user_management_router)
 
 app.include_router(oauth_router)
-app.include_router(cas_router)
 
 app.include_router(summary_router)
 app.include_router(prompt_router)
diff --git a/backend/apps/northbound_app.py b/backend/apps/northbound_app.py
index 9f3b7e323..e6aff8e06 100644
--- a/backend/apps/northbound_app.py
+++ b/backend/apps/northbound_app.py
@@ -1,16 +1,14 @@
 import logging
 from http import HTTPStatus
 from typing import Optional, Dict, Any
-from urllib.parse import urlparse, unquote
-import re
+from urllib.parse import urlparse
 import uuid
 
 import httpx
-from fastapi import APIRouter, Body, File, Header, HTTPException, Query, Request, UploadFile
+from fastapi import APIRouter, Body, Header, Request, HTTPException, Query
 from fastapi.responses import JSONResponse, StreamingResponse
 
-from consts.exceptions import LimitExceededError, UnauthorizedError, ConversationNotFoundError
-from consts.model import ToolParamsRequest
+from consts.exceptions import LimitExceededError, UnauthorizedError
 from services.northbound_service import (
     NorthboundContext,
     get_conversation_history,
@@ -19,35 +17,16 @@
     stop_chat,
     get_agent_info_list,
     update_conversation_title,
-    upload_files_for_northbound,
 )
 
 from utils.auth_utils import validate_bearer_token, get_user_and_tenant_by_access_key
 
-from .file_management_app import build_content_disposition_header
-
 
 router = APIRouter(prefix="/nb/v1", tags=["northbound"])
 
 __all__ = ["router", "_get_northbound_context"]
 
 
-def _resolve_proxy_download_filename(presigned_url: str, content_disposition: str) -> str:
-    """Resolve a stable download filename for the northbound file proxy."""
-    if content_disposition:
-        filename_star_match = re.search(r"filename\*=UTF-8''([^;]+)", content_disposition)
-        if filename_star_match:
-            return unquote(filename_star_match.group(1)) or "download"
-
-        filename_match = re.search(r'filename="?([^";]+)"?', content_disposition)
-        if filename_match:
-            return filename_match.group(1) or "download"
-
-    path = unquote(urlparse(presigned_url).path)
-    filename = path.split("/")[-1].strip()
-    return filename or "download"
-
-
 async def _get_northbound_context(request: Request) -> NorthboundContext:
     """
     Build northbound context from request.
@@ -130,119 +109,13 @@ async def health_check():
     return {"status": "healthy", "service": "northbound-api"}
 
 
-@router.post(
-    "/chat/attachments/upload",
-    summary="Upload chat attachments for northbound runs",
-    description=(
-        "Upload one or more files for later use in `/nb/v1/chat/run`. "
-        "Successful uploads return reusable `s3_url` references."
-    ),
-)
-async def upload_chat_attachments(
-    request: Request,
-    files: list[UploadFile] = File(
-        ...,
-        description="List of files to upload",
-        examples=["report.pdf", "diagram.png"],
-    ),
-):
-    try:
-        ctx: NorthboundContext = await _get_northbound_context(request)
-        return JSONResponse(
-            status_code=HTTPStatus.OK,
-            content=await upload_files_for_northbound(ctx=ctx, files=files),
-        )
-    except LimitExceededError as e:
-        logging.error(f"Too Many Requests: rate limit exceeded: {str(e)}", exc_info=e)
-        raise HTTPException(status_code=HTTPStatus.TOO_MANY_REQUESTS,
-                            detail="Too Many Requests: rate limit exceeded")
-    except ValueError as e:
-        logging.error(f"Invalid northbound upload request: {str(e)}", exc_info=e)
-        raise HTTPException(status_code=HTTPStatus.BAD_REQUEST, detail=str(e))
-    except PermissionError as e:
-        logging.error(f"Permission denied while uploading northbound files: {str(e)}", exc_info=e)
-        raise HTTPException(status_code=HTTPStatus.FORBIDDEN, detail=str(e))
-    except HTTPException as e:
-        raise e
-    except Exception as e:
-        logging.error(f"Failed to upload northbound files: {str(e)}", exc_info=e)
-        raise HTTPException(
-            status_code=HTTPStatus.INTERNAL_SERVER_ERROR, detail="Internal Server Error")
-
-
-@router.post(
-    "/chat/run",
-    summary="Start a northbound chat run with optional attachments",
-    description=(
-        "Run a northbound chat request. Upload attachments first through "
-        "`/nb/v1/chat/attachments/upload`, then pass the returned `s3_url` values "
-        "through the `attachments` field."
-    ),
-)
+@router.post("/chat/run")
 async def run_chat(
     request: Request,
-    conversation_id: Optional[int] = Body(
-        None,
-        embed=True,
-        description="Existing conversation ID. Omit to create a new conversation.",
-        examples=[123],
-    ),
-    agent_name: str = Body(
-        ...,
-        embed=True,
-        description="Target agent name.",
-        examples=["general-assistant"],
-    ),
-    query: str = Body(
-        ...,
-        embed=True,
-        description="User input to send to the agent.",
-        examples=["Summarize the uploaded report and list the key risks."],
-    ),
-    attachments: Optional[list] = Body(
-        None,
-        embed=True,
-        description="Attachments for the chat. Can be either a list of S3 URL strings"
-                    "or a list of attachment objects with full metadata.",
-        examples=[["s3://nexent/attachments/user123/20260609_report.pdf"]],
-    ),
-    meta_data: Optional[Dict[str, Any]] = Body(
-        None,
-        embed=True,
-        description="Optional metadata passed through for audit and usage logging.",
-        examples=[{"source": "crm", "ticket_id": "INC-1001"}],
-    ),
-    tool_params: Optional[ToolParamsRequest] = Body(
-        None,
-        embed=True,
-        description="Optional request-scoped overrides for tool initialization parameters. "
-            "Overrides DB-persisted params (ag_tool_instance_t.params) on a per-run basis. "
-            "Conflict resolution: request value wins over DB value. "
-            "Structure: agents -> {agent_name} -> tools -> {tool_name} -> {param_name: param_value}. "
-            "tool_name matching: first by tool.name, then by tool.class_name. "
-            "Unknown param names cause a ValidationError (400). "
-            "Metadata-derived fields (e.g., vdb_core, embedding_model) are recalculated "
-            "from merged params for tools like KnowledgeBaseSearchTool, DifySearchTool, DataMateSearchTool.",
-        examples=[{
-            "agents": {
-                "common_sense_qa_assistant": {
-                    "tools": {
-                        "analyze_text_file": {
-                            "chunk_size": 4000,
-                            "summary_only": True,
-                            "prompt": "Please provide a concise summary of this document focusing on key facts."
-                        },
-                        "knowledge_base_search": {
-                            "top_k": 10,
-                            "rerank": True,
-                            "rerank_model_name": "gte-rerank-v2",
-                            "index_names": ["nexent-docs", "faq-index"]
-                        }
-                    }
-                }
-            }
-        }],
-    ),
+    conversation_id: Optional[int] = Body(None, embed=True),
+    agent_name: str = Body(..., embed=True),
+    query: str = Body(..., embed=True),
+    meta_data: Optional[Dict[str, Any]] = Body(None, embed=True),
     idempotency_key: Optional[str] = Header(None, alias="Idempotency-Key"),
 ):
     try:
@@ -252,21 +125,13 @@ async def run_chat(
             conversation_id=conversation_id,
             agent_name=agent_name,
             query=query,
-            attachments=attachments,
             meta_data=meta_data,
-            tool_params=tool_params,
             idempotency_key=idempotency_key,
         )
     except LimitExceededError as e:
         logging.error(f"Too Many Requests: rate limit exceeded: {str(e)}", exc_info=e)
         raise HTTPException(status_code=HTTPStatus.TOO_MANY_REQUESTS,
                             detail="Too Many Requests: rate limit exceeded")
-    except ValueError as e:
-        logging.error(f"Invalid northbound chat request: {str(e)}", exc_info=e)
-        raise HTTPException(status_code=HTTPStatus.BAD_REQUEST, detail=str(e))
-    except PermissionError as e:
-        logging.error(f"Permission denied while running northbound chat: {str(e)}", exc_info=e)
-        raise HTTPException(status_code=HTTPStatus.FORBIDDEN, detail=str(e))
     except HTTPException as e:
         raise e
     except Exception as e:
@@ -389,9 +254,6 @@ async def update_convs_title(
         logging.error(f"Too Many Requests: rate limit exceeded: {str(e)}", exc_info=e)
         raise HTTPException(status_code=HTTPStatus.TOO_MANY_REQUESTS,
                             detail="Too Many Requests: rate limit exceeded")
-    except ConversationNotFoundError as e:
-        logging.error(f"Conversation not found while updating title: {str(e)}", exc_info=e)
-        raise HTTPException(status_code=HTTPStatus.NOT_FOUND, detail=str(e))
     except HTTPException as e:
         raise e
     except Exception as e:
@@ -450,12 +312,12 @@ async def fetch_file_from_presigned_url(
 
         content_type = response.headers.get("Content-Type", "application/octet-stream")
         content_disposition = response.headers.get("Content-Disposition", "")
-        download_filename = _resolve_proxy_download_filename(presigned_url, content_disposition)
 
         headers = {
             "Content-Type": content_type,
-            "Content-Disposition": build_content_disposition_header(download_filename),
         }
+        if content_disposition:
+            headers["Content-Disposition"] = content_disposition
 
         return StreamingResponse(
             content=response.aiter_bytes(),
diff --git a/backend/apps/northbound_knowledge_app.py b/backend/apps/northbound_knowledge_app.py
index 02739d138..775d6c567 100644
--- a/backend/apps/northbound_knowledge_app.py
+++ b/backend/apps/northbound_knowledge_app.py
@@ -51,8 +51,7 @@ async def _require_asset_owner_context(request: Request) -> NorthboundContext:
 @router.get("/indices")
 async def get_list_indices(
     request: Request,
-    pattern: Annotated[str, Query(
-        description="Pattern to match index names")] = "*",
+    pattern: Annotated[str, Query(description="Pattern to match index names")] = "*",
 ):
     """List knowledge bases visible to the asset-owner tenant.
 
@@ -93,7 +92,7 @@ async def create_new_index(
         Optional[Dict[str, Any]],
         Body(
             description=(
-                "Request body with optional fields (ingroup_permission, group_ids, embedding_model_name, preserve_source_file)"
+                "Request body with optional fields (ingroup_permission, group_ids, embedding_model_name)"
             ),
         ),
     ] = None,
@@ -111,12 +110,10 @@ async def create_new_index(
         ingroup_permission = None
         group_ids = None
         embedding_model_name = None
-        preserve_source_file = None
         if body:
             ingroup_permission = body.get("ingroup_permission")
             group_ids = body.get("group_ids")
             embedding_model_name = body.get("embedding_model_name")
-            preserve_source_file = body.get("preserve_source_file")
 
         return ElasticSearchService.create_knowledge_base(
             knowledge_name=index_name,
@@ -127,7 +124,6 @@ async def create_new_index(
             ingroup_permission=ingroup_permission,
             group_ids=group_ids,
             embedding_model_name=embedding_model_name,
-            preserve_source_file=preserve_source_file,
         )
     except LimitExceededError as e:
         logger.exception("Rate limit exceeded while creating index")
@@ -226,65 +222,52 @@ async def delete_documents(
     request: Request,
     index_name: Annotated[str, Path(..., description="Name of the index")],
     path_or_url: Annotated[str, Query(..., description="Path or URL of documents to delete")],
-    scope: Annotated[
-        str,
-        Query(
-            description=(
-                "source_only: delete MinIO source only; "
-                "full: delete ES, MinIO, and Redis records"
-            ),
-        ),
-    ] = "full",
 ):
-    """Delete a document by scope. Restricted to asset administrators."""
+    """Delete documents by path or URL and clean up related Redis records.
+
+    Restricted to asset administrators (same auth as get_list_indices).
+    """
     try:
-        await _require_asset_owner_context(request)
+        ctx = await _require_asset_owner_context(request)
         vdb_core = get_vector_db_core(db_type=VectorDatabaseType.ELASTICSEARCH)
-        logger.debug(
-            "Deleting documents for index %s scope=%s", index_name, scope
-        )
-        result = await ElasticSearchService.delete_document_by_scope(
-            index_name, path_or_url, scope, vdb_core
-        )
+        logger.debug("Deleting documents for index %s", index_name)
+        result = ElasticSearchService.delete_documents(
+            index_name, path_or_url, vdb_core)
+
+        try:
+            redis_service = get_redis_service()
+            redis_cleanup_result = redis_service.delete_document_records(
+                index_name, path_or_url)
+
+            result["redis_cleanup"] = redis_cleanup_result
+
+            original_message = result.get(
+                "message", "Documents deleted successfully")
+            result["message"] = (
+                f"{original_message}. "
+                f"Cleaned up {redis_cleanup_result['total_deleted']} Redis records "
+                f"({redis_cleanup_result['celery_tasks_deleted']} tasks, "
+                f"{redis_cleanup_result['cache_keys_deleted']} cache keys)."
+            )
 
-        if scope == "full":
-            try:
-                redis_service = get_redis_service()
-                redis_cleanup_result = redis_service.delete_document_records(
-                    index_name, path_or_url
-                )
-                result["redis_cleanup"] = redis_cleanup_result
-                original_message = result.get(
-                    "message", "Documents deleted successfully"
-                )
-                result["message"] = (
-                    f"{original_message}. "
-                    f"Cleaned up {redis_cleanup_result['total_deleted']} Redis records "
-                    f"({redis_cleanup_result['celery_tasks_deleted']} tasks, "
-                    f"{redis_cleanup_result['cache_keys_deleted']} cache keys)."
-                )
-                if redis_cleanup_result.get("errors"):
-                    result["redis_warnings"] = redis_cleanup_result["errors"]
-            except Exception as redis_error:
-                logger.warning(
-                    "Redis cleanup failed for index %s: %s",
-                    index_name,
-                    redis_error,
-                )
-                result["redis_cleanup_error"] = str(redis_error)
-                original_message = result.get(
-                    "message", "Documents deleted successfully"
-                )
-                result["message"] = (
-                    f"{original_message}, but Redis cleanup encountered an error: "
-                    f"{str(redis_error)}"
-                )
+            if redis_cleanup_result.get("errors"):
+                result["redis_warnings"] = redis_cleanup_result["errors"]
+
+        except Exception as redis_error:
+            logger.warning(
+                "Redis cleanup failed for index %s: %s",
+                index_name,
+                redis_error,
+            )
+            result["redis_cleanup_error"] = str(redis_error)
+            original_message = result.get(
+                "message", "Documents deleted successfully")
+            result["message"] = (
+                f"{original_message}, but Redis cleanup encountered an error: "
+                f"{str(redis_error)}"
+            )
 
         return result
-    except ValueError as exc:
-        raise HTTPException(
-            status_code=HTTPStatus.BAD_REQUEST, detail=str(exc)
-        )
     except LimitExceededError as e:
         logger.exception("Rate limit exceeded while deleting documents")
         raise HTTPException(
diff --git a/backend/apps/prompt_app.py b/backend/apps/prompt_app.py
index 6b82a5c82..987729e69 100644
--- a/backend/apps/prompt_app.py
+++ b/backend/apps/prompt_app.py
@@ -4,19 +4,11 @@
 from fastapi import APIRouter, Header, Request
 from fastapi.responses import JSONResponse, StreamingResponse
 
-from consts.model import (
-    GeneratePromptRequest,
-    OptimizePromptSectionRequest,
-    OptimizePromptBadCaseRequest,
-    OptimizePromptFromDebugRequest,
-)
+from consts.model import GeneratePromptRequest, OptimizePromptSectionRequest
 from services.prompt_service import (
     gen_system_prompt_streamable,
-    OptimizeRequest,
-    OptimizeResult,
-    PromptOptimizationService,
+    optimize_prompt_section_impl,
 )
-from adapters.exception import NexentCapabilityError
 from utils.auth_utils import get_current_user_info
 
 router = APIRouter(prefix="/prompt")
@@ -56,140 +48,30 @@ async def optimize_prompt_section_api(
         http_request: Request,
         authorization: Optional[str] = Header(None)
 ):
-    _, tenant_id, language = get_current_user_info(
-        authorization, http_request)
-
-    service = PromptOptimizationService(
-        model_id=optimize_request.model_id,
-        tenant_id=tenant_id,
-        language=language,
-    )
-
-    try:
-        result = service.optimize(
-            OptimizeRequest(
-                agent_id=optimize_request.agent_id,
-                model_id=optimize_request.model_id,
-                task_description=optimize_request.task_description,
-                section_type=optimize_request.section_type,
-                section_title=optimize_request.section_title,
-                current_content=optimize_request.current_content,
-                feedback=optimize_request.feedback,
-                mode=optimize_request.mode,
-                start_pos=optimize_request.start_pos,
-                end_pos=optimize_request.end_pos,
-                tool_ids=optimize_request.tool_ids,
-                sub_agent_ids=optimize_request.sub_agent_ids,
-                knowledge_base_display_names=optimize_request.knowledge_base_display_names,
-            )
-        )
-        return JSONResponse(
-            status_code=HTTPStatus.OK,
-            content={
-                "message": "Success",
-                "data": {
-                    "optimized_content": result.optimized_content,
-                    "section_type": result.section_type,
-                    "section_title": result.section_title,
-                    "original_content": result.original_content,
-                }
-            },
-            headers={"X-Prompt-Source": result.source},
-        )
-    except NexentCapabilityError as e:
-        return JSONResponse(
-            status_code=HTTPStatus.BAD_REQUEST,
-            content={"message": str(e)},
-        )
-    except Exception as exc:
-        logger.exception(f"Error occurred while optimizing prompt section: {exc}")
-        raise
-
-
-@router.post("/optimize/badcase")
-async def optimize_prompt_badcase_api(
-        badcase_request: OptimizePromptBadCaseRequest,
-        http_request: Request,
-        authorization: Optional[str] = Header(None)
-):
-    _, tenant_id, language = get_current_user_info(
-        authorization, http_request)
-
-    service = PromptOptimizationService(
-        model_id=badcase_request.model_id,
-        tenant_id=tenant_id,
-        language=language,
-    )
-
-    try:
-        result = service.optimize_badcase(
-            current_content=badcase_request.current_content,
-            bad_cases=badcase_request.bad_cases,
-            agent_id=badcase_request.agent_id,
-            section_type=badcase_request.section_type,
-            section_title=badcase_request.section_title,
-            tool_ids=badcase_request.tool_ids,
-            sub_agent_ids=badcase_request.sub_agent_ids,
-            knowledge_base_display_names=badcase_request.knowledge_base_display_names,
-        )
-        return JSONResponse(
-            status_code=HTTPStatus.OK,
-            content={
-                "message": "Success",
-                "data": {
-                    "optimized_content": result.optimized_content,
-                    "section_type": result.section_type,
-                    "section_title": result.section_title,
-                    "original_content": result.original_content,
-                }
-            },
-            headers={"X-Prompt-Source": result.source},
-        )
-    except NexentCapabilityError as e:
-        return JSONResponse(
-            status_code=HTTPStatus.BAD_REQUEST,
-            content={"message": str(e)},
-        )
-
-
-@router.post("/optimize/from_debug")
-async def optimize_prompt_from_debug_api(
-        optimize_request: OptimizePromptFromDebugRequest,
-        http_request: Request,
-        authorization: Optional[str] = Header(None)
-):
-    _, tenant_id, language = get_current_user_info(
-        authorization, http_request)
-
-    service = PromptOptimizationService(
-        model_id=optimize_request.model_id,
-        tenant_id=tenant_id,
-        language=language,
-    )
-
     try:
-        result = service.optimize_from_debug(
+        _, tenant_id, language = get_current_user_info(
+            authorization, http_request)
+        optimized_section = optimize_prompt_section_impl(
             agent_id=optimize_request.agent_id,
+            model_id=optimize_request.model_id,
+            task_description=optimize_request.task_description,
+            tenant_id=tenant_id,
+            language=language,
+            section_type=optimize_request.section_type,
+            section_title=optimize_request.section_title,
+            current_content=optimize_request.current_content,
             feedback=optimize_request.feedback,
-            selected=optimize_request.selected,
-            history=optimize_request.history,
+            tool_ids=optimize_request.tool_ids,
+            sub_agent_ids=optimize_request.sub_agent_ids,
+            knowledge_base_display_names=optimize_request.knowledge_base_display_names,
         )
         return JSONResponse(
             status_code=HTTPStatus.OK,
             content={
-                "message": "Success",
-                "data": {
-                    "original_full_prompt": result.original_content,
-                    "optimized_full_prompt": result.optimized_content,
-                }
-            },
-            headers={"X-Prompt-Source": result.source},
-        )
-    except NexentCapabilityError as e:
-        return JSONResponse(
-            status_code=HTTPStatus.BAD_REQUEST,
-            content={"message": str(e)},
+                "message": "Prompt section optimized successfully",
+                "data": optimized_section,
+            }
         )
     except Exception as exc:
-        logger.exception(f"Error occurred while optimizing prompt from debug: {exc}")
+        logger.exception(f"Error occurred while optimizing prompt section: {exc}")
         raise
diff --git a/backend/apps/tool_config_app.py b/backend/apps/tool_config_app.py
index bfc8d5ca0..f0b7f9304 100644
--- a/backend/apps/tool_config_app.py
+++ b/backend/apps/tool_config_app.py
@@ -160,14 +160,12 @@ async def import_openapi_service_api(
         server_url: Base URL of the REST API server
         openapi_json: Complete OpenAPI JSON specification
         service_description: Optional service description
-        headers_template: Optional default headers template
         force_update: If True, replace all existing tools for this service
     """
     service_name = openapi_service_request.get("service_name")
     server_url = openapi_service_request.get("server_url")
     openapi_json = openapi_service_request.get("openapi_json")
     service_description = openapi_service_request.get("service_description")
-    headers_template = openapi_service_request.get("headers_template")
     force_update = openapi_service_request.get("force_update", False)
 
     if not service_name:
@@ -194,7 +192,6 @@ async def import_openapi_service_api(
             tenant_id=tenant_id,
             user_id=user_id,
             service_description=service_description,
-            headers_template=headers_template,
             force_update=force_update
         )
 
diff --git a/backend/apps/user_management_app.py b/backend/apps/user_management_app.py
index e79fde887..edbcdf27d 100644
--- a/backend/apps/user_management_app.py
+++ b/backend/apps/user_management_app.py
@@ -19,13 +19,12 @@
     ValidationError,
 )
 from consts.error_code import ErrorCode
-from services.cas_service import build_logout_url, CasAuthenticationError
 from services.user_management_service import get_authorized_client, validate_token, \
     check_auth_service_health, signup_user_with_invitation, signin_user, refresh_user_token, \
     get_session_by_authorization, get_user_info, create_token, list_tokens_by_user, delete_token, \
     update_password
 from services.user_service import delete_user_and_cleanup
-from utils.auth_utils import get_current_user_id, extract_session_id_from_authorization
+from utils.auth_utils import get_current_user_id
 
 
 load_dotenv()
@@ -151,18 +150,7 @@ async def logout(request: Request):
     authorization = request.headers.get("Authorization")
     try:
         # Make logout idempotent: if no token or token expired, still return success
-        session_id = None
-        cas_logout_url = ""
         if authorization:
-            session_id = extract_session_id_from_authorization(authorization)
-            if session_id:
-                from database.cas_session_db import revoke_cas_session_by_session_id
-
-                revoke_cas_session_by_session_id(session_id, actor="user")
-                try:
-                    cas_logout_url = build_logout_url()
-                except CasAuthenticationError as cas_err:
-                    logging.warning(f"CAS logout URL is unavailable: {str(cas_err)}")
             client = get_authorized_client(authorization)
             try:
                 client.auth.sign_out()
@@ -171,12 +159,7 @@ async def logout(request: Request):
                 logging.warning(
                     f"Sign out encountered an error but will be ignored: {str(signout_err)}")
         return JSONResponse(status_code=HTTPStatus.OK,
-                            content={
-                                "message": "Logout successful",
-                                "data": {
-                                    "cas_logout_url": cas_logout_url
-                                }
-                            })
+                            content={"message": "Logout successful"})
 
     except Exception as e:
         logging.error(f"User logout failed: {str(e)}")
@@ -231,10 +214,6 @@ async def get_user_information(request: Request):
         if not user_info:
             raise UnauthorizedError("User information not found")
 
-        user_info["user"]["auth_provider"] = (
-            "cas" if extract_session_id_from_authorization(authorization) else "local"
-        )
-
         return JSONResponse(status_code=HTTPStatus.OK,
                             content={"message": "Success",
                                      "data": user_info})
diff --git a/backend/apps/vectordatabase_app.py b/backend/apps/vectordatabase_app.py
index 505c39559..118537766 100644
--- a/backend/apps/vectordatabase_app.py
+++ b/backend/apps/vectordatabase_app.py
@@ -76,7 +76,7 @@ def create_new_index(
         embedding_dim: Optional[int] = Query(
             None, description="Dimension of the embedding vectors"),
         request: Dict[str, Any] = Body(
-            None, description="Request body with optional fields (ingroup_permission, group_ids, embedding_model_name, preserve_source_file)"),
+            None, description="Request body with optional fields (ingroup_permission, group_ids, embedding_model_name)"),
         vdb_core: VectorDatabaseCore = Depends(get_vector_db_core),
         authorization: Optional[str] = Header(None)
 ):
@@ -89,13 +89,11 @@ def create_new_index(
         group_ids = None
         embedding_model_name: Optional[str] = None
         is_multimodal: Optional[bool] = None
-        preserve_source_file: Optional[bool] = None
         if request:
             ingroup_permission = request.get("ingroup_permission")
             group_ids = request.get("group_ids")
             embedding_model_name = request.get("embeddingModel")
             is_multimodal = request.get("is_multimodal")
-            preserve_source_file = request.get("preserve_source_file")
 
         # Treat path parameter as user-facing knowledge base name for new creations
         return ElasticSearchService.create_knowledge_base(
@@ -108,7 +106,6 @@ def create_new_index(
             group_ids=group_ids,
             embedding_model_name=embedding_model_name,
             is_multimodal=is_multimodal,
-            preserve_source_file=preserve_source_file,
         )
     except Exception as e:
         raise HTTPException(
@@ -508,70 +505,54 @@ async def get_index_files(
 
 
 @router.delete("/{index_name}/documents")
-async def delete_documents(
+def delete_documents(
         index_name: str = Path(..., description="Name of the index"),
         path_or_url: str = Query(...,
                                  description="Path or URL of documents to delete"),
-        scope: str = Query(
-            "full",
-            description=(
-                "source_only: delete MinIO source only, keep ES chunks/vectors; "
-                "full: delete ES documents, MinIO source, and Redis task records"
-            ),
-        ),
         vdb_core: VectorDatabaseCore = Depends(get_vector_db_core)
 ):
-    """Delete a document by scope: source file only or full removal from the index."""
+    """Delete documents by path or URL and clean up related Redis records"""
     try:
-        result = await ElasticSearchService.delete_document_by_scope(
-            index_name, path_or_url, scope, vdb_core
-        )
+        # First delete the documents using existing service
+        result = ElasticSearchService.delete_documents(
+            index_name, path_or_url, vdb_core)
+
+        # Then clean up Redis records related to this specific document
+        try:
+            redis_service = get_redis_service()
+            redis_cleanup_result = redis_service.delete_document_records(
+                index_name, path_or_url)
+
+            # Add Redis cleanup info to the result
+            result["redis_cleanup"] = redis_cleanup_result
+
+            # Update the message to include Redis cleanup info
+            original_message = result.get(
+                "message", "Documents deleted successfully")
+            result["message"] = (
+                f"{original_message}. "
+                f"Cleaned up {redis_cleanup_result['total_deleted']} Redis records "
+                f"({redis_cleanup_result['celery_tasks_deleted']} tasks, "
+                f"{redis_cleanup_result['cache_keys_deleted']} cache keys)."
+            )
 
-        if scope == "full":
-            try:
-                redis_service = get_redis_service()
-                redis_cleanup_result = redis_service.delete_document_records(
-                    index_name, path_or_url
-                )
-                result["redis_cleanup"] = redis_cleanup_result
-                original_message = result.get(
-                    "message", "Documents deleted successfully"
-                )
-                result["message"] = (
-                    f"{original_message}. "
-                    f"Cleaned up {redis_cleanup_result['total_deleted']} Redis records "
-                    f"({redis_cleanup_result['celery_tasks_deleted']} tasks, "
-                    f"{redis_cleanup_result['cache_keys_deleted']} cache keys)."
-                )
-                if redis_cleanup_result.get("errors"):
-                    result["redis_warnings"] = redis_cleanup_result["errors"]
-            except Exception as redis_error:
-                logger.warning(
-                    "Redis cleanup failed for document %s in index %s: %s",
-                    path_or_url,
-                    index_name,
-                    redis_error,
-                )
-                result["redis_cleanup_error"] = str(redis_error)
-                original_message = result.get(
-                    "message", "Documents deleted successfully"
-                )
-                result["message"] = (
-                    f"{original_message}, but Redis cleanup encountered an error: "
-                    f"{str(redis_error)}"
-                )
+            if redis_cleanup_result.get("errors"):
+                result["redis_warnings"] = redis_cleanup_result["errors"]
+
+        except Exception as redis_error:
+            logger.warning(
+                f"Redis cleanup failed for document {path_or_url} in index {index_name}: {str(redis_error)}")
+            result["redis_cleanup_error"] = str(redis_error)
+            original_message = result.get(
+                "message", "Documents deleted successfully")
+            result[
+                "message"] = f"{original_message}, but Redis cleanup encountered an error: {str(redis_error)}"
 
         return result
 
-    except ValueError as exc:
-        raise HTTPException(
-            status_code=HTTPStatus.BAD_REQUEST, detail=str(exc)
-        )
     except Exception as e:
         raise HTTPException(
-            status_code=HTTPStatus.INTERNAL_SERVER_ERROR,
-            detail=f"Error delete indexing documents: {e}",
-        )
+            status_code=HTTPStatus.INTERNAL_SERVER_ERROR, detail=f"Error delete indexing documents: {e}")
 
 
 @router.get("/{index_name}/documents/{path_or_url:path}/error-info")
diff --git a/backend/consts/const.py b/backend/consts/const.py
index 574d550c0..ac2196c2a 100644
--- a/backend/consts/const.py
+++ b/backend/consts/const.py
@@ -90,31 +90,6 @@ class VectorDatabaseType(str, Enum):
 OAUTH_CA_BUNDLE = os.getenv("OAUTH_CA_BUNDLE", "")
 
 
-# CAS SSO Configuration
-CAS_ENABLED = os.getenv("CAS_ENABLED", "false").lower() in ("true", "1", "yes", "on")
-CAS_SERVER_URL = os.getenv("CAS_SERVER_URL", "").rstrip("/")
-CAS_VALIDATE_PATH = os.getenv("CAS_VALIDATE_PATH", "/p3/serviceValidate")
-CAS_CALLBACK_BASE_URL = os.getenv("CAS_CALLBACK_BASE_URL", OAUTH_CALLBACK_BASE_URL).rstrip("/")
-# CAS login mode:
-# - disabled: disable CAS login entry and automatic CAS redirects.
-# - button: show CAS as an optional login entry.
-# - force: automatically redirect unauthenticated users to CAS login.
-CAS_LOGIN_MODE = os.getenv("CAS_LOGIN_MODE", "disabled").lower()
-CAS_USER_ATTRIBUTE = os.getenv("CAS_USER_ATTRIBUTE", "")
-CAS_EMAIL_ATTRIBUTE = os.getenv("CAS_EMAIL_ATTRIBUTE", "email")
-CAS_ROLE_ATTRIBUTE = os.getenv("CAS_ROLE_ATTRIBUTE", "role")
-CAS_TENANT_ATTRIBUTE = os.getenv("CAS_TENANT_ATTRIBUTE", "tenant_id")
-CAS_ROLE_MAP_JSON = os.getenv("CAS_ROLE_MAP_JSON", "")
-CAS_SESSION_MAX_AGE_SECONDS = int(os.getenv("CAS_SESSION_MAX_AGE_SECONDS", "3600") or 3600)
-LOCAL_SESSION_MAX_AGE_SECONDS = int(os.getenv("LOCAL_SESSION_MAX_AGE_SECONDS", "3600") or 3600)
-CAS_RENEW_BEFORE_SECONDS = int(os.getenv("CAS_RENEW_BEFORE_SECONDS", "300") or 300)
-CAS_RENEW_TIMEOUT_SECONDS = int(os.getenv("CAS_RENEW_TIMEOUT_SECONDS", "10") or 10)
-CAS_SYNTHETIC_EMAIL_DOMAIN = os.getenv("CAS_SYNTHETIC_EMAIL_DOMAIN", "cas.local")
-CAS_LOGOUT_URL = os.getenv("CAS_LOGOUT_URL", "")
-CAS_SSL_VERIFY = os.getenv("CAS_SSL_VERIFY", "true").lower() == "true"
-CAS_CA_BUNDLE = os.getenv("CAS_CA_BUNDLE", "")
-
-
 # ===== To be migrated to frontend configuration =====
 # Email Configuration
 IMAP_SERVER = os.getenv('IMAP_SERVER')
@@ -233,7 +208,6 @@ class VectorDatabaseType(str, Enum):
     "NEXENT_MCP_DOCKER_IMAGE", "nexent/nexent-mcp:latest")
 ENABLE_UPLOAD_IMAGE = os.getenv(
     "ENABLE_UPLOAD_IMAGE", "false").lower() == "true"
-ENABLE_JIUWEN_SDK = os.getenv("NEXENT_ENABLE_JIUWEN_SDK", "true").lower() == "true"
 
 
 # Celery Configuration
@@ -401,47 +375,36 @@ class VectorDatabaseType(str, Enum):
 OTEL_SERVICE_NAME = OTEL_SERVICE_NAME_RAW or "nexent-backend"
 OTEL_EXPORTER_OTLP_ENDPOINT_RAW = os.getenv("OTEL_EXPORTER_OTLP_ENDPOINT")
 OTEL_EXPORTER_OTLP_ENDPOINT = OTEL_EXPORTER_OTLP_ENDPOINT_RAW or "http://localhost:4318"
-OTEL_EXPORTER_OTLP_TRACES_ENDPOINT = os.getenv(
-    "OTEL_EXPORTER_OTLP_TRACES_ENDPOINT", "")
-OTEL_EXPORTER_OTLP_METRICS_ENDPOINT = os.getenv(
-    "OTEL_EXPORTER_OTLP_METRICS_ENDPOINT", "")
+OTEL_EXPORTER_OTLP_TRACES_ENDPOINT = os.getenv("OTEL_EXPORTER_OTLP_TRACES_ENDPOINT", "")
+OTEL_EXPORTER_OTLP_METRICS_ENDPOINT = os.getenv("OTEL_EXPORTER_OTLP_METRICS_ENDPOINT", "")
 OTEL_EXPORTER_OTLP_PROTOCOL_RAW = os.getenv("OTEL_EXPORTER_OTLP_PROTOCOL")
 OTEL_EXPORTER_OTLP_PROTOCOL = OTEL_EXPORTER_OTLP_PROTOCOL_RAW or "http"
 OTEL_EXPORTER_OTLP_HEADERS_RAW = os.getenv("OTEL_EXPORTER_OTLP_HEADERS")
 OTEL_EXPORTER_OTLP_HEADERS = OTEL_EXPORTER_OTLP_HEADERS_RAW or ""
-OTEL_EXPORTER_OTLP_AUTHORIZATION = os.getenv(
-    "OTEL_EXPORTER_OTLP_AUTHORIZATION", "")
+OTEL_EXPORTER_OTLP_AUTHORIZATION = os.getenv("OTEL_EXPORTER_OTLP_AUTHORIZATION", "")
 OTEL_EXPORTER_OTLP_X_API_KEY = os.getenv("OTEL_EXPORTER_OTLP_X_API_KEY", "")
 OTEL_EXPORTER_OTLP_LANGFUSE_INGESTION_VERSION = os.getenv(
     "OTEL_EXPORTER_OTLP_LANGFUSE_INGESTION_VERSION", "")
 LANGSMITH_API_KEY = os.getenv("LANGSMITH_API_KEY", "")
 LANGSMITH_PROJECT = os.getenv("LANGSMITH_PROJECT", "")
-OTEL_EXPORTER_OTLP_METRICS_ENABLED_RAW = os.getenv(
-    "OTEL_EXPORTER_OTLP_METRICS_ENABLED")
+OTEL_EXPORTER_OTLP_METRICS_ENABLED_RAW = os.getenv("OTEL_EXPORTER_OTLP_METRICS_ENABLED")
 OTEL_EXPORTER_OTLP_METRICS_ENABLED = (
     OTEL_EXPORTER_OTLP_METRICS_ENABLED_RAW or "true").lower() == "true"
-MONITORING_INSTRUMENT_REQUESTS_RAW = os.getenv(
-    "MONITORING_INSTRUMENT_REQUESTS")
+MONITORING_INSTRUMENT_REQUESTS_RAW = os.getenv("MONITORING_INSTRUMENT_REQUESTS")
 MONITORING_INSTRUMENT_REQUESTS = (
     MONITORING_INSTRUMENT_REQUESTS_RAW or "false").lower() == "true"
-MONITORING_FASTAPI_INCLUDED_URLS = os.getenv(
-    "MONITORING_FASTAPI_INCLUDED_URLS", "")
-MONITORING_FASTAPI_EXCLUDED_URLS = os.getenv(
-    "MONITORING_FASTAPI_EXCLUDED_URLS", "")
-MONITORING_FASTAPI_EXCLUDE_SPANS = os.getenv(
-    "MONITORING_FASTAPI_EXCLUDE_SPANS", "receive,send")
+MONITORING_FASTAPI_INCLUDED_URLS = os.getenv("MONITORING_FASTAPI_INCLUDED_URLS", "")
+MONITORING_FASTAPI_EXCLUDED_URLS = os.getenv("MONITORING_FASTAPI_EXCLUDED_URLS", "")
+MONITORING_FASTAPI_EXCLUDE_SPANS = os.getenv("MONITORING_FASTAPI_EXCLUDE_SPANS", "receive,send")
 MONITORING_PROJECT_NAME = os.getenv("MONITORING_PROJECT_NAME", "")
 MONITORING_DASHBOARD_URL = os.getenv("MONITORING_DASHBOARD_URL", "")
-MONITORING_TRACE_CONTENT_MODE = os.getenv(
-    "MONITORING_TRACE_CONTENT_MODE", "summary")
+MONITORING_TRACE_CONTENT_MODE = os.getenv("MONITORING_TRACE_CONTENT_MODE", "summary")
 MONITORING_TRACE_MAX_CHARS = os.getenv("MONITORING_TRACE_MAX_CHARS", "4000")
 MONITORING_TRACE_MAX_ITEMS = os.getenv("MONITORING_TRACE_MAX_ITEMS", "20")
 TELEMETRY_SAMPLE_RATE_RAW = os.getenv("TELEMETRY_SAMPLE_RATE")
 TELEMETRY_SAMPLE_RATE = float(TELEMETRY_SAMPLE_RATE_RAW or "1.0")
 
 # Parse OTLP headers into dict format
-
-
 def _parse_otlp_headers(headers_str: str) -> dict:
     """Parse OTLP headers string into dict. Format: 'key1=value1,key2=value2'"""
     if not headers_str:
@@ -453,7 +416,6 @@ def _parse_otlp_headers(headers_str: str) -> dict:
             headers[key.strip()] = value.strip()
     return headers
 
-
 OTLP_HEADERS = _parse_otlp_headers(OTEL_EXPORTER_OTLP_HEADERS)
 if OTEL_EXPORTER_OTLP_AUTHORIZATION:
     OTLP_HEADERS["Authorization"] = OTEL_EXPORTER_OTLP_AUTHORIZATION
@@ -486,7 +448,7 @@ def _parse_otlp_headers(headers_str: str) -> dict:
 
 
 # APP Version
-APP_VERSION = "v2.2.1"
+APP_VERSION = "v2.2.0"
 
 
 # Skill Creation Streaming Configuration
diff --git a/backend/consts/model.py b/backend/consts/model.py
index 00e5b8a0a..6969999fe 100644
--- a/backend/consts/model.py
+++ b/backend/consts/model.py
@@ -1,8 +1,8 @@
 from enum import Enum
-from typing import Optional, Any, List, Dict, Literal
+from typing import Optional, Any, List, Dict
 
 from pydantic import BaseModel, Field, EmailStr, ConfigDict, field_validator
-from nexent.core.agents.agent_model import AgentVerificationConfig, ToolConfig
+from nexent.core.agents.agent_model import ToolConfig
 
 from consts.prompt_template import PROMPT_GENERATE_TEMPLATE_FIELD_ALIAS_MAP
 
@@ -230,24 +230,6 @@ class HistoryItem(BaseModel):
     minio_files: Optional[List[Dict[str, Any]]] = None
 
 
-class AgentToolParamsRequest(BaseModel):
-    """Request-scoped tool parameter overrides for a single agent."""
-
-    tools: Dict[str, Dict[str, Any]] = Field(
-        default_factory=dict,
-        description="Mapping from tool identifier to request-scoped override params",
-    )
-
-
-class ToolParamsRequest(BaseModel):
-    """Request-scoped tool parameter overrides for main and managed agents."""
-
-    agents: Dict[str, AgentToolParamsRequest] = Field(
-        default_factory=dict,
-        description="Mapping from agent identifier to tool parameter overrides",
-    )
-
-
 class AgentRequest(BaseModel):
     query: str
     conversation_id: Optional[int] = None
@@ -258,7 +240,6 @@ class AgentRequest(BaseModel):
     model_id: Optional[int] = None
     version_no: Optional[int] = None
     is_debug: Optional[bool] = False
-    tool_params: Optional[ToolParamsRequest] = None
 
 
 class MessageUnit(BaseModel):
@@ -433,9 +414,6 @@ class OptimizePromptSectionRequest(BaseModel):
     section_title: str
     current_content: str
     feedback: str
-    mode: Literal["general", "insert", "select"] = "general"
-    start_pos: Optional[int] = Field(None, description="Start position for insert/select mode")
-    end_pos: Optional[int] = Field(None, description="End position for insert/select mode")
     tool_ids: Optional[List[int]] = Field(
         None, description="Optional: tool IDs from frontend (takes precedence over database query)")
     sub_agent_ids: Optional[List[int]] = Field(
@@ -444,38 +422,6 @@ class OptimizePromptSectionRequest(BaseModel):
         None, description="Optional: knowledge base display names from frontend (takes precedence over database query)")
 
 
-class BadCaseItem(BaseModel):
-    question: str
-    answer: str
-    label: Optional[str] = None
-    reason: Optional[str] = None
-
-
-class OptimizePromptBadCaseRequest(BaseModel):
-    agent_id: int
-    model_id: int
-    current_content: str
-    bad_cases: List[BadCaseItem]
-    section_type: str
-    section_title: str
-    tool_ids: Optional[List[int]] = Field(None)
-    sub_agent_ids: Optional[List[int]] = Field(None)
-    knowledge_base_display_names: Optional[List[str]] = Field(None)
-
-
-class OptimizeFromDebugSelected(BaseModel):
-    user_question: str
-    assistant_answer: str
-
-
-class OptimizePromptFromDebugRequest(BaseModel):
-    agent_id: int
-    model_id: int
-    feedback: str
-    selected: OptimizeFromDebugSelected
-    history: Optional[List[HistoryItem]] = None
-
-
 class GenerateTitleRequest(BaseModel):
     conversation_id: int
     question: str
@@ -508,18 +454,8 @@ class AgentInfoRequest(BaseModel):
     group_ids: Optional[List[int]] = None
     ingroup_permission: Optional[str] = None
     enable_context_manager: Optional[bool] = None
-    verification_config: Optional[Dict[str, Any]] = None
-    greeting_message: Optional[str] = None
-    example_questions: Optional[List[str]] = None
     version_no: int = 0
 
-    @field_validator("verification_config", mode="before")
-    @classmethod
-    def normalize_verification_config(cls, value):
-        if value is None:
-            return None
-        return AgentVerificationConfig.model_validate(value).model_dump()
-
 
 class AgentIDRequest(BaseModel):
     agent_id: int
@@ -584,7 +520,6 @@ class MessageIdRequest(BaseModel):
 
 class ExportAndImportAgentInfo(BaseModel):
     agent_id: int
-    tenant_id: Optional[str] = None
     name: str
     display_name: Optional[str] = None
     description: str
@@ -592,7 +527,6 @@ class ExportAndImportAgentInfo(BaseModel):
     author: Optional[str] = None
     max_steps: int
     provide_run_summary: bool
-    verification_config: Optional[Dict[str, Any]] = None
     duty_prompt: Optional[str] = None
     constraint_prompt: Optional[str] = None
     few_shots_prompt: Optional[str] = None
@@ -622,11 +556,6 @@ class ExportAndImportDataFormat(BaseModel):
     mcp_info: List[MCPInfo]
 
 
-class AgentRepositorySnapshot(ExportAndImportDataFormat):
-    """Frozen marketplace snapshot: export format plus optional skill ZIP payloads."""
-    skills: Optional[List["SkillZipEntry"]] = None
-
-
 class SkillZipEntry(BaseModel):
     """A skill bundled inside an agent export ZIP."""
     skill_name: str
diff --git a/backend/data_process/tasks.py b/backend/data_process/tasks.py
index 4dd6edd69..f2a30f9b7 100644
--- a/backend/data_process/tasks.py
+++ b/backend/data_process/tasks.py
@@ -8,11 +8,9 @@
 import os
 import threading
 import time
-from dataclasses import dataclass
 from typing import Any, Dict, Optional, List, Tuple
 
 import aiohttp
-import requests
 import re
 import ray
 from celery import Task, chain, states, group, chord
@@ -21,7 +19,6 @@
 
 from utils.file_management_utils import get_file_size
 from database.attachment_db import get_file_stream
-from database.knowledge_db import get_knowledge_record
 from services.redis_service import get_redis_service
 from .app import app
 from .ray_actors import DataProcessorRayActor
@@ -46,12 +43,10 @@
 
 
 logger = logging.getLogger("data_process.tasks")
-ASYNC_SPLIT_RETRY_MAX = max(
-    FORWARD_REDIS_RETRY_MAX * 5, FORWARD_REDIS_RETRY_MAX)
+ASYNC_SPLIT_RETRY_MAX = max(FORWARD_REDIS_RETRY_MAX * 5, FORWARD_REDIS_RETRY_MAX)
 FORWARD_ES_CHUNK_BATCH_SIZE = 64
 IMAGE_METADATA_PROCESS_SOURCE = "UniversalImageExtractor"
 
-
 def _wait_for_split_ready(redis_key: str, timeout_s: int, poll_interval_ms: int) -> int:
     """
     Wait until async split aggregation is marked ready in Redis.
@@ -96,8 +91,7 @@ def _estimate_parallel_parts() -> int:
 def _compute_split_wait_timeout(parts_count: int) -> int:
     base_timeout = DP_REDIS_CHUNKS_WAIT_TIMEOUT_S
     waves = math.ceil(max(1, parts_count) / _estimate_parallel_parts())
-    dynamic_timeout = base_timeout + \
-        max(0, waves - 1) * max(1, PER_WAVE_TIMEOUT)
+    dynamic_timeout = base_timeout + max(0, waves - 1) * max(1, PER_WAVE_TIMEOUT)
     return min(MAX_TIMEOUT, max(base_timeout, dynamic_timeout))
 
 
@@ -184,6 +178,7 @@ def _build_balanced_batches(
     return batches
 
 
+
 # Thread lock for initializing Ray to prevent race conditions
 ray_init_lock = threading.Lock()
 
@@ -332,35 +327,6 @@ def run_in_thread():
         raise
 
 
-def _delete_source_file_via_http_sync(
-    *,
-    base_url: str,
-    index_name: str,
-    path_or_url: str,
-    scope: str,
-    timeout_s: float = 30.0,
-) -> Dict[str, Any]:
-    base = (base_url or "").rstrip("/")
-    if not base:
-        raise RuntimeError("ELASTICSEARCH_SERVICE is not configured")
-    url = f"{base}/indices/{index_name}/documents"
-    params = {"path_or_url": path_or_url, "scope": scope}
-
-    resp = requests.delete(url, params=params, timeout=timeout_s)
-    body_text = getattr(resp, "text", "")
-    parsed = None
-    try:
-        parsed = resp.json()
-    except Exception:
-        parsed = _parse_json_or_none(body_text) if body_text else None
-
-    return {
-        "http_status": getattr(resp, "status_code", None),
-        "response_json": parsed if isinstance(parsed, dict) else None,
-        "response_text": body_text if not isinstance(parsed, dict) else None,
-    }
-
-
 def _build_forward_error(
     message: str,
     index_name: str,
@@ -384,206 +350,6 @@ def _parse_json_or_none(text: str) -> Optional[Dict[str, Any]]:
         return None
 
 
-@dataclass(frozen=True)
-class _ForwardContext:
-    task_id: str
-    request_id: str
-    start_time: float
-    source: str
-    index_name: str
-    source_type: str
-    original_filename: Optional[str]
-
-
-def _init_forward_context(
-    *,
-    task_id: str,
-    request_id: str,
-    start_time: float,
-    source: str,
-    index_name: str,
-    source_type: str,
-    original_filename: Optional[str],
-) -> _ForwardContext:
-    return _ForwardContext(
-        task_id=task_id,
-        request_id=request_id,
-        start_time=start_time,
-        source=source,
-        index_name=index_name,
-        source_type=source_type,
-        original_filename=original_filename,
-    )
-
-
-def _is_forward_task_cancelled(ctx: _ForwardContext) -> bool:
-    try:
-        redis_service = get_redis_service()
-        return bool(redis_service.is_task_cancelled(ctx.task_id))
-    except Exception as exc:
-        logger.warning(
-            f"[{ctx.request_id}] FORWARD TASK: Failed to check cancellation flag for task {ctx.task_id}: "
-            f"{exc}"
-        )
-        return False
-
-
-def _build_forward_cancelled_result(ctx: _ForwardContext) -> Dict[str, Any]:
-    return {
-        'task_id': ctx.task_id,
-        'source': ctx.source,
-        'index_name': ctx.index_name,
-        'original_filename': ctx.original_filename,
-        'chunks_stored': 0,
-        'storage_time': 0,
-        'es_result': {
-            "success": False,
-            "message": "Indexing cancelled because document was deleted.",
-            "total_indexed": 0,
-            "total_submitted": 0,
-        },
-    }
-
-
-def _load_forward_chunks(
-    self: Task,
-    *,
-    processed_data: Dict[str, Any],
-    original_source: str,
-    original_index_name: str,
-    filename: Optional[str],
-) -> Tuple[Optional[List[Dict[str, Any]]], bool, str, str, Optional[str]]:
-    chunks = processed_data.get('chunks')
-    split_async = bool(processed_data.get('split_async'))
-
-    # If chunks are not in payload, try loading from Redis via the redis_key
-    if (not chunks) and processed_data.get('redis_key'):
-        redis_key = processed_data.get('redis_key')
-        if not REDIS_BACKEND_URL:
-            raise Exception(json.dumps({
-                "message": "REDIS_BACKEND_URL not configured to retrieve chunks",
-                "index_name": original_index_name,
-                "task_name": "forward",
-                "source": original_source,
-                "original_filename": filename
-            }, ensure_ascii=False))
-        try:
-            import redis
-            client = redis.Redis.from_url(
-                REDIS_BACKEND_URL, decode_responses=True)
-            ready_key = f"{redis_key}:ready"
-            if split_async:
-                ready_flag = client.get(ready_key)
-                if not ready_flag:
-                    retry_num = getattr(self.request, 'retries', 0)
-                    logger.info(
-                        f"[{self.request.id}] FORWARD TASK: Async split not ready for key {redis_key}. Retry {retry_num + 1}/{ASYNC_SPLIT_RETRY_MAX} in {FORWARD_REDIS_RETRY_DELAY_S}s")
-                    raise self.retry(
-                        countdown=FORWARD_REDIS_RETRY_DELAY_S,
-                        max_retries=ASYNC_SPLIT_RETRY_MAX,
-                        exc=Exception(json.dumps({
-                            "message": "Async split not ready; will retry",
-                            "index_name": original_index_name,
-                            "task_name": "forward",
-                            "source": original_source,
-                            "original_filename": filename
-                        }, ensure_ascii=False))
-                    )
-            cached = client.get(redis_key)
-            if cached:
-                try:
-                    logger.debug(
-                        f"[{self.request.id}] FORWARD TASK: Retrieved Redis key '{redis_key}', payload_length={len(cached)}")
-                    chunks = json.loads(cached)
-                except json.JSONDecodeError as jde:
-                    # Log raw prefix to help diagnose incorrect writes
-                    raw_preview = cached[:120] if isinstance(
-                        cached, str) else str(type(cached))
-                    logger.error(
-                        f"[{self.request.id}] FORWARD TASK: JSON decode error for key '{redis_key}': {str(jde)}; raw_prefix={raw_preview!r}")
-                    raise
-            else:
-                if split_async:
-                    retry_num = getattr(self.request, 'retries', 0)
-                    logger.info(
-                        f"[{self.request.id}] FORWARD TASK: Async split ready but chunks missing for key {redis_key}. Retry {retry_num + 1}/{ASYNC_SPLIT_RETRY_MAX} in {FORWARD_REDIS_RETRY_DELAY_S}s")
-                    raise self.retry(
-                        countdown=FORWARD_REDIS_RETRY_DELAY_S,
-                        max_retries=ASYNC_SPLIT_RETRY_MAX,
-                        exc=Exception(json.dumps({
-                            "message": "Async split ready but chunks missing; will retry",
-                            "index_name": original_index_name,
-                            "task_name": "forward",
-                            "source": original_source,
-                            "original_filename": filename
-                        }, ensure_ascii=False))
-                    )
-                # No busy-wait: release the worker slot and retry later
-                retry_num = getattr(self.request, 'retries', 0)
-                logger.info(
-                    f"[{self.request.id}] FORWARD TASK: Chunks not yet available for key {redis_key}. Retry {retry_num + 1}/{FORWARD_REDIS_RETRY_MAX} in {FORWARD_REDIS_RETRY_DELAY_S}s")
-                raise self.retry(
-                    countdown=FORWARD_REDIS_RETRY_DELAY_S,
-                    max_retries=FORWARD_REDIS_RETRY_MAX,
-                    exc=Exception(json.dumps({
-                        "message": "Chunks not ready in Redis; will retry",
-                        "index_name": original_index_name,
-                        "task_name": "forward",
-                        "source": original_source,
-                        "original_filename": filename
-                    }, ensure_ascii=False))
-                )
-        except Retry:
-            raise
-        except Exception as exc:
-            raise Exception(json.dumps({
-                "message": f"Failed to retrieve chunks from Redis: {str(exc)}",
-                "index_name": original_index_name,
-                "task_name": "forward",
-                "source": original_source,
-                "original_filename": filename
-            }, ensure_ascii=False))
-
-    if processed_data.get('source'):
-        original_source = processed_data.get('source')
-    if processed_data.get('index_name'):
-        original_index_name = processed_data.get('index_name')
-    if processed_data.get('original_filename'):
-        filename = processed_data.get('original_filename')
-
-    logger.info(
-        f"[{self.request.id}] FORWARD TASK: Received data for source '{original_source}' with {len(chunks) if chunks else 'None'} chunks")
-
-    if chunks is None:
-        raise Exception(json.dumps({
-            "message": "No chunks received for forwarding",
-            "index_name": original_index_name,
-            "task_name": "forward",
-            "source": original_source,
-            "original_filename": filename
-        }, ensure_ascii=False))
-    if len(chunks) == 0:
-        if split_async and processed_data.get('redis_key'):
-            retry_num = getattr(self.request, 'retries', 0)
-            logger.info(
-                f"[{self.request.id}] FORWARD TASK: Empty chunks while waiting for async split. Retry {retry_num + 1}/{ASYNC_SPLIT_RETRY_MAX} in {FORWARD_REDIS_RETRY_DELAY_S}s")
-            raise self.retry(
-                countdown=FORWARD_REDIS_RETRY_DELAY_S,
-                max_retries=ASYNC_SPLIT_RETRY_MAX,
-                exc=Exception(json.dumps({
-                    "message": "Chunks not ready in Redis (empty); will retry",
-                    "index_name": original_index_name,
-                    "task_name": "forward",
-                    "source": original_source,
-                    "original_filename": filename
-                }, ensure_ascii=False))
-            )
-        logger.warning(
-            f"[{self.request.id}] FORWARD TASK: Empty chunks list received for source {original_source}")
-
-    return chunks, split_async, original_source, original_index_name, filename
-
-
 def _extract_error_code_from_es_response(
     parsed_body: Optional[Dict[str, Any]],
     text: str,
@@ -638,7 +404,7 @@ async def _post():
         try:
             connector = aiohttp.TCPConnector(verify_ssl=False)
             timeout = aiohttp.ClientTimeout(total=600)
-
+            
             request_params: Dict[str, str] = {}
 
             if large_mode:
@@ -657,8 +423,7 @@ async def _post():
                     parsed_body = _parse_json_or_none(text)
 
                     if status >= 400:
-                        error_code = _extract_error_code_from_es_response(
-                            parsed_body, text)
+                        error_code = _extract_error_code_from_es_response(parsed_body, text)
                         if error_code:
                             raise Exception(json.dumps({
                                 "error_code": error_code
@@ -743,8 +508,7 @@ def get_actor(self) -> Any:
         if not self.actors:
             actor = self._create_and_warm_actor()
             if actor is None:
-                raise RuntimeError(
-                    "Global actor pool is empty and actor warm-up failed")
+                raise RuntimeError("Global actor pool is empty and actor warm-up failed")
             self.actors.append(actor)
         idx = self.rr_index % len(self.actors)
         self.rr_index += 1
@@ -788,12 +552,10 @@ def prewarm_ray_actors(target_size: Optional[int] = None) -> int:
     """
     Ensure a global shared pool of warm Ray actors exists for low-latency task execution.
     """
-    desired = RAY_GLOBAL_ACTOR_POOL_SIZE if target_size is None else max(
-        0, int(target_size))
+    desired = RAY_GLOBAL_ACTOR_POOL_SIZE if target_size is None else max(0, int(target_size))
     manager = _get_or_create_global_pool_manager()
     current_after = ray.get(
-        manager.ensure_pool.remote(
-            desired=desired, max_allowed=_estimate_parallel_parts())
+        manager.ensure_pool.remote(desired=desired, max_allowed=_estimate_parallel_parts())
     )
     logger.info(
         f"Global Ray actor pool ready: current={current_after}, desired={desired}"
@@ -816,7 +578,6 @@ def _get_split_actor() -> Any:
     """
     return get_ray_actor()
 
-
 class LoggingTask(Task):
     """Base task class with enhanced logging"""
 
@@ -884,8 +645,7 @@ def process_part(
             "chunks_count": len(chunks),
         }
     except Exception as e:
-        logger.error(
-            f"[process_part] Failed to process part for '{filename}': {str(e)}")
+        logger.error(f"[process_part] Failed to process part for '{filename}': {str(e)}")
         return {
             "part_redis_key": part_redis_key,
             "chunks_count": 0,
@@ -1399,8 +1159,7 @@ def process(
             fetch_start = time.perf_counter()
             file_stream = get_file_stream(source)
             if file_stream is None:
-                raise FileNotFoundError(
-                    f"Unable to fetch file from URL: {source}")
+                raise FileNotFoundError(f"Unable to fetch file from URL: {source}")
             file_data = file_stream.read()
             fetch_elapsed = time.perf_counter() - fetch_start
             logger.info(
@@ -1449,8 +1208,7 @@ def process(
                     if cached:
                         cached_chunks = json.loads(cached)
                         if isinstance(cached_chunks, list):
-                            image_metadata_chunk_count = _count_image_metadata_chunks(
-                                cached_chunks)
+                            image_metadata_chunk_count = _count_image_metadata_chunks(cached_chunks)
             except Exception as image_count_exc:
                 logger.warning(
                     f"[{self.request.id}] PROCESS TASK: Failed counting image metadata chunks for async split: {image_count_exc}")
@@ -1474,17 +1232,17 @@ def process(
         self.update_state(
             state=states.SUCCESS,
             meta={
-                'chunks_count': chunk_count,
-                'processing_time': elapsed_time,
-                'source': source,
-                'index_name': index_name,
-                'original_filename': original_filename,
-                'task_name': 'process',
-                'stage': 'text_extracted',
-                'file_size_mb': file_size_mb,
-                'processing_speed_mb_s': file_size_mb / elapsed_time if file_size_mb > 0 and elapsed_time > 0 else 0
-            }
-        )
+            'chunks_count': chunk_count,
+            'processing_time': elapsed_time,
+            'source': source,
+            'index_name': index_name,
+            'original_filename': original_filename,
+            'task_name': 'process',
+            'stage': 'text_extracted',
+            'file_size_mb': file_size_mb,
+            'processing_speed_mb_s': file_size_mb / elapsed_time if file_size_mb > 0 and elapsed_time > 0 else 0
+        }
+    )
 
         logger.info(
             f"[{self.request.id}] PROCESS TASK: Processing complete, waiting for forward task")
@@ -1650,34 +1408,165 @@ def forward(
     filename = original_filename
 
     try:
-        ctx = _init_forward_context(
-            task_id=task_id,
-            request_id=str(self.request.id),
-            start_time=start_time,
-            source=source,
-            index_name=index_name,
-            source_type=source_type,
-            original_filename=original_filename,
-        )
-
-        # Before doing any heavy work, check whether this task has been explicitly cancelled.
-        if _is_forward_task_cancelled(ctx):
-            logger.info(
-                f"[{self.request.id}] FORWARD TASK: Detected cancellation flag for task {task_id}; "
-                f"skipping chunk forwarding for source '{source}' in index '{index_name}'."
+        # Before doing any heavy work, check whether this task has been
+        # explicitly cancelled (for example, because the user deleted the
+        # document from the knowledge base configuration page).
+        try:
+            redis_service = get_redis_service()
+            if redis_service.is_task_cancelled(task_id):
+                logger.info(
+                    f"[{self.request.id}] FORWARD TASK: Detected cancellation flag for task {task_id}; "
+                    f"skipping chunk forwarding for source '{source}' in index '{index_name}'."
+                )
+                # Treat this as a graceful early exit. We still return a
+                # structured payload so callers can consider the task done.
+                return {
+                    'task_id': task_id,
+                    'source': source,
+                    'index_name': index_name,
+                    'original_filename': original_filename,
+                    'chunks_stored': 0,
+                    'storage_time': 0,
+                    'es_result': {
+                        "success": False,
+                        "message": "Indexing cancelled because document was deleted.",
+                        "total_indexed": 0,
+                        "total_submitted": 0,
+                    },
+                }
+        except Exception as cancel_check_exc:
+            logger.warning(
+                f"[{self.request.id}] FORWARD TASK: Failed to check cancellation flag for task {task_id}: "
+                f"{cancel_check_exc}"
             )
-            return _build_forward_cancelled_result(ctx)
-
-        chunks, split_async, original_source, original_index_name, filename = _load_forward_chunks(
-            self,
-            processed_data=processed_data,
-            original_source=original_source,
-            original_index_name=original_index_name,
-            filename=filename,
-        )
+
+        chunks = processed_data.get('chunks')
+        split_async = bool(processed_data.get('split_async'))
+        # If chunks are not in payload, try loading from Redis via the redis_key
+        if (not chunks) and processed_data.get('redis_key'):
+            redis_key = processed_data.get('redis_key')
+            if not REDIS_BACKEND_URL:
+                raise Exception(json.dumps({
+                    "message": "REDIS_BACKEND_URL not configured to retrieve chunks",
+                    "index_name": original_index_name,
+                    "task_name": "forward",
+                    "source": original_source,
+                    "original_filename": filename
+                }, ensure_ascii=False))
+            try:
+                import redis
+                client = redis.Redis.from_url(
+                    REDIS_BACKEND_URL, decode_responses=True)
+                ready_key = f"{redis_key}:ready"
+                if split_async:
+                    ready_flag = client.get(ready_key)
+                    if not ready_flag:
+                        retry_num = getattr(self.request, 'retries', 0)
+                        logger.info(
+                            f"[{self.request.id}] FORWARD TASK: Async split not ready for key {redis_key}. Retry {retry_num + 1}/{ASYNC_SPLIT_RETRY_MAX} in {FORWARD_REDIS_RETRY_DELAY_S}s")
+                        raise self.retry(
+                            countdown=FORWARD_REDIS_RETRY_DELAY_S,
+                            max_retries=ASYNC_SPLIT_RETRY_MAX,
+                            exc=Exception(json.dumps({
+                                "message": "Async split not ready; will retry",
+                                "index_name": original_index_name,
+                                "task_name": "forward",
+                                "source": original_source,
+                                "original_filename": filename
+                            }, ensure_ascii=False))
+                        )
+                cached = client.get(redis_key)
+                if cached:
+                    try:
+                        logger.debug(
+                            f"[{self.request.id}] FORWARD TASK: Retrieved Redis key '{redis_key}', payload_length={len(cached)}")
+                        chunks = json.loads(cached)
+                    except json.JSONDecodeError as jde:
+                        # Log raw prefix to help diagnose incorrect writes
+                        raw_preview = cached[:120] if isinstance(
+                            cached, str) else str(type(cached))
+                        logger.error(
+                            f"[{self.request.id}] FORWARD TASK: JSON decode error for key '{redis_key}': {str(jde)}; raw_prefix={raw_preview!r}")
+                        raise
+                else:
+                    if split_async:
+                        retry_num = getattr(self.request, 'retries', 0)
+                        logger.info(
+                            f"[{self.request.id}] FORWARD TASK: Async split ready but chunks missing for key {redis_key}. Retry {retry_num + 1}/{ASYNC_SPLIT_RETRY_MAX} in {FORWARD_REDIS_RETRY_DELAY_S}s")
+                        raise self.retry(
+                            countdown=FORWARD_REDIS_RETRY_DELAY_S,
+                            max_retries=ASYNC_SPLIT_RETRY_MAX,
+                            exc=Exception(json.dumps({
+                                "message": "Async split ready but chunks missing; will retry",
+                                "index_name": original_index_name,
+                                "task_name": "forward",
+                                "source": original_source,
+                                "original_filename": filename
+                            }, ensure_ascii=False))
+                        )
+                    # No busy-wait: release the worker slot and retry later
+                    retry_num = getattr(self.request, 'retries', 0)
+                    logger.info(
+                        f"[{self.request.id}] FORWARD TASK: Chunks not yet available for key {redis_key}. Retry {retry_num + 1}/{FORWARD_REDIS_RETRY_MAX} in {FORWARD_REDIS_RETRY_DELAY_S}s")
+                    raise self.retry(
+                        countdown=FORWARD_REDIS_RETRY_DELAY_S,
+                        max_retries=FORWARD_REDIS_RETRY_MAX,
+                        exc=Exception(json.dumps({
+                            "message": "Chunks not ready in Redis; will retry",
+                            "index_name": original_index_name,
+                            "task_name": "forward",
+                            "source": original_source,
+                            "original_filename": filename
+                        }, ensure_ascii=False))
+                    )
+            except Retry:
+                raise
+            except Exception as exc:
+                raise Exception(json.dumps({
+                    "message": f"Failed to retrieve chunks from Redis: {str(exc)}",
+                    "index_name": original_index_name,
+                    "task_name": "forward",
+                    "source": original_source,
+                    "original_filename": filename
+                }, ensure_ascii=False))
+        if processed_data.get('source'):
+            original_source = processed_data.get('source')
+        if processed_data.get('index_name'):
+            original_index_name = processed_data.get('index_name')
+        if processed_data.get('original_filename'):
+            filename = processed_data.get('original_filename')
+        logger.info(
+            f"[{self.request.id}] FORWARD TASK: Received data for source '{original_source}' with {len(chunks) if chunks else 'None'} chunks")
 
         # Calculate total chunks for progress tracking
         total_chunks = len(chunks) if chunks else 0
+
+        if chunks is None:
+            raise Exception(json.dumps({
+                "message": "No chunks received for forwarding",
+                "index_name": original_index_name,
+                "task_name": "forward",
+                "source": original_source,
+                "original_filename": original_filename
+            }, ensure_ascii=False))
+        if len(chunks) == 0:
+            if split_async and processed_data.get('redis_key'):
+                retry_num = getattr(self.request, 'retries', 0)
+                logger.info(
+                    f"[{self.request.id}] FORWARD TASK: Empty chunks while waiting for async split. Retry {retry_num + 1}/{ASYNC_SPLIT_RETRY_MAX} in {FORWARD_REDIS_RETRY_DELAY_S}s")
+                raise self.retry(
+                    countdown=FORWARD_REDIS_RETRY_DELAY_S,
+                    max_retries=ASYNC_SPLIT_RETRY_MAX,
+                    exc=Exception(json.dumps({
+                        "message": "Chunks not ready in Redis (empty); will retry",
+                        "index_name": original_index_name,
+                        "task_name": "forward",
+                        "source": original_source,
+                        "original_filename": filename
+                    }, ensure_ascii=False))
+                )
+            logger.warning(
+                f"[{self.request.id}] FORWARD TASK: Empty chunks list received for source {original_source}")
         formatted_chunks = []
         # Compute once per file to avoid repeated IO/MinIO calls inside loop
         file_size = get_file_size(source_type, original_source) if isinstance(
@@ -1868,7 +1757,6 @@ def forward(
 
         logger.info(
             f"[{self.request.id}] FORWARD TASK: Successfully stored {len(chunks)} chunks to index {original_index_name} in {end_time - start_time:.2f}s")
-
         return {
             'task_id': task_id,
             'source': original_source,
@@ -1951,106 +1839,9 @@ def forward(
         raise
 
 
-@app.task(
-    bind=True,
-    base=LoggingTask,
-    name="data_process.tasks.cleanup_source",
-    queue="forward_q",
-)
-def cleanup_source(self, forward_result: Dict[str, Any]) -> Dict[str, Any]:
-    """
-    Conditionally delete the MinIO source file after successful indexing.
-
-    If the knowledge base is configured with preserve_source_file=false, call:
-    DELETE /indices/{index_name}/documents?path_or_url=...&scope=source_only
-    """
-    index_name = (forward_result or {}).get("index_name")
-    source = (forward_result or {}).get("source")
-
-    cleanup_info: Dict[str, Any] = {
-        "attempted": False,
-        "skipped_reason": None,
-        "success": None,
-        "http_status": None,
-        "response": None,
-        "error": None,
-    }
-
-    if not index_name or not source:
-        cleanup_info["skipped_reason"] = "missing_index_name_or_source"
-        forward_result = dict(forward_result or {})
-        forward_result["source_cleanup"] = cleanup_info
-        return forward_result
-
-    try:
-        record = get_knowledge_record({"index_name": index_name}) or {}
-        preserve_source_file = record.get("preserve_source_file", True)
-    except Exception as exc:
-        logger.warning(
-            "[%s] CLEANUP TASK: Failed to load knowledge config for index '%s': %s",
-            getattr(self.request, "id", "unknown"),
-            index_name,
-            exc,
-        )
-        cleanup_info["skipped_reason"] = "knowledge_record_lookup_failed"
-        forward_result = dict(forward_result or {})
-        forward_result["source_cleanup"] = cleanup_info
-        return forward_result
-
-    if preserve_source_file:
-        cleanup_info["skipped_reason"] = "preserve_source_file_true"
-        forward_result = dict(forward_result or {})
-        forward_result["source_cleanup"] = cleanup_info
-        return forward_result
-
-    cleanup_info["attempted"] = True
-    try:
-        resp = _delete_source_file_via_http_sync(
-            base_url=ELASTICSEARCH_SERVICE,
-            index_name=index_name,
-            path_or_url=source,
-            scope="source_only",
-        )
-        cleanup_info["http_status"] = resp.get("http_status")
-        cleanup_info["response"] = (
-            resp.get("response_json")
-            if resp.get("response_json") is not None
-            else resp.get("response_text")
-        )
-
-        ok = False
-        if isinstance(resp.get("response_json"), dict):
-            ok = bool(resp["response_json"].get("status") == "success")
-        elif resp.get("http_status") and 200 <= int(resp["http_status"]) < 300:
-            ok = True
-
-        cleanup_info["success"] = ok
-        if not ok:
-            logger.warning(
-                "[%s] CLEANUP TASK: Source-only delete did not succeed. index='%s' source='%s' http_status=%s",
-                getattr(self.request, "id", "unknown"),
-                index_name,
-                source,
-                cleanup_info["http_status"],
-            )
-    except Exception as exc:
-        cleanup_info["success"] = False
-        cleanup_info["error"] = str(exc)
-        logger.warning(
-            "[%s] CLEANUP TASK: Source-only delete failed. index='%s' source='%s' error=%s",
-            getattr(self.request, "id", "unknown"),
-            index_name,
-            source,
-            exc,
-        )
-
-    forward_result = dict(forward_result or {})
-    forward_result["source_cleanup"] = cleanup_info
-    return forward_result
-
-
-def submit_process_forward_chain(
-        *,
+@app.task(bind=True, base=LoggingTask, name='data_process.tasks.process_and_forward')
+def process_and_forward(
+        self,
         source: str,
         source_type: str,
         chunking_strategy: str,
@@ -2058,14 +1849,30 @@ def submit_process_forward_chain(
         original_filename: Optional[str] = None,
         authorization: Optional[str] = None,
         embedding_model_id: Optional[int] = None,
-        tenant_id: Optional[str] = None,
+        tenant_id: Optional[str] = None
 ) -> str:
     """
-    Build and enqueue a Celery chain: process -> forward.
+    Combined task that chains processing and forwarding
+
+    This task delegates to a chain of process -> forward
+
+    Args:
+        source: Source file path, URL, or text content
+        source_type: source of the file("local", "minio")
+        chunking_strategy: Strategy for chunking the document
+        index_name: Name of the index to store documents
+        original_filename: The original name of the file
+        authorization: Authorization header for API calls
+        embedding_model_id: Embedding model ID for chunk size configuration
+        tenant_id: Tenant ID for retrieving model configuration
 
     Returns:
-        Celery chain task ID, or empty string if enqueue failed.
+        Task ID of the chain
     """
+    logger.info(
+        f"Starting processing chain for {source}, original_filename={original_filename}, strategy={chunking_strategy}, index={index_name}, model_id={embedding_model_id}")
+
+    # Create a task chain
     task_chain = chain(
         process.s(
             source=source,
@@ -2082,64 +1889,18 @@ def submit_process_forward_chain(
             source_type=source_type,
             original_filename=original_filename,
             authorization=authorization
-        ).set(queue='forward_q'),
-        cleanup_source.s().set(queue='forward_q'),
+        ).set(queue='forward_q')
     )
 
+    # Execute the chain
     result = task_chain.apply_async()
     if result is None or not hasattr(result, 'id') or result.id is None:
         logger.error(
             "Celery chain apply_async() did not return a valid result or result.id")
         return ""
-    return result.id
-
+    logger.info(f"Created task chain ID: {result.id}")
 
-@app.task(bind=True, base=LoggingTask, name='data_process.tasks.process_and_forward')
-def process_and_forward(
-        self,
-        source: str,
-        source_type: str,
-        chunking_strategy: str,
-        index_name: Optional[str] = None,
-        original_filename: Optional[str] = None,
-        authorization: Optional[str] = None,
-        embedding_model_id: Optional[int] = None,
-        tenant_id: Optional[str] = None
-) -> str:
-    """
-    Combined task that chains processing and forwarding
-
-    This task delegates to a chain of process -> forward
-
-    Args:
-        source: Source file path, URL, or text content
-        source_type: source of the file("local", "minio")
-        chunking_strategy: Strategy for chunking the document
-        index_name: Name of the index to store documents
-        original_filename: The original name of the file
-        authorization: Authorization header for API calls
-        embedding_model_id: Embedding model ID for chunk size configuration
-        tenant_id: Tenant ID for retrieving model configuration
-
-    Returns:
-        Task ID of the chain
-    """
-    logger.info(
-        f"Starting processing chain for {source}, original_filename={original_filename}, strategy={chunking_strategy}, index={index_name}, model_id={embedding_model_id}")
-
-    chain_id = submit_process_forward_chain(
-        source=source,
-        source_type=source_type,
-        chunking_strategy=chunking_strategy,
-        index_name=index_name,
-        original_filename=original_filename,
-        authorization=authorization,
-        embedding_model_id=embedding_model_id,
-        tenant_id=tenant_id,
-    )
-    if chain_id:
-        logger.info(f"Created task chain ID: {chain_id}")
-    return chain_id
+    return result.id
 
 
 @app.task(bind=True, base=LoggingTask, name='data_process.tasks.process_sync')
diff --git a/backend/database/agent_db.py b/backend/database/agent_db.py
index 533659b0f..82696ffab 100644
--- a/backend/database/agent_db.py
+++ b/backend/database/agent_db.py
@@ -1,10 +1,9 @@
 import logging
-from typing import List, Optional
+from typing import List
 from sqlalchemy import or_, update
 
 from database.client import get_db_session, as_dict, filter_property
 from database.db_models import AgentInfo, ToolInstance, AgentRelation
-from database.agent_version_db import query_current_version_no
 from consts.const import ASSET_OWNER_TENANT_ID
 from utils.str_utils import convert_list_to_string
 
@@ -103,40 +102,6 @@ def query_sub_agents_id_list(main_agent_id: int, tenant_id: str, version_no: int
         return [relation.selected_agent_id for relation in relations]
 
 
-def query_sub_agent_relations(main_agent_id: int, tenant_id: str, version_no: int = 0) -> List[dict]:
-    """
-    Query sub-agent relations by main agent id, including pinned version info.
-    Default version_no=0 queries the draft version.
-
-    Args:
-        main_agent_id: Parent agent ID
-        tenant_id: Tenant ID
-        version_no: Version number to filter. Default 0 = draft/editing state
-    """
-    with get_db_session() as session:
-        query = session.query(AgentRelation).filter(
-            AgentRelation.parent_agent_id == main_agent_id,
-            AgentRelation.tenant_id == tenant_id,
-            AgentRelation.version_no == version_no,
-            AgentRelation.delete_flag != 'Y')
-        relations = query.all()
-        return [as_dict(relation) for relation in relations]
-
-
-def resolve_sub_agent_version_no(
-    selected_agent_id: int,
-    selected_agent_version_no: Optional[int],
-    tenant_id: str,
-) -> int:
-    """
-    Resolve the effective version number for a sub-agent relation.
-    Uses pinned version when set; otherwise falls back to child's current published version.
-    """
-    if selected_agent_version_no is not None:
-        return selected_agent_version_no
-    return query_current_version_no(agent_id=selected_agent_id, tenant_id=tenant_id) or 0
-
-
 def clear_agent_new_mark(agent_id: int, tenant_id: str, user_id: str, version_no: int = 0):
     """
     Clear the NEW mark for an agent.
@@ -198,7 +163,6 @@ def create_agent(agent_info, tenant_id: str, user_id: str):
     """
     info_with_metadata = dict(agent_info)
     info_with_metadata.setdefault("max_steps", 15)
-    info_with_metadata.setdefault("verification_config", None)
     info_with_metadata.update({
         "tenant_id": tenant_id,
         "version_no": 0,  # Default to draft version
@@ -237,9 +201,6 @@ def create_agent(agent_info, tenant_id: str, user_id: str):
             "group_ids": new_agent.group_ids,
             "is_new": new_agent.is_new,
             "enable_context_manager": new_agent.enable_context_manager,
-            "verification_config": new_agent.verification_config,
-            "greeting_message": new_agent.greeting_message,
-            "example_questions": new_agent.example_questions,
             "current_version_no": new_agent.current_version_no,
             "version_no": new_agent.version_no,
             "created_by": new_agent.created_by,
diff --git a/backend/database/agent_repository_db.py b/backend/database/agent_repository_db.py
deleted file mode 100644
index a6bb4f48b..000000000
--- a/backend/database/agent_repository_db.py
+++ /dev/null
@@ -1,358 +0,0 @@
-import logging
-import math
-from typing import Any, Dict, List, Optional
-
-from sqlalchemy import func, or_, update
-
-from database.client import as_dict, filter_property, get_db_session
-from database.db_models import AgentRepository
-
-logger = logging.getLogger("agent_repository_db")
-
-# Listing status: NOT_SHARED (未共享), PENDING_REVIEW (待审核),
-# REJECTED (审核驳回), SHARED (已共享)
-STATUS_NOT_SHARED = "NOT_SHARED"
-STATUS_PENDING_REVIEW = "PENDING_REVIEW"
-STATUS_REJECTED = "REJECTED"
-STATUS_SHARED = "SHARED"
-
-VALID_REPOSITORY_STATUSES = frozenset({
-    STATUS_NOT_SHARED,
-    STATUS_PENDING_REVIEW,
-    STATUS_REJECTED,
-    STATUS_SHARED,
-})
-
-_UPSERT_IMMUTABLE_FIELDS = frozenset({
-    "agent_id",
-    "agent_repository_id",
-    "publisher_tenant_id",
-})
-
-_UPSERT_SNAPSHOT_FIELDS = frozenset({
-    "source_version_no",
-    "name",
-    "display_name",
-    "description",
-    "author",
-    "category_id",
-    "tags",
-    "tool_count",
-    "version_label",
-    "agent_info_json",
-})
-
-
-def insert_agent_repository_record(
-    repository_data: Dict[str, Any],
-    publisher_tenant_id: str,
-    publisher_user_id: str,
-) -> int:
-    """Insert a new agent repository listing record."""
-    with get_db_session() as session:
-        payload = {
-            **repository_data,
-            "publisher_tenant_id": publisher_tenant_id,
-            "publisher_user_id": publisher_user_id,
-            "created_by": publisher_user_id,
-            "updated_by": publisher_user_id,
-            "delete_flag": "N",
-        }
-        if payload.get("status") is None:
-            payload["status"] = STATUS_NOT_SHARED
-
-        new_record = AgentRepository(
-            **filter_property(payload, AgentRepository)
-        )
-        session.add(new_record)
-        session.flush()
-        return int(new_record.agent_repository_id)
-
-
-def get_agent_repository_by_id(repository_id: int) -> Optional[dict]:
-    """Fetch a repository listing by primary key."""
-    with get_db_session() as session:
-        record = session.query(AgentRepository).filter(
-            AgentRepository.agent_repository_id == repository_id,
-            AgentRepository.delete_flag != "Y",
-        ).first()
-        return as_dict(record) if record else None
-
-
-def get_agent_repository_by_id_and_publisher(
-    repository_id: int,
-    publisher_tenant_id: str,
-) -> Optional[dict]:
-    """Fetch a repository listing scoped to the publisher tenant."""
-    with get_db_session() as session:
-        record = session.query(AgentRepository).filter(
-            AgentRepository.agent_repository_id == repository_id,
-            AgentRepository.publisher_tenant_id == publisher_tenant_id,
-            AgentRepository.delete_flag != "Y",
-        ).first()
-        return as_dict(record) if record else None
-
-
-def get_agent_repository_by_agent_id(agent_id: int) -> Optional[dict]:
-    """Fetch an active repository listing by root agent_id."""
-    with get_db_session() as session:
-        record = session.query(AgentRepository).filter(
-            AgentRepository.agent_id == agent_id,
-            AgentRepository.delete_flag != "Y",
-        ).first()
-        return as_dict(record) if record else None
-
-
-def upsert_agent_repository_record(
-    repository_data: Dict[str, Any],
-    publisher_tenant_id: str,
-    publisher_user_id: str,
-) -> tuple[int, bool]:
-    """Insert or update a repository listing keyed by agent_id.
-
-    When no record exists, inserts a new listing. When a record exists:
-    - Same source_version_no: updates status (and updated_by) only.
-    - Different source_version_no: updates all snapshot fields, preserving
-      agent_id, agent_repository_id, and publisher_tenant_id.
-
-    Returns:
-        Tuple of (agent_repository_id, is_updated). is_updated is False on insert.
-    """
-    agent_id = repository_data.get("agent_id")
-    if agent_id is None:
-        raise ValueError("agent_id is required for repository upsert")
-
-    existing = get_agent_repository_by_agent_id(int(agent_id))
-    if not existing:
-        repository_id = insert_agent_repository_record(
-            repository_data=repository_data,
-            publisher_tenant_id=publisher_tenant_id,
-            publisher_user_id=publisher_user_id,
-        )
-        return repository_id, False
-
-    existing_version = existing.get("source_version_no")
-    incoming_version = repository_data.get("source_version_no")
-    repository_id = int(existing["agent_repository_id"])
-
-    if existing_version == incoming_version:
-        update_fields: Dict[str, Any] = {
-            "status": repository_data.get("status", STATUS_NOT_SHARED),
-            "updated_by": publisher_user_id,
-        }
-    else:
-        update_fields = {
-            key: repository_data[key]
-            for key in _UPSERT_SNAPSHOT_FIELDS
-            if key in repository_data
-        }
-        update_fields["publisher_user_id"] = publisher_user_id
-        update_fields["updated_by"] = publisher_user_id
-        update_fields["status"] = repository_data.get("status", STATUS_NOT_SHARED)
-
-    with get_db_session() as session:
-        session.execute(
-            update(AgentRepository)
-            .where(
-                AgentRepository.agent_repository_id == repository_id,
-                AgentRepository.publisher_tenant_id == publisher_tenant_id,
-                AgentRepository.delete_flag != "Y",
-            )
-            .values(**update_fields)
-        )
-    return repository_id, True
-
-
-def list_agent_repository_summaries(
-    *,
-    status: Optional[str] = None,
-) -> List[dict]:
-    """List all active repository summaries without heavy JSON blobs."""
-    with get_db_session() as session:
-        query = session.query(
-            AgentRepository.agent_repository_id,
-            AgentRepository.author,
-            AgentRepository.name,
-            AgentRepository.display_name,
-            AgentRepository.description,
-            AgentRepository.status,
-        ).filter(
-            AgentRepository.delete_flag != "Y",
-        )
-        if status:
-            query = query.filter(AgentRepository.status == status)
-        rows = query.order_by(AgentRepository.agent_repository_id.desc()).all()
-        return [
-            {
-                "agent_repository_id": row.agent_repository_id,
-                "author": row.author,
-                "name": row.name,
-                "display_name": row.display_name,
-                "description": row.description,
-                "status": row.status,
-            }
-            for row in rows
-        ]
-
-
-def query_agent_repository_list(
-    *,
-    page: int = 1,
-    page_size: int = 20,
-    search: Optional[str] = None,
-    tag: Optional[str] = None,
-    category_id: Optional[int] = None,
-    status: Optional[str] = STATUS_SHARED,
-    publisher_tenant_id: Optional[str] = None,
-) -> Dict[str, Any]:
-    """Query repository listings with offset pagination."""
-    page = max(page, 1)
-    page_size = max(min(page_size, 100), 1)
-    offset = (page - 1) * page_size
-
-    with get_db_session() as session:
-        query = session.query(AgentRepository).filter(
-            AgentRepository.delete_flag != "Y",
-        )
-
-        if status:
-            query = query.filter(AgentRepository.status == status)
-        if publisher_tenant_id:
-            query = query.filter(
-                AgentRepository.publisher_tenant_id == publisher_tenant_id
-            )
-        if category_id is not None:
-            query = query.filter(AgentRepository.category_id == category_id)
-        if tag:
-            query = query.filter(AgentRepository.tags.any(tag))
-        if search:
-            keyword = f"%{search}%"
-            query = query.filter(
-                or_(
-                    AgentRepository.name.ilike(keyword),
-                    AgentRepository.display_name.ilike(keyword),
-                    AgentRepository.description.ilike(keyword),
-                    AgentRepository.author.ilike(keyword),
-                    func.array_to_string(AgentRepository.tags, ",").ilike(keyword),
-                )
-            )
-
-        total = query.count()
-        rows = (
-            query.order_by(AgentRepository.agent_repository_id.desc())
-            .offset(offset)
-            .limit(page_size)
-            .all()
-        )
-
-        total_pages = math.ceil(total / page_size) if total else 0
-        return {
-            "items": [as_dict(row) for row in rows],
-            "pagination": {
-                "page": page,
-                "page_size": page_size,
-                "total": total,
-                "total_pages": total_pages,
-            },
-        }
-
-
-def update_agent_repository_by_id(
-    *,
-    repository_id: int,
-    publisher_tenant_id: str,
-    user_id: str,
-    updates: Dict[str, Any],
-) -> int:
-    """Update a repository listing owned by the publisher tenant. Returns affected row count."""
-    allowed_fields = {
-        "display_name",
-        "description",
-        "author",
-        "category_id",
-        "tags",
-        "tool_count",
-        "version_label",
-        "source_version_no",
-        "agent_info_json",
-        "status",
-    }
-    update_fields = {
-        key: value
-        for key, value in updates.items()
-        if key in allowed_fields
-    }
-    if not update_fields:
-        return 0
-
-    update_fields["updated_by"] = user_id
-
-    with get_db_session() as session:
-        result = session.execute(
-            update(AgentRepository)
-            .where(
-                AgentRepository.agent_repository_id == repository_id,
-                AgentRepository.publisher_tenant_id == publisher_tenant_id,
-                AgentRepository.delete_flag != "Y",
-            )
-            .values(**update_fields)
-        )
-        return int(result.rowcount or 0)
-
-
-def update_agent_repository_status_by_id(
-    *,
-    repository_id: int,
-    status: str,
-    user_id: str,
-) -> int:
-    """Update repository listing status by primary key. Returns affected row count."""
-    with get_db_session() as session:
-        result = session.execute(
-            update(AgentRepository)
-            .where(
-                AgentRepository.agent_repository_id == repository_id,
-                AgentRepository.delete_flag != "Y",
-            )
-            .values(status=status, updated_by=user_id)
-        )
-        return int(result.rowcount or 0)
-
-
-def soft_delete_agent_repository_by_id(
-    *,
-    repository_id: int,
-    publisher_tenant_id: str,
-    user_id: str,
-) -> int:
-    """Soft-delete a repository listing owned by the publisher tenant."""
-    with get_db_session() as session:
-        result = session.execute(
-            update(AgentRepository)
-            .where(
-                AgentRepository.agent_repository_id == repository_id,
-                AgentRepository.publisher_tenant_id == publisher_tenant_id,
-                AgentRepository.delete_flag != "Y",
-            )
-            .values(delete_flag="Y", updated_by=user_id)
-        )
-        return int(result.rowcount or 0)
-
-
-def list_agent_repository_by_publisher(
-    publisher_tenant_id: str,
-    *,
-    publisher_user_id: Optional[str] = None,
-) -> List[dict]:
-    """List all repository listings published by a tenant."""
-    with get_db_session() as session:
-        query = session.query(AgentRepository).filter(
-            AgentRepository.publisher_tenant_id == publisher_tenant_id,
-            AgentRepository.delete_flag != "Y",
-        )
-        if publisher_user_id:
-            query = query.filter(
-                AgentRepository.publisher_user_id == publisher_user_id
-            )
-        rows = query.order_by(AgentRepository.agent_repository_id.desc()).all()
-        return [as_dict(row) for row in rows]
diff --git a/backend/database/cas_session_db.py b/backend/database/cas_session_db.py
deleted file mode 100644
index 57d1aa8ea..000000000
--- a/backend/database/cas_session_db.py
+++ /dev/null
@@ -1,134 +0,0 @@
-"""
-Database operations for CAS-backed web sessions.
-"""
-
-from datetime import datetime
-from typing import Any, Dict, Optional
-
-from database.client import as_dict, get_db_session
-from database.db_models import UserCasSession
-
-CAS_SESSION_ACTIVE = "active"
-CAS_SESSION_REVOKED = "revoked"
-
-
-def create_cas_session(
-    *,
-    session_id: str,
-    user_id: str,
-    cas_user_id: str,
-    expires_at: datetime,
-    cas_session_index: Optional[str] = None,
-) -> Dict[str, Any]:
-    with get_db_session() as session:
-        record = UserCasSession(
-            session_id=session_id,
-            user_id=user_id,
-            cas_user_id=cas_user_id,
-            cas_session_index=cas_session_index,
-            status=CAS_SESSION_ACTIVE,
-            expires_at=expires_at,
-            created_by=user_id,
-            updated_by=user_id,
-        )
-        session.add(record)
-        session.flush()
-        return as_dict(record)
-
-
-def get_cas_session_by_session_id(session_id: str) -> Optional[Dict[str, Any]]:
-    if not session_id:
-        return None
-    with get_db_session() as session:
-        result = (
-            session.query(UserCasSession)
-            .filter(
-                UserCasSession.session_id == session_id,
-                UserCasSession.delete_flag == "N",
-            )
-            .first()
-        )
-        return as_dict(result) if result else None
-
-
-def is_cas_session_active(session_id: str) -> bool:
-    if not session_id:
-        return False
-    with get_db_session() as session:
-        result = (
-            session.query(UserCasSession)
-            .filter(
-                UserCasSession.session_id == session_id,
-                UserCasSession.status == CAS_SESSION_ACTIVE,
-                UserCasSession.expires_at > datetime.now(),
-                UserCasSession.delete_flag == "N",
-            )
-            .first()
-        )
-        return result is not None
-
-
-def revoke_cas_session_by_session_id(session_id: str, actor: str = "cas") -> int:
-    if not session_id:
-        return 0
-    with get_db_session() as session:
-        result = (
-            session.query(UserCasSession)
-            .filter(
-                UserCasSession.session_id == session_id,
-                UserCasSession.status == CAS_SESSION_ACTIVE,
-                UserCasSession.delete_flag == "N",
-            )
-            .update(
-                {
-                    "status": CAS_SESSION_REVOKED,
-                    "revoked_at": datetime.now(),
-                    "updated_by": actor,
-                }
-            )
-        )
-        return result
-
-
-def revoke_cas_sessions_by_user_id(cas_user_id: str, actor: str = "cas") -> int:
-    if not cas_user_id:
-        return 0
-    with get_db_session() as session:
-        result = (
-            session.query(UserCasSession)
-            .filter(
-                UserCasSession.cas_user_id == cas_user_id,
-                UserCasSession.status == CAS_SESSION_ACTIVE,
-                UserCasSession.delete_flag == "N",
-            )
-            .update(
-                {
-                    "status": CAS_SESSION_REVOKED,
-                    "revoked_at": datetime.now(),
-                    "updated_by": actor,
-                }
-            )
-        )
-        return result
-
-
-def revoke_cas_session_by_index(cas_session_index: str, actor: str = "cas") -> int:
-    if not cas_session_index:
-        return 0
-    with get_db_session() as session:
-        result = (
-            session.query(UserCasSession)
-            .filter(
-                UserCasSession.cas_session_index == cas_session_index,
-                UserCasSession.status == CAS_SESSION_ACTIVE,
-                UserCasSession.delete_flag == "N",
-            )
-            .update(
-                {
-                    "status": CAS_SESSION_REVOKED,
-                    "revoked_at": datetime.now(),
-                    "updated_by": actor,
-                }
-            )
-        )
-        return result
diff --git a/backend/database/conversation_db.py b/backend/database/conversation_db.py
index 2d06bb9be..18c0ee9fc 100644
--- a/backend/database/conversation_db.py
+++ b/backend/database/conversation_db.py
@@ -1016,71 +1016,3 @@ def get_message_id_by_index(conversation_id: int, message_index: int) -> Optiona
         result = session.execute(stmt).scalar()
 
         return result
-
-
-def get_latest_assistant_message_id(conversation_id: int, user_id: Optional[str] = None) -> Optional[int]:
-    """
-    Get the most recent assistant message ID for a conversation.
-
-    Args:
-        conversation_id: Conversation ID (integer)
-        user_id: Optional user ID for ownership check
-
-    Returns:
-        Optional[int]: The latest assistant message ID, or None if not found
-    """
-    with get_db_session() as session:
-        conversation_id = int(conversation_id)
-
-        stmt = select(ConversationMessage.message_id).where(
-            ConversationMessage.conversation_id == conversation_id,
-            ConversationMessage.delete_flag == 'N',
-            ConversationMessage.message_role == 'assistant'
-        ).order_by(desc(ConversationMessage.message_index)).limit(1)
-
-        if user_id:
-            stmt = stmt.join(
-                ConversationRecord,
-                ConversationMessage.conversation_id == ConversationRecord.conversation_id
-            ).where(ConversationRecord.created_by == user_id)
-
-        result = session.execute(stmt).scalar()
-        return result
-
-
-def update_message_minio_files(message_id: int, skill_file_uploads: List[Dict[str, Any]]) -> bool:
-    """
-    Merge skill file uploads into an existing message's minio_files field.
-
-    Args:
-        message_id: Message ID to update
-        skill_file_uploads: List of skill file upload metadata dicts to append
-
-    Returns:
-        bool: True if the message was updated, False if the message was not found
-    """
-    with get_db_session() as session:
-        message_id = int(message_id)
-
-        stmt = select(ConversationMessage).where(
-            ConversationMessage.message_id == message_id,
-            ConversationMessage.delete_flag == 'N'
-        )
-        record = session.scalars(stmt).first()
-        if not record:
-            return False
-
-        existing = record.minio_files
-        if existing:
-            try:
-                if isinstance(existing, str):
-                    existing = json.loads(existing)
-            except (json.JSONDecodeError, TypeError):
-                existing = []
-        else:
-            existing = []
-
-        existing.extend(skill_file_uploads)
-        record.minio_files = json.dumps(existing, ensure_ascii=False)
-
-        return True
diff --git a/backend/database/db_models.py b/backend/database/db_models.py
index 5450b5f74..b779266c9 100644
--- a/backend/database/db_models.py
+++ b/backend/database/db_models.py
@@ -15,8 +15,6 @@
 _TENANT_ID_DOC = "Tenant ID for multi-tenancy isolation"
 
 # Base class for tables without audit fields
-
-
 class SimpleTableBase(DeclarativeBase):
     pass
 
@@ -299,16 +297,13 @@ class AgentInfo(TableBase):
 
     agent_id = Column(Integer, Sequence(
         "ag_tenant_agent_t_agent_id_seq", schema=SCHEMA), nullable=False, primary_key=True, autoincrement=True, doc="ID")
-    version_no = Column(Integer, default=0, nullable=False, primary_key=True,
-                        doc="Version number. 0 = draft/editing state, >=1 = published snapshot")
+    version_no = Column(Integer, default=0, nullable=False, primary_key=True, doc="Version number. 0 = draft/editing state, >=1 = published snapshot")
     name = Column(String(100), doc="Agent name")
     display_name = Column(String(100), doc="Agent display name")
     description = Column(Text, doc="Description")
     author = Column(String(100), doc="Agent author")
-    model_name = Column(
-        String(100), doc="[DEPRECATED] Name of the model used, use model_id instead")
-    model_id = Column(
-        Integer, doc="Model ID, foreign key reference to model_record_t.model_id")
+    model_name = Column(String(100), doc="[DEPRECATED] Name of the model used, use model_id instead")
+    model_id = Column(Integer, doc="Model ID, foreign key reference to model_record_t.model_id")
     max_steps = Column(Integer, doc="Maximum number of steps")
     duty_prompt = Column(Text, doc="Duty prompt content")
     constraint_prompt = Column(Text, doc="Constraint prompt content")
@@ -320,22 +315,15 @@ class AgentInfo(TableBase):
         Boolean, doc="Whether to provide the running summary to the manager agent")
     business_description = Column(
         Text, doc="Manually entered by the user to describe the entire business process")
-    business_logic_model_name = Column(
-        String(100), doc="Model name used for business logic prompt generation")
-    business_logic_model_id = Column(
-        Integer, doc="Model ID used for business logic prompt generation, foreign key reference to model_record_t.model_id")
-    prompt_template_id = Column(
-        Integer, doc="Prompt template ID used for business logic prompt generation")
-    prompt_template_name = Column(String(
-        100), doc="Prompt template name used for business logic prompt generation")
+    business_logic_model_name = Column(String(100), doc="Model name used for business logic prompt generation")
+    business_logic_model_id = Column(Integer, doc="Model ID used for business logic prompt generation, foreign key reference to model_record_t.model_id")
+    prompt_template_id = Column(Integer, doc="Prompt template ID used for business logic prompt generation")
+    prompt_template_name = Column(String(100), doc="Prompt template name used for business logic prompt generation")
     group_ids = Column(String, doc="Agent group IDs list")
     is_new = Column(Boolean, default=False, doc="Whether this agent is marked as new for the user")
     current_version_no = Column(Integer, nullable=True, doc="Current published version number. NULL means no version published yet")
     ingroup_permission = Column(String(30), doc="In-group permission: EDIT, READ_ONLY, PRIVATE")
     enable_context_manager = Column(Boolean, default=False, doc="Whether to enable context management (compression) for this agent")
-    verification_config = Column(JSONB, doc="Layered ReAct self-verification configuration")
-    greeting_message = Column(Text, doc="Agent greeting message displayed on chat initial screen")
-    example_questions = Column(JSONB, doc="List of example questions for starting a conversation with this agent")
 
 
 class PromptTemplate(TableBase):
@@ -364,15 +352,12 @@ class PromptTemplate(TableBase):
 
     template_id = Column(Integer, Sequence(
         "ag_prompt_template_t_template_id_seq", schema=SCHEMA), primary_key=True, nullable=False, autoincrement=True, doc="Prompt template ID")
-    template_name = Column(String(100), nullable=False,
-                           doc="Prompt template name")
+    template_name = Column(String(100), nullable=False, doc="Prompt template name")
     description = Column(String(500), doc="Prompt template description")
-    template_type = Column(String(50), nullable=False,
-                           default="agent_generate", doc="Prompt template type")
+    template_type = Column(String(50), nullable=False, default="agent_generate", doc="Prompt template type")
     tenant_id = Column(String(100), nullable=False, doc="Tenant ID")
     user_id = Column(String(100), nullable=False, doc="User ID")
-    template_content_zh = Column(
-        JSONB, nullable=False, doc="Chinese prompt template content")
+    template_content_zh = Column(JSONB, nullable=False, doc="Chinese prompt template content")
     template_content_en = Column(JSONB, doc="English prompt template content")
 
 
@@ -396,8 +381,7 @@ class ToolInstance(TableBase):
     user_id = Column(String(100), doc="User ID")
     tenant_id = Column(String(100), doc="Tenant ID")
     enabled = Column(Boolean, doc="Enabled")
-    version_no = Column(Integer, default=0, primary_key=True, nullable=False,
-                        doc="Version number. 0 = draft/editing state, >=1 = published snapshot")
+    version_no = Column(Integer, default=0, primary_key=True, nullable=False, doc="Version number. 0 = draft/editing state, >=1 = published snapshot")
 
 
 class KnowledgeRecord(TableBase):
@@ -413,25 +397,18 @@ class KnowledgeRecord(TableBase):
     knowledge_name = Column(String(100), doc="User-facing knowledge base name")
     knowledge_describe = Column(String(3000), doc="Knowledge base description")
     knowledge_sources = Column(String(300), doc="Knowledge base sources")
-    embedding_model_name = Column(String(
-        200), doc="Embedding model name, used to record the embedding model used by the knowledge base")
-    embedding_model_id = Column(
-        Integer, doc="Embedding model ID, foreign key reference to model_record_t.model_id")
+    embedding_model_name = Column(String(200), doc="Embedding model name, used to record the embedding model used by the knowledge base")
+    embedding_model_id = Column(Integer, doc="Embedding model ID, foreign key reference to model_record_t.model_id")
     tenant_id = Column(String(100), doc="Tenant ID")
     group_ids = Column(String, doc="Knowledge base group IDs list")
     ingroup_permission = Column(
         String(30), doc="In-group permission: EDIT, READ_ONLY, PRIVATE")
     summary_frequency = Column(String(10), nullable=True,
-                               doc="Auto-summary frequency: '3h', '5h', '1d', '1w', or NULL (disabled)")
+        doc="Auto-summary frequency: '3h', '5h', '1d', '1w', or NULL (disabled)")
     last_summary_time = Column(TIMESTAMP(timezone=False), nullable=True,
-                               doc="Timestamp of last summary generation")
+        doc="Timestamp of last summary generation")
     last_doc_update_time = Column(TIMESTAMP(timezone=False), nullable=True,
-                                  doc="Timestamp of last document add/delete operation")
-    preserve_source_file = Column(
-        Boolean,
-        default=True,
-        doc="Whether to preserve uploaded source documents after vectorization",
-    )
+        doc="Timestamp of last document add/delete operation")
 
 
 class TenantConfig(TableBase):
@@ -504,8 +481,7 @@ class McpRecord(TableBase):
         doc="Custom HTTP headers as JSON object for MCP server requests",
         default=None,
     )
-    source = Column(
-        String(30), doc="Source type: local/mcp_registry/community")
+    source = Column(String(30), doc="Source type: local/mcp_registry/community")
     registry_json = Column(JSONB, doc="Full MCP registry server.json snapshot")
     config_json = Column(JSON, doc="MCP config data")
     enabled = Column(Boolean, default=True, doc="Enabled")
@@ -533,13 +509,11 @@ class McpCommunityRecord(TableBase):
     source = Column(String(30), doc="Source type, fixed to community")
     version = Column(String(50), doc="MCP version")
     registry_json = Column(JSONB, doc="Full MCP metadata JSON")
-    transport_type = Column(
-        String(30), doc="Transport type: http/sse/container")
+    transport_type = Column(String(30), doc="Transport type: http/sse/container")
     config_json = Column(JSON, doc="Public-shareable MCP configuration JSON")
     tags = Column(ARRAY(Text), doc="Tags")
     description = Column(Text, doc="Description")
 
-
 class UserTenant(TableBase):
     """
     User and tenant relationship table
@@ -551,8 +525,7 @@ class UserTenant(TableBase):
                             primary_key=True, nullable=False, doc="User tenant relationship ID, unique primary key")
     user_id = Column(String(100), nullable=False, doc="User ID")
     tenant_id = Column(String(100), nullable=False, doc="Tenant ID")
-    user_role = Column(
-        String(30), doc="User role: SUPER_ADMIN, ADMIN, DEV, USER")
+    user_role = Column(String(30), doc="User role: SUPER_ADMIN, ADMIN, DEV, USER")
     user_email = Column(String(255), doc="User email address")
 
 
@@ -563,18 +536,11 @@ class AgentRelation(TableBase):
     __tablename__ = "ag_agent_relation_t"
     __table_args__ = {"schema": SCHEMA}
 
-    relation_id = Column(Integer, Sequence("ag_agent_relation_t_relation_id_seq", schema=SCHEMA),
-                         primary_key=True, nullable=False, doc="Relationship ID, primary key")
-    selected_agent_id = Column(
-        Integer, primary_key=True, doc="Selected agent ID")
+    relation_id = Column(Integer, Sequence("ag_agent_relation_t_relation_id_seq", schema=SCHEMA), primary_key=True, nullable=False, doc="Relationship ID, primary key")
+    selected_agent_id = Column(Integer, primary_key=True, doc="Selected agent ID")
     parent_agent_id = Column(Integer, doc="Parent agent ID")
     tenant_id = Column(String(100), doc="Tenant ID")
-    version_no = Column(Integer, default=0, nullable=False,
-                        doc="Version number. 0 = draft/editing state, >=1 = published snapshot")
-    selected_agent_version_no = Column(
-        Integer, nullable=True,
-        doc="Pinned version of selected_agent_id. NULL = runtime fallback to child current_version_no",
-    )
+    version_no = Column(Integer, default=0, nullable=False, doc="Version number. 0 = draft/editing state, >=1 = published snapshot")
 
 
 class PartnerMappingId(TableBase):
@@ -690,51 +656,13 @@ class AgentVersion(TableBase):
                 primary_key=True, nullable=False, doc=_PRIMARY_KEY_DOC)
     tenant_id = Column(String(100), nullable=False, doc="Tenant ID")
     agent_id = Column(Integer, nullable=False, doc="Agent ID")
-    version_no = Column(Integer, nullable=False,
-                        doc="Version number, starts from 1. Does not include 0 (draft)")
-    version_name = Column(
-        String(100), doc="User-defined version name for display")
+    version_no = Column(Integer, nullable=False, doc="Version number, starts from 1. Does not include 0 (draft)")
+    version_name = Column(String(100), doc="User-defined version name for display")
     release_note = Column(Text, doc="Release notes / publish remarks")
-    source_version_no = Column(
-        Integer, doc="Source version number. If this version is a rollback, record the source version")
-    source_type = Column(String(
-        30), doc="Source type: NORMAL (normal publish) / ROLLBACK (rollback and republish)")
-    status = Column(String(30), default="RELEASED",
-                    doc="Version status: RELEASED / DISABLED / ARCHIVED")
-    is_a2a = Column(Boolean, default=False,
-                    doc="Whether this version is published as an A2A Server agent")
-
-
-class AgentRepository(TableBase):
-    """
-    Agent repository (marketplace) table. Frozen snapshot of a published agent tree for sharing.
-    """
-    __tablename__ = "ag_agent_repository_t"
-    __table_args__ = {"schema": SCHEMA}
-
-    agent_repository_id = Column(BigInteger, Sequence("ag_agent_repository_t_agent_repository_id_seq", schema=SCHEMA),
-                                 primary_key=True, nullable=False, doc="Agent repository listing ID, unique primary key")
-    publisher_tenant_id = Column(String(100), nullable=False, doc="Publisher tenant ID")
-    publisher_user_id = Column(String(100), nullable=False, doc="Publisher user ID")
-    agent_id = Column(Integer, nullable=False,
-                      doc="Root agent ID from ag_tenant_agent_t; upsert key")
-    source_version_no = Column(Integer, nullable=False,
-                               doc="Published version number frozen at share time")
-    name = Column(String(100), nullable=False,
-                  doc="Root agent programmatic name for display and search")
-    display_name = Column(String(100), doc="Root agent display name")
-    description = Column(Text, doc="Root agent description")
-    author = Column(String(100), doc="Agent author")
-    category_id = Column(Integer, doc="Optional marketplace category ID")
-    tags = Column(ARRAY(Text), doc="Marketplace tags")
-    tool_count = Column(Integer,
-                        doc="Total tool count across all agents in the bundle (display only)")
-    version_label = Column(String(100),
-                           doc="Repository entry version label for display (e.g. v1.0)")
-    agent_info_json = Column(JSONB, nullable=False,
-                             doc="Frozen ExportAndImportDataFormat snapshot with optional skills")
-    status = Column(String(30), default="NOT_SHARED",
-                    doc="Listing status: NOT_SHARED (未共享) / PENDING_REVIEW (待审核) / REJECTED (审核驳回) / SHARED (已共享)")
+    source_version_no = Column(Integer, doc="Source version number. If this version is a rollback, record the source version")
+    source_type = Column(String(30), doc="Source type: NORMAL (normal publish) / ROLLBACK (rollback and republish)")
+    status = Column(String(30), default="RELEASED", doc="Version status: RELEASED / DISABLED / ARCHIVED")
+    is_a2a = Column(Boolean, default=False, doc="Whether this version is published as an A2A Server agent")
 
 
 class UserTokenInfo(TableBase):
@@ -747,8 +675,7 @@ class UserTokenInfo(TableBase):
     token_id = Column(Integer, Sequence("user_token_info_t_token_id_seq", schema=SCHEMA),
                       primary_key=True, nullable=False, doc="Token ID, unique primary key")
     access_key = Column(String(100), nullable=False, doc="Access Key (AK)")
-    user_id = Column(String(100), nullable=False,
-                     doc="User ID who owns this token")
+    user_id = Column(String(100), nullable=False, doc="User ID who owns this token")
 
 
 class UserTokenUsageLog(TableBase):
@@ -760,21 +687,16 @@ class UserTokenUsageLog(TableBase):
 
     token_usage_id = Column(Integer, Sequence("user_token_usage_log_t_token_usage_id_seq", schema=SCHEMA),
                             primary_key=True, nullable=False, doc="Token usage log ID, unique primary key")
-    token_id = Column(Integer, nullable=False,
-                      doc="Foreign key to user_token_info_t.token_id")
-    call_function_name = Column(
-        String(100), doc="API function name being called")
-    related_id = Column(
-        Integer, doc="Related resource ID (e.g., conversation_id)")
-    meta_data = Column(
-        JSONB, doc="Additional metadata for this usage log entry, stored as JSON")
+    token_id = Column(Integer, nullable=False, doc="Foreign key to user_token_info_t.token_id")
+    call_function_name = Column(String(100), doc="API function name being called")
+    related_id = Column(Integer, doc="Related resource ID (e.g., conversation_id)")
+    meta_data = Column(JSONB, doc="Additional metadata for this usage log entry, stored as JSON")
 
 
 class UserOAuthAccount(TableBase):
     __tablename__ = "user_oauth_account_t"
     __table_args__ = (
-        UniqueConstraint("provider", "provider_user_id",
-                         name="uq_oauth_provider_user"),
+        UniqueConstraint("provider", "provider_user_id", name="uq_oauth_provider_user"),
         {"schema": SCHEMA},
     )
 
@@ -792,38 +714,11 @@ class UserOAuthAccount(TableBase):
     provider_user_id = Column(
         String(200), nullable=False, doc="User ID from the OAuth provider"
     )
-    provider_email = Column(
-        String(255), doc="Email address from the OAuth provider")
-    provider_username = Column(
-        String(200), doc="Display name from the OAuth provider")
+    provider_email = Column(String(255), doc="Email address from the OAuth provider")
+    provider_username = Column(String(200), doc="Display name from the OAuth provider")
     tenant_id = Column(String(100), doc="Tenant ID at time of linking")
 
 
-class UserCasSession(TableBase):
-    __tablename__ = "user_cas_session_t"
-    __table_args__ = (
-        Index("ix_user_cas_session_session_id", "session_id"),
-        Index("ix_user_cas_session_user_id", "user_id"),
-        Index("ix_user_cas_session_cas_user_id", "cas_user_id"),
-        {"schema": SCHEMA},
-    )
-
-    cas_session_id = Column(
-        Integer,
-        Sequence("user_cas_session_t_cas_session_id_seq", schema=SCHEMA),
-        primary_key=True,
-        nullable=False,
-        doc="CAS session record ID",
-    )
-    session_id = Column(String(100), nullable=False, unique=True, doc="JWT session ID")
-    user_id = Column(String(100), nullable=False, doc="Supabase user UUID")
-    cas_user_id = Column(String(200), nullable=False, doc="User ID from CAS")
-    cas_session_index = Column(String(500), doc="CAS SessionIndex or service ticket")
-    status = Column(String(30), nullable=False, default="active", doc="active/revoked")
-    expires_at = Column(TIMESTAMP(timezone=False), nullable=False, doc="Session expiration time")
-    revoked_at = Column(TIMESTAMP(timezone=False), doc="Revocation time")
-
-
 class SkillInfo(TableBase):
     """
     Skill information table - stores skill metadata and content.
@@ -833,17 +728,13 @@ class SkillInfo(TableBase):
 
     skill_id = Column(Integer, Sequence("ag_skill_info_t_skill_id_seq", schema=SCHEMA),
                       primary_key=True, nullable=False, autoincrement=True, doc="Skill ID")
-    skill_name = Column(String(100), nullable=False,
-                        unique=True, doc="Unique skill name")
-    tenant_id = Column(String(100), nullable=True,
-                       doc="Tenant ID for multi-tenancy. NULL for pre-existing skills.")
+    skill_name = Column(String(100), nullable=False, unique=True, doc="Unique skill name")
+    tenant_id = Column(String(100), nullable=True, doc="Tenant ID for multi-tenancy. NULL for pre-existing skills.")
     skill_description = Column(String(1000), doc="Skill description")
     skill_tags = Column(JSON, doc="Skill tags as JSON array")
     skill_content = Column(Text, doc="Skill content in markdown format")
-    config_schemas = Column(
-        JSON, doc="Parameter metadata from config/schema.yaml")
-    config_values = Column(
-        JSON, doc="Runtime parameter values from config/config.yaml")
+    config_schemas = Column(JSON, doc="Parameter metadata from config/schema.yaml")
+    config_values = Column(JSON, doc="Runtime parameter values from config/config.yaml")
     source = Column(String(30), nullable=False, default="official",
                     doc="Skill source: official, custom, etc.")
 
@@ -857,10 +748,8 @@ class SkillToolRelation(TableBase):
 
     rel_id = Column(Integer, Sequence("ag_skill_tools_rel_t_rel_id_seq", schema=SCHEMA),
                     primary_key=True, nullable=False, autoincrement=True, doc="Relation ID")
-    skill_id = Column(Integer, nullable=False,
-                      doc="Foreign key to ag_skill_info_t.skill_id")
-    tool_id = Column(Integer, nullable=False,
-                     doc="Foreign key to ag_tool_info_t.tool_id")
+    skill_id = Column(Integer, nullable=False, doc="Foreign key to ag_skill_info_t.skill_id")
+    tool_id = Column(Integer, nullable=False, doc="Foreign key to ag_tool_info_t.tool_id")
 
 
 class SkillInstance(TableBase):
@@ -879,19 +768,14 @@ class SkillInstance(TableBase):
         nullable=False,
         doc="Skill instance ID"
     )
-    skill_id = Column(Integer, nullable=False,
-                      doc="Foreign key to ag_skill_info_t.skill_id")
+    skill_id = Column(Integer, nullable=False, doc="Foreign key to ag_skill_info_t.skill_id")
     agent_id = Column(Integer, nullable=False, doc="Agent ID")
     user_id = Column(String(100), doc="User ID")
     tenant_id = Column(String(100), doc="Tenant ID")
-    enabled = Column(Boolean, default=True,
-                     doc="Whether this skill is enabled for the agent")
-    version_no = Column(Integer, default=0, primary_key=True, nullable=False,
-                        doc="Version number. 0 = draft/editing state, >=1 = published snapshot")
-    config_values = Column(
-        JSON, doc="Per-agent runtime parameter values (mirrors ag_tool_instance_t.params)")
-    config_schemas = Column(
-        JSON, doc="Per-agent parameter schema overrides from config/schema.yaml")
+    enabled = Column(Boolean, default=True, doc="Whether this skill is enabled for the agent")
+    version_no = Column(Integer, default=0, primary_key=True, nullable=False, doc="Version number. 0 = draft/editing state, >=1 = published snapshot")
+    config_values = Column(JSON, doc="Per-agent runtime parameter values (mirrors ag_tool_instance_t.params)")
+    config_schemas = Column(JSON, doc="Per-agent parameter schema overrides from config/schema.yaml")
 
 
 class OuterApiService(TableBase):
@@ -904,16 +788,13 @@ class OuterApiService(TableBase):
 
     id = Column(BigInteger, Sequence("ag_outer_api_services_id_seq", schema=SCHEMA),
                 primary_key=True, nullable=False, doc="Service ID, unique primary key")
-    mcp_service_name = Column(String(100), nullable=False,
-                              doc="MCP service name (unique identifier per tenant)")
+    mcp_service_name = Column(String(100), nullable=False, doc="MCP service name (unique identifier per tenant)")
     description = Column(Text, doc="Service description from OpenAPI info")
     openapi_json = Column(JSONB, doc="Complete OpenAPI JSON specification")
     server_url = Column(String(500), doc="Base URL of the REST API server")
     headers_template = Column(JSONB, doc="Default headers template as JSON")
-    tenant_id = Column(String(100), nullable=False,
-                       doc="Tenant ID for multi-tenancy")
-    is_available = Column(Boolean, default=True,
-                          doc="Whether the service is available")
+    tenant_id = Column(String(100), nullable=False, doc="Tenant ID for multi-tenancy")
+    is_available = Column(Boolean, default=True, doc="Whether the service is available")
 
 
 # Alias for backward compatibility
@@ -928,37 +809,27 @@ class A2ANacosConfig(TableBase):
     __tablename__ = "ag_a2a_nacos_config_t"
     __table_args__ = {"schema": SCHEMA}
 
-    id = Column(BigInteger, primary_key=True,
-                autoincrement=True, doc=_PRIMARY_KEY_DOC)
-    config_id = Column(String(64), unique=True, nullable=False,
-                       doc="Unique config identifier for API reference")
+    id = Column(BigInteger, primary_key=True, autoincrement=True, doc=_PRIMARY_KEY_DOC)
+    config_id = Column(String(64), unique=True, nullable=False, doc="Unique config identifier for API reference")
 
     # Nacos connection
-    nacos_addr = Column(String(512), nullable=False,
-                        doc="Nacos server address, e.g., http://nacos-server:8848")
-    nacos_username = Column(
-        String(100), doc="Nacos username for authentication")
-    nacos_password = Column(
-        String(256), doc="Nacos password, encrypted at rest")
+    nacos_addr = Column(String(512), nullable=False, doc="Nacos server address, e.g., http://nacos-server:8848")
+    nacos_username = Column(String(100), doc="Nacos username for authentication")
+    nacos_password = Column(String(256), doc="Nacos password, encrypted at rest")
 
     # Discovery scope
-    namespace_id = Column(String(100), default="public",
-                          doc="Nacos namespace for service discovery")
+    namespace_id = Column(String(100), default="public", doc="Nacos namespace for service discovery")
 
     # Metadata
-    name = Column(String(100), nullable=False,
-                  doc="Display name for this Nacos config")
+    name = Column(String(100), nullable=False, doc="Display name for this Nacos config")
     description = Column(Text, doc="Description of this Nacos configuration")
 
     # Tenant isolation
-    tenant_id = Column(String(100), nullable=False,
-                       doc="Tenant ID for multi-tenancy")
+    tenant_id = Column(String(100), nullable=False, doc="Tenant ID for multi-tenancy")
 
     # Status
-    is_active = Column(Boolean, default=True,
-                       doc="Whether this Nacos config is active")
-    last_scan_at = Column(TIMESTAMP(timezone=False),
-                          doc="Last time a scan was performed using this config")
+    is_active = Column(Boolean, default=True, doc="Whether this Nacos config is active")
+    last_scan_at = Column(TIMESTAMP(timezone=False), doc="Last time a scan was performed using this config")
 
 
 class A2AExternalAgent(TableBase):
@@ -969,49 +840,39 @@ class A2AExternalAgent(TableBase):
     __tablename__ = "ag_a2a_external_agent_t"
     __table_args__ = {"schema": SCHEMA}
 
-    id = Column(BigInteger, primary_key=True,
-                autoincrement=True, doc=_PRIMARY_KEY_DOC)
+    id = Column(BigInteger, primary_key=True, autoincrement=True, doc=_PRIMARY_KEY_DOC)
 
     # Agent metadata (cached from Agent Card)
-    name = Column(String(255), nullable=False,
-                  doc="Agent name from Agent Card")
+    name = Column(String(255), nullable=False, doc="Agent name from Agent Card")
     description = Column(Text, doc="Agent description from Agent Card")
-    version = Column(
-        String(50), doc="Agent version from Agent Card, e.g., 1.2.0")
+    version = Column(String(50), doc="Agent version from Agent Card, e.g., 1.2.0")
 
     # Primary interface (extracted from supportedInterfaces for quick access)
     # In A2A 1.0, this should store the http-json-rpc URL
-    agent_url = Column(String(512), nullable=False,
-                       doc="Primary A2A endpoint URL (http-json-rpc by default)")
+    agent_url = Column(String(512), nullable=False, doc="Primary A2A endpoint URL (http-json-rpc by default)")
 
     # Protocol type for calling this agent: JSONRPC, HTTP+JSON, GRPC
-    protocol_type = Column(String(20), default=PROTOCOL_JSONRPC,
-                           doc="Protocol type for calling this agent")
+    protocol_type = Column(String(20), default=PROTOCOL_JSONRPC, doc="Protocol type for calling this agent")
 
     # Capabilities
-    streaming = Column(Boolean, default=False,
-                       doc="Whether this agent supports SSE streaming")
+    streaming = Column(Boolean, default=False, doc="Whether this agent supports SSE streaming")
 
     # All supported interfaces (full JSON array from Agent Card)
     # Format: [{protocolBinding, url, protocolVersion}, ...]
     supported_interfaces = Column(JSON, doc="All supported interfaces array")
 
     # Source information
-    source_type = Column(String(20), nullable=False,
-                         doc="Discovery source: url or nacos")
+    source_type = Column(String(20), nullable=False, doc="Discovery source: url or nacos")
 
     # For URL mode
     source_url = Column(String(512), doc="Direct URL to agent card")
 
     # For Nacos mode
-    nacos_config_id = Column(
-        String(64), doc="Reference to Nacos config used for discovery")
-    nacos_agent_name = Column(
-        String(255), doc="Original name used for Nacos query")
+    nacos_config_id = Column(String(64), doc="Reference to Nacos config used for discovery")
+    nacos_agent_name = Column(String(255), doc="Original name used for Nacos query")
 
     # Base URL for infrastructure health checks
-    base_url = Column(String(
-        512), doc="Base URL for health checks (service root address), e.g., http://agent:8080")
+    base_url = Column(String(512), doc="Base URL for health checks (service root address), e.g., http://agent:8080")
 
     # Tenant isolation
     tenant_id = Column(String(100), nullable=False, doc=_TENANT_ID_DOC)
@@ -1020,18 +881,13 @@ class A2AExternalAgent(TableBase):
     raw_card = Column(JSON, doc="Full original Agent Card JSON from discovery")
 
     # Cache management
-    cached_at = Column(TIMESTAMP(timezone=False),
-                       doc="Timestamp when Agent Card was cached")
-    cache_expires_at = Column(
-        TIMESTAMP(timezone=False), doc="Timestamp when cache expires")
+    cached_at = Column(TIMESTAMP(timezone=False), doc="Timestamp when Agent Card was cached")
+    cache_expires_at = Column(TIMESTAMP(timezone=False), doc="Timestamp when cache expires")
 
     # Health check status
-    is_available = Column(Boolean, default=True,
-                          doc="Whether this agent is currently reachable")
-    last_check_at = Column(TIMESTAMP(timezone=False),
-                           doc="Last health check timestamp")
-    last_check_result = Column(
-        String(50), doc="Last health check result: OK, ERROR, TIMEOUT")
+    is_available = Column(Boolean, default=True, doc="Whether this agent is currently reachable")
+    last_check_at = Column(TIMESTAMP(timezone=False), doc="Last health check timestamp")
+    last_check_result = Column(String(50), doc="Last health check result: OK, ERROR, TIMEOUT")
 
 
 class A2AExternalAgentRelation(TableBase):
@@ -1049,23 +905,19 @@ class A2AExternalAgentRelation(TableBase):
         {"schema": SCHEMA},
     )
 
-    id = Column(BigInteger, primary_key=True,
-                autoincrement=True, doc=_PRIMARY_KEY_DOC)
+    id = Column(BigInteger, primary_key=True, autoincrement=True, doc=_PRIMARY_KEY_DOC)
 
     # Local agent (parent)
-    local_agent_id = Column(Integer, nullable=False,
-                            doc="Local parent agent ID")
+    local_agent_id = Column(Integer, nullable=False, doc="Local parent agent ID")
 
     # External A2A agent (sub-agent) - FK to ag_a2a_external_agent_t.id
-    external_agent_id = Column(
-        BigInteger, nullable=False, doc="External A2A agent ID (FK to ag_a2a_external_agent_t.id)")
+    external_agent_id = Column(BigInteger, nullable=False, doc="External A2A agent ID (FK to ag_a2a_external_agent_t.id)")
 
     # Tenant isolation
     tenant_id = Column(String(100), nullable=False, doc=_TENANT_ID_DOC)
 
     # Status
-    is_enabled = Column(Boolean, default=True,
-                        doc="Whether this relation is active")
+    is_enabled = Column(Boolean, default=True, doc="Whether this relation is active")
 
 
 class A2AServerAgent(TableBase):
@@ -1076,8 +928,7 @@ class A2AServerAgent(TableBase):
     __tablename__ = "ag_a2a_server_agent_t"
     __table_args__ = {"schema": SCHEMA}
 
-    id = Column(BigInteger, primary_key=True,
-                autoincrement=True, doc=_PRIMARY_KEY_DOC)
+    id = Column(BigInteger, primary_key=True, autoincrement=True, doc=_PRIMARY_KEY_DOC)
 
     # Link to local agent
     agent_id = Column(Integer, nullable=False, doc="Local agent ID")
@@ -1087,44 +938,35 @@ class A2AServerAgent(TableBase):
     tenant_id = Column(String(100), nullable=False, doc=_TENANT_ID_DOC)
 
     # Generated endpoint ID
-    endpoint_id = Column(String(64), unique=True,
-                         nullable=False, doc="Generated endpoint ID")
+    endpoint_id = Column(String(64), unique=True, nullable=False, doc="Generated endpoint ID")
 
     # Basic info (extracted from local agent, can be overridden)
-    name = Column(String(255), nullable=False,
-                  doc="Agent name exposed in Agent Card")
+    name = Column(String(255), nullable=False, doc="Agent name exposed in Agent Card")
     description = Column(Text, doc="Agent description exposed in Agent Card")
     version = Column(String(50), doc="Agent version exposed in Agent Card")
 
     # Primary endpoint URL (http-json-rpc by default)
-    agent_url = Column(
-        String(512), doc="Primary A2A endpoint URL (http-json-rpc by default)")
+    agent_url = Column(String(512), doc="Primary A2A endpoint URL (http-json-rpc by default)")
 
     # Capabilities
-    streaming = Column(Boolean, default=False,
-                       doc="Whether this agent supports SSE streaming")
+    streaming = Column(Boolean, default=False, doc="Whether this agent supports SSE streaming")
 
     # All supported interfaces (A2A 1.0 compliant)
     # Format: [{protocolBinding, url, protocolVersion}, ...]
-    supported_interfaces = Column(
-        JSON, doc="All supported interfaces: [{protocolBinding, url, protocolVersion}, ...]")
+    supported_interfaces = Column(JSON, doc="All supported interfaces: [{protocolBinding, url, protocolVersion}, ...]")
 
     # Agent Card customization (partial overrides only)
-    card_overrides = Column(
-        JSON, doc="User customizations for Agent Card (partial override)")
+    card_overrides = Column(JSON, doc="User customizations for Agent Card (partial override)")
 
     # A2A Server status
-    is_enabled = Column(Boolean, default=False,
-                        doc="Whether A2A Server is enabled for this agent")
+    is_enabled = Column(Boolean, default=False, doc="Whether A2A Server is enabled for this agent")
 
     # Raw Agent Card (generated from settings, for debugging)
     raw_card = Column(JSON, doc="Generated Agent Card JSON (for debugging)")
 
     # Publishing timestamps
-    published_at = Column(TIMESTAMP(timezone=False),
-                          doc="Timestamp when A2A Server was last enabled")
-    unpublished_at = Column(TIMESTAMP(timezone=False),
-                            doc="Timestamp when A2A Server was disabled")
+    published_at = Column(TIMESTAMP(timezone=False), doc="Timestamp when A2A Server was last enabled")
+    unpublished_at = Column(TIMESTAMP(timezone=False), doc="Timestamp when A2A Server was disabled")
 
 
 class A2ATask(SimpleTableBase):
@@ -1137,8 +979,7 @@ class A2ATask(SimpleTableBase):
 
     # Core identifiers (following A2A spec)
     id = Column(String(64), primary_key=True, doc="Task ID (A2A spec: taskId)")
-    context_id = Column(
-        String(64), doc="Context ID for grouping related tasks")
+    context_id = Column(String(64), doc="Context ID for grouping related tasks")
 
     # Endpoint and caller info
     endpoint_id = Column(String(64), nullable=False, doc="Endpoint ID")
@@ -1149,21 +990,16 @@ class A2ATask(SimpleTableBase):
     raw_request = Column(JSON, doc="Original A2A request payload")
 
     # Task state (following A2A TaskState enum)
-    task_state = Column(String(50), nullable=False, server_default="TASK_STATE_SUBMITTED",
-                        doc="Task state: TASK_STATE_SUBMITTED, TASK_STATE_WORKING, TASK_STATE_COMPLETED, TASK_STATE_FAILED, TASK_STATE_CANCELED, TASK_STATE_INPUT_REQUIRED, TASK_STATE_REJECTED, TASK_STATE_AUTH_REQUIRED")
-    state_timestamp = Column(TIMESTAMP(timezone=False),
-                             doc="Task state last update timestamp")
+    task_state = Column(String(50), nullable=False, server_default="TASK_STATE_SUBMITTED", doc="Task state: TASK_STATE_SUBMITTED, TASK_STATE_WORKING, TASK_STATE_COMPLETED, TASK_STATE_FAILED, TASK_STATE_CANCELED, TASK_STATE_INPUT_REQUIRED, TASK_STATE_REJECTED, TASK_STATE_AUTH_REQUIRED")
+    state_timestamp = Column(TIMESTAMP(timezone=False), doc="Task state last update timestamp")
 
     # Task result
     result_data = Column(JSON, doc="Task final result data")
 
     # Timestamps
-    create_time = Column(TIMESTAMP(timezone=False),
-                         server_default=func.now(), doc="Task creation timestamp")
-    update_time = Column(TIMESTAMP(timezone=False), server_default=func.now(
-    ), onupdate=func.now(), doc="Task last update timestamp")
-    completed_at = Column(TIMESTAMP(timezone=False),
-                          doc="Task completion timestamp")
+    create_time = Column(TIMESTAMP(timezone=False), server_default=func.now(), doc="Task creation timestamp")
+    update_time = Column(TIMESTAMP(timezone=False), server_default=func.now(), onupdate=func.now(), doc="Task last update timestamp")
+    completed_at = Column(TIMESTAMP(timezone=False), doc="Task completion timestamp")
 
 
 class A2AMessage(SimpleTableBase):
@@ -1175,30 +1011,23 @@ class A2AMessage(SimpleTableBase):
     __table_args__ = {"schema": SCHEMA}
 
     # Core identifiers (following A2A spec)
-    message_id = Column(String(64), primary_key=True,
-                        doc="Message ID (A2A spec: messageId)")
-    task_id = Column(String(64), nullable=True,
-                     doc="Task ID this message belongs to (nullable for standalone/simple requests)")
+    message_id = Column(String(64), primary_key=True, doc="Message ID (A2A spec: messageId)")
+    task_id = Column(String(64), nullable=True, doc="Task ID this message belongs to (nullable for standalone/simple requests)")
 
     # Message attributes
-    message_index = Column(Integer, nullable=False,
-                           doc="Order of message in the conversation")
-    role = Column(String(20), nullable=False,
-                  doc="Message sender role: user or agent")
+    message_index = Column(Integer, nullable=False, doc="Order of message in the conversation")
+    role = Column(String(20), nullable=False, doc="Message sender role: user or agent")
 
     # Message content (following A2A Part structure)
-    parts = Column(JSON, nullable=False,
-                   doc="Message parts following A2A Part structure")
+    parts = Column(JSON, nullable=False, doc="Message parts following A2A Part structure")
     meta_data = Column(JSON, doc="Optional metadata")
     extensions = Column(JSON, doc="Extension URI list")
 
     # References to other tasks (optional)
-    reference_task_ids = Column(
-        JSON, doc="Referenced task IDs array for multi-turn scenarios")
+    reference_task_ids = Column(JSON, doc="Referenced task IDs array for multi-turn scenarios")
 
     # Timestamp
-    create_time = Column(TIMESTAMP(
-        timezone=False), server_default=func.now(), doc="Message creation timestamp")
+    create_time = Column(TIMESTAMP(timezone=False), server_default=func.now(), doc="Message creation timestamp")
 
 
 class A2AArtifact(SimpleTableBase):
@@ -1210,19 +1039,15 @@ class A2AArtifact(SimpleTableBase):
 
     # Core identifiers (following A2A spec)
     id = Column(String(64), primary_key=True, doc="Internal primary key")
-    artifact_id = Column(String(64), nullable=False,
-                         doc="Artifact ID (A2A spec: artifactId)")
-    task_id = Column(String(64), nullable=False,
-                     doc="Task ID this artifact belongs to")
+    artifact_id = Column(String(64), nullable=False, doc="Artifact ID (A2A spec: artifactId)")
+    task_id = Column(String(64), nullable=False, doc="Task ID this artifact belongs to")
 
     # Artifact attributes
     name = Column(String(255), doc="Human-readable artifact name")
     description = Column(Text, doc="Artifact description")
-    parts = Column(JSON, nullable=False,
-                   doc="Artifact parts following A2A Part structure")
+    parts = Column(JSON, nullable=False, doc="Artifact parts following A2A Part structure")
     meta_data = Column(JSON, doc="Artifact metadata")
     extensions = Column(JSON, doc="Extension URI list")
 
     # Timestamp
-    create_time = Column(TIMESTAMP(
-        timezone=False), server_default=func.now(), doc="Artifact creation timestamp")
+    create_time = Column(TIMESTAMP(timezone=False), server_default=func.now(), doc="Artifact creation timestamp")
diff --git a/backend/database/knowledge_db.py b/backend/database/knowledge_db.py
index 8fc60d6bd..9a8b1c8c1 100644
--- a/backend/database/knowledge_db.py
+++ b/backend/database/knowledge_db.py
@@ -34,7 +34,6 @@ def create_knowledge_record(query: Dict[str, Any]) -> Dict[str, Any]:
             - user_id: Optional user ID for created_by and updated_by fields
             - tenant_id: Optional tenant ID for created_by and updated_by fields
             - embedding_model_name: embedding model name for the knowledge base
-            - preserve_source_file: whether to preserve uploaded source documents (optional)
 
     Returns:
         Dict[str, Any]: Dictionary with at least 'knowledge_id' and 'index_name'
@@ -58,7 +57,6 @@ def create_knowledge_record(query: Dict[str, Any]) -> Dict[str, Any]:
                 "knowledge_name": knowledge_name,
                 "group_ids": convert_list_to_string(group_ids) if isinstance(group_ids, list) else group_ids,
                 "ingroup_permission": query.get("ingroup_permission"),
-                "preserve_source_file": query.get("preserve_source_file", True),
             }
 
             # For backward compatibility: if caller explicitly provides index_name,
@@ -119,16 +117,11 @@ def upsert_knowledge_record(query: Dict[str, Any]) -> Dict[str, Any]:
 
             if existing_record:
                 # Update existing record
-                existing_record.knowledge_name = query.get(
-                    'knowledge_name') or query.get('index_name')
-                existing_record.knowledge_describe = query.get(
-                    'knowledge_describe', '')
-                existing_record.knowledge_sources = query.get(
-                    'knowledge_sources', 'elasticsearch')
-                existing_record.embedding_model_name = query.get(
-                    'embedding_model_name')
-                existing_record.embedding_model_id = query.get(
-                    'embedding_model_id')
+                existing_record.knowledge_name = query.get('knowledge_name') or query.get('index_name')
+                existing_record.knowledge_describe = query.get('knowledge_describe', '')
+                existing_record.knowledge_sources = query.get('knowledge_sources', 'elasticsearch')
+                existing_record.embedding_model_name = query.get('embedding_model_name')
+                existing_record.embedding_model_id = query.get('embedding_model_id')
                 existing_record.updated_by = query.get('user_id')
                 existing_record.update_time = func.current_timestamp()
 
@@ -190,7 +183,7 @@ def update_knowledge_record(query: Dict[str, Any]) -> bool:
             # Update group IDs
             if query.get("group_ids") is not None:
                 record.group_ids = query["group_ids"]
-
+            
             # Update timestamp and user
             if query.get("user_id"):
                 record.updated_by = query["user_id"]
@@ -258,17 +251,15 @@ def get_knowledge_record(query: Optional[Dict[str, Any]] = None) -> Dict[str, An
 
             # Support both index_name and knowledge_name queries
             if 'index_name' in query:
-                db_query = db_query.filter(
-                    KnowledgeRecord.index_name == query['index_name'])
+                db_query = db_query.filter(KnowledgeRecord.index_name == query['index_name'])
             elif 'knowledge_name' in query:
-                db_query = db_query.filter(
-                    KnowledgeRecord.knowledge_name == query['knowledge_name'])
+                db_query = db_query.filter(KnowledgeRecord.knowledge_name == query['knowledge_name'])
 
             # Add tenant_id filter only if it is provided in the query
             if 'tenant_id' in query and query['tenant_id'] is not None:
                 db_query = db_query.filter(
                     KnowledgeRecord.tenant_id == query['tenant_id'])
-
+            
             result = db_query.first()
 
             if result:
diff --git a/backend/database/user_tenant_db.py b/backend/database/user_tenant_db.py
index b147eac49..f1294f8a7 100644
--- a/backend/database/user_tenant_db.py
+++ b/backend/database/user_tenant_db.py
@@ -75,37 +75,6 @@ def insert_user_tenant(user_id: str, tenant_id: str, user_role: str = "USER", us
         session.add(user_tenant)
 
 
-def upsert_user_tenant(user_id: str, tenant_id: str, user_role: str = "USER", user_email: str = None) -> Dict[str, Any]:
-    """
-    Create or update the active user-tenant relationship for an external identity login.
-    """
-    with get_db_session() as session:
-        result = session.query(UserTenant).filter(
-            UserTenant.user_id == user_id,
-            UserTenant.delete_flag == "N"
-        ).first()
-
-        if result:
-            result.tenant_id = tenant_id
-            result.user_role = user_role
-            if user_email is not None:
-                result.user_email = user_email
-            result.updated_by = user_id
-        else:
-            result = UserTenant(
-                user_id=user_id,
-                tenant_id=tenant_id,
-                user_role=user_role,
-                user_email=user_email,
-                created_by=user_id,
-                updated_by=user_id
-            )
-            session.add(result)
-
-        session.flush()
-        return as_dict(result)
-
-
 def get_users_by_tenant_id(tenant_id: str, page: Optional[int] = 1, page_size: Optional[int] = 20,
                            sort_by: str = "created_at", sort_order: str = "desc") -> Dict[str, Any]:
     """
diff --git a/backend/mcp_service.py b/backend/mcp_service.py
index 4629d42ad..0d8ab4c1b 100644
--- a/backend/mcp_service.py
+++ b/backend/mcp_service.py
@@ -70,7 +70,7 @@ async def run(self, arguments: Dict[str, Any]) -> Any:
 
 
 nexent_mcp = FastMCP(name="nexent_mcp")
-nexent_mcp.mount(local_mcp_service, local_mcp_service.name)
+nexent_mcp.mount(local_mcp_service.name, local_mcp_service)
 
 _openapi_mcp_services: Dict[str, FastMCP] = {}
 
@@ -188,8 +188,7 @@ def _sanitize_function_name(name: str) -> str:
 def register_openapi_service(
     service_name: str,
     openapi_json: Dict[str, Any],
-    server_url: str,
-    headers_template: Dict[str, str],
+    server_url: str
 ) -> bool:
     """
     Register an OpenAPI service using FastMCP.from_openapi().
@@ -223,7 +222,7 @@ def register_openapi_service(
             openapi_spec["servers"] = [{"url": server_url}]
 
         # Create HTTP client for the underlying REST API
-        client = httpx.AsyncClient(base_url=server_url, timeout=120.0, headers=headers_template)
+        client = httpx.AsyncClient(base_url=server_url, timeout=30.0)
 
         # Create FastMCP instance from OpenAPI spec
         mcp_server = FastMCP.from_openapi(
@@ -240,7 +239,7 @@ def register_openapi_service(
         _openapi_mcp_services[service_name] = mcp_server
 
         # Mount to the main MCP server
-        nexent_mcp.mount(mcp_server, service_name)
+        nexent_mcp.mount(service_name, mcp_server)
 
         logger.info(f"Registered OpenAPI service: {service_name}")
         return True
@@ -321,14 +320,13 @@ def refresh_openapi_services_by_tenant(tenant_id: str) -> Dict[str, Any]:
         service_name = service.get("mcp_service_name")
         openapi_json = service.get("openapi_json")
         server_url = service.get("server_url")
-        headers_template = service.get("headers_template")
 
         if not openapi_json:
             logger.warning(f"Service '{service_name}' has no OpenAPI JSON, skipping")
             skipped_count += 1
             continue
 
-        if register_openapi_service(service_name, openapi_json, server_url, headers_template):
+        if register_openapi_service(service_name, openapi_json, server_url):
             registered_count += 1
         else:
             skipped_count += 1
@@ -396,7 +394,6 @@ def refresh_single_openapi_service(service_name: str, tenant_id: str) -> Dict[st
     # Re-register with fresh data
     openapi_json = service_data.get("openapi_json")
     server_url = service_data.get("server_url")
-    headers_template = service_data.get("headers_template")
 
     if not openapi_json:
         logger.warning(f"Service '{service_name}' has no OpenAPI JSON")
@@ -406,7 +403,7 @@ def refresh_single_openapi_service(service_name: str, tenant_id: str) -> Dict[st
             "error": "No OpenAPI JSON found"
         }
 
-    success = register_openapi_service(service_name, openapi_json, server_url, headers_template)
+    success = register_openapi_service(service_name, openapi_json, server_url)
     return {
         "status": "refreshed" if success else "error",
         "service_name": service_name,
diff --git a/backend/prompts/managed_system_prompt_template_en.yaml b/backend/prompts/managed_system_prompt_template_en.yaml
index 62e16e946..5c2893c39 100644
--- a/backend/prompts/managed_system_prompt_template_en.yaml
+++ b/backend/prompts/managed_system_prompt_template_en.yaml
@@ -1,6 +1,6 @@
 system_prompt: |-
   ### Basic Information
-  You are {{APP_NAME}}, {{APP_DESCRIPTION}}
+  You are {{APP_NAME}}, {{APP_DESCRIPTION}}, it is {{time|default('current time')}} now
 
   {%- if memory_list and memory_list|length > 0 %}
   ### Contextual Memory
@@ -66,11 +66,6 @@ system_prompt: |-
      - Note that executed code is not visible to users. If users need to see the code, use '<DISPLAY:language_type>code</DISPLAY>' for displaying code.
      - **IMPORTANT**: After code execution, the system will return content with "Observation:" marker (this is the real execution result). Please continue your next thinking based on these real results. **Do NOT fabricate observation results before code execution.**
 
-  3. Self-verification:
-     - After critical events (tool calls, retrieval results, code execution, and final-answer preparation), the system may run explicit verification.
-     - If verification reports errors, insufficient evidence, incomplete parameters, or unreliable results, you must repair the issue, gather more evidence, call tools again, or clearly state what cannot be completed.
-     - The final answer is shown to the user only after verification passes. If the system returns Verification feedback, treat it as a real observation and continue revising.
-
   After thinking, when you believe you can answer the user's question, you can generate a final answer directly to the user without generating code and stop the loop.
 
   When generating the final answer, you need to follow these specifications:
@@ -183,13 +178,3 @@ final_answer:
     Original task: {{task}}
 
     Please provide a clear and concise summary of the work completed so far.
-
-
-verification:
-  pre_messages: |-
-    You are a strict verifier for a ReAct agent. Judge reliability only from the task, candidate answer, tool outputs, and observations. Do not output hidden chain-of-thought.
-    You must output JSON only.
-
-  post_messages: |-
-    Verify whether the candidate answer covers the user's intent, is grounded in observations, handles tool errors, uses trustworthy citations, and is formatted for users.
-    Output fields: passed, score, status, failed_criteria, checks, revision_instruction, user_visible_note.
diff --git a/backend/prompts/managed_system_prompt_template_zh.yaml b/backend/prompts/managed_system_prompt_template_zh.yaml
index da3d53469..291e336fb 100644
--- a/backend/prompts/managed_system_prompt_template_zh.yaml
+++ b/backend/prompts/managed_system_prompt_template_zh.yaml
@@ -2,7 +2,7 @@ system_prompt: |-
 
   ### 基本信息
 
-  你是{{APP_NAME}}，{{APP_DESCRIPTION}}，用户ID为{{user_id}}
+  你是{{APP_NAME}}，{{APP_DESCRIPTION}}，现在是{{time|default('当前时间')}}，用户ID为{{user_id}}
 
   {%- if memory_list and memory_list|length > 0 %}
   ### 上下文记忆
@@ -130,11 +130,6 @@ system_prompt: |-
      - 注意运行的代码不会被用户看到，所以如果用户需要看到代码，你需要使用'<DISPLAY:语言类型>代码</DISPLAY>'表达展示代码。
      - **重要**：代码执行后，系统会返回 "Observation:" 标记的内容（这是真实的执行结果）。请基于这些真实结果继续下一步思考，**不要在代码执行前自行编造观察结果**。
 
-  3. 自验证：
-     - 关键事件（工具调用、检索结果、代码执行、准备最终回答）后，系统会进行显式自验证。
-     - 如果自验证提示存在错误、证据不足、参数不完整或结果不可靠，必须优先修正、补充证据、重新调用工具，或清晰说明无法完成的部分。
-     - 最终回答只有在自验证通过后才会展示给用户；如果系统返回 Verification feedback，请把它视为真实观察结果继续修正，不要忽略。
-
   在思考结束后，当你认为可以回答用户问题，那么可以不生成代码，直接生成最终回答给到用户并停止循环。
 
   生成最终回答时，你需要遵循以下规范：
@@ -276,13 +271,3 @@ final_answer:
     原始任务：{{task}}
 
     请对迄今为止完成的工作进行清晰、简洁的总结。
-
-
-verification:
-  pre_messages: |-
-    你是 ReAct 智能体的严格验证器。请仅根据任务、候选答案、工具输出和观察结果判断答案是否可靠，不要输出隐藏思维链。
-    你必须只输出 JSON。
-
-  post_messages: |-
-    请验证候选答案是否覆盖用户意图、是否有观察结果支撑、是否处理了工具错误、引用是否可信、格式是否适合展示。
-    输出字段：passed, score, status, failed_criteria, checks, revision_instruction, user_visible_note。
diff --git a/backend/prompts/manager_system_prompt_template_en.yaml b/backend/prompts/manager_system_prompt_template_en.yaml
index d44ed9a71..8ce58db29 100644
--- a/backend/prompts/manager_system_prompt_template_en.yaml
+++ b/backend/prompts/manager_system_prompt_template_en.yaml
@@ -1,6 +1,6 @@
 system_prompt: |-
   ### Basic Information
-  You are {{APP_NAME}}, {{APP_DESCRIPTION}}
+  You are {{APP_NAME}}, {{APP_DESCRIPTION}}, it is {{time|default('current time')}} now
 
   {%- if memory_list and memory_list|length > 0 %}
   ### Contextual Memory
@@ -67,11 +67,6 @@ system_prompt: |-
      - Note that executed code is not visible to users. If users need to see the code, use '<DISPLAY:language_type>code</DISPLAY>' for displaying code.
      - **IMPORTANT**: After code execution, the system will return content with "Observation:" marker (this is the real execution result). Please continue your next thinking based on these real results. **Do NOT fabricate observation results before code execution.**
 
-  3. Self-verification:
-     - After critical events (tool calls, retrieval results, code execution, agent handoffs, and final-answer preparation), the system may run explicit verification.
-     - If verification reports errors, insufficient evidence, incomplete parameters, or unreliable results, you must repair the issue, gather more evidence, call tools again, or clearly state what cannot be completed.
-     - The final answer is shown to the user only after verification passes. If the system returns Verification feedback, treat it as a real observation and continue revising.
-
   After thinking, when you believe you can answer the user's question, you can generate a final answer directly to the user without generating code and stop the loop.
 
   When generating the final answer, you need to follow these specifications:
@@ -227,13 +222,3 @@ final_answer:
     Original task: {{task}}
 
     Please provide a clear and concise summary of the work completed so far.
-
-
-verification:
-  pre_messages: |-
-    You are a strict verifier for a ReAct agent. Judge reliability only from the task, candidate answer, tool outputs, and observations. Do not output hidden chain-of-thought.
-    You must output JSON only.
-
-  post_messages: |-
-    Verify whether the candidate answer covers the user's intent, is grounded in observations, handles tool errors, uses trustworthy citations, and is formatted for users.
-    Output fields: passed, score, status, failed_criteria, checks, revision_instruction, user_visible_note.
diff --git a/backend/prompts/manager_system_prompt_template_zh.yaml b/backend/prompts/manager_system_prompt_template_zh.yaml
index a49ced82d..fc4eb7c0c 100644
--- a/backend/prompts/manager_system_prompt_template_zh.yaml
+++ b/backend/prompts/manager_system_prompt_template_zh.yaml
@@ -1,6 +1,6 @@
 system_prompt: |-
   ### 基本信息
-  你是{{APP_NAME}}，{{APP_DESCRIPTION}}，用户ID为{{user_id}}
+  你是{{APP_NAME}}，{{APP_DESCRIPTION}}，现在是{{time|default('当前时间')}}，用户ID为{{user_id}}
 
   {%- if memory_list and memory_list|length > 0 %}
   ### 上下文记忆
@@ -130,11 +130,6 @@ system_prompt: |-
      - 注意运行的代码不会被用户看到，所以如果用户需要看到代码，你需要使用'<DISPLAY:语言类型>代码</DISPLAY>'表达展示代码。
      - **重要**：代码执行后，系统会返回 "Observation:" 标记的内容（这是真实的执行结果）。请基于这些真实结果继续下一步思考，**不要在代码执行前自行编造观察结果**。
 
-  3. 自验证：
-     - 关键事件（工具调用、检索结果、代码执行、助手返回、准备最终回答）后，系统会进行显式自验证。
-     - 如果自验证提示存在错误、证据不足、参数不完整或结果不可靠，必须优先修正、补充证据、重新调用工具，或清晰说明无法完成的部分。
-     - 最终回答只有在自验证通过后才会展示给用户；如果系统返回 Verification feedback，请把它视为真实观察结果继续修正，不要忽略。
-
   在思考结束后，当你认为可以回答用户问题，那么可以不生成代码，直接生成最终回答给到用户并停止循环。
 
   生成最终回答时，你需要遵循以下规范：
@@ -304,13 +299,3 @@ final_answer:
     原始任务：{{task}}
 
     请对迄今为止完成的工作进行清晰、简洁的总结。
-
-
-verification:
-  pre_messages: |-
-    你是 ReAct 智能体的严格验证器。请仅根据任务、候选答案、工具输出和观察结果判断答案是否可靠，不要输出隐藏思维链。
-    你必须只输出 JSON。
-
-  post_messages: |-
-    请验证候选答案是否覆盖用户意图、是否有观察结果支撑、是否处理了工具错误、引用是否可信、格式是否适合展示。
-    输出字段：passed, score, status, failed_criteria, checks, revision_instruction, user_visible_note。
diff --git a/backend/prompts/utils/greeting_generate_en.yaml b/backend/prompts/utils/greeting_generate_en.yaml
deleted file mode 100644
index 31ea75632..000000000
--- a/backend/prompts/utils/greeting_generate_en.yaml
+++ /dev/null
@@ -1,54 +0,0 @@
-GREETING_SYSTEM_PROMPT: |-
-  ### You are an expert in generating agent greetings and example questions. You help users create engaging greetings and practical example questions for starting conversations with agents.
-  You are building an Agent application. The input includes: agent name, duty description, business description, and existing examples.
-  Generate a concise greeting and 3-5 example questions that help users quickly start a conversation with the agent.
-  The greeting should reflect the agent's positioning and capabilities.
-
-  ### Requirements:
-  1. The greeting should be concise and friendly, 1-2 sentences, introducing the agent's identity and core capabilities. Don't make it too long or too formal.
-  2. Example questions should be specific and practical, representing questions users might actually ask, showcasing the agent's core features.
-  3. If existing examples contain user query scenarios, prioritize extracting short user questions from them, keeping semantics consistent but simplified to natural conversational form.
-  4. Provide 3-5 example questions, each with a clear use case.
-  5. You MUST output strictly in JSON format, do not output any other content or formatting.
-
-  ### Output format:
-  ```json
-  {
-    "greeting_message": "greeting content",
-    "example_questions": ["example question 1", "example question 2", "example question 3"]
-  }
-  ```
-
-  ### Examples:
-  Example 1 (Travel Planning Assistant, existing examples contain "Help me plan a trip from Shanghai to Beijing" etc.):
-  ```json
-  {
-    "greeting_message": "Hello! I'm your travel planning assistant, I can help you plan trips, recommend attractions, and arrange travel routes.",
-    "example_questions": ["Help me plan a 3-day trip from Shanghai to Beijing", "Recommend some family-friendly attractions", "What's fun to do in Hangzhou tomorrow?"]
-  }
-  ```
-
-  Example 2 (Data Analysis Assistant):
-  ```json
-  {
-    "greeting_message": "Hello! I'm a data analysis assistant, I can help you process and analyze data, provide visual reports and insights.",
-    "example_questions": ["Help me analyze trends in this sales data", "Generate a quarterly performance comparison report", "Which products have the highest profit margins?"]
-  }
-  ```
-
-USER_PROMPT: |-
-  ### Agent Name:
-  {{display_name}}
-
-  ### Agent Duty Description:
-  {{duty_description}}
-
-  ### Business Description:
-  {{business_description}}
-
-  {% if few_shots %}
-  ### Existing Examples (extract user query scenarios from these as example questions):
-  {{few_shots}}
-  {% endif %}
-
-  Please generate the greeting and example questions based on the above information. Output strictly in JSON format.
\ No newline at end of file
diff --git a/backend/prompts/utils/greeting_generate_zh.yaml b/backend/prompts/utils/greeting_generate_zh.yaml
deleted file mode 100644
index 34b8d85d3..000000000
--- a/backend/prompts/utils/greeting_generate_zh.yaml
+++ /dev/null
@@ -1,53 +0,0 @@
-GREETING_SYSTEM_PROMPT: |-
-  ### 你是【智能体开场白和示例问题生成专家】，用于帮助用户创建高效、吸引人的智能体开场白和示例问题。
-  现在正在构建一个Agent应用，用户的输入包含：智能体名称、职责描述、业务描述、已有示例。
-  请根据智能体的定位和职责，生成一个简短的开场白和3~5个示例问题，帮助用户快速开始与智能体的对话。
-
-  ### 要求：
-  1.开场白要简洁友好，1-2句话即可，介绍智能体的身份和核心能力，不要过长或过于正式。
-  2.示例问题要具体、实用，是用户真实可能提出的问题，体现智能体的核心功能。
-  3.如果已有示例中包含用户的提问场景，请优先从中提炼简短的用户问题作为示例问题，保持语义一致但简化为自然对话形式。
-  4.示例问题数量为3~5个，每个问题要有明确的使用场景。
-  5.必须严格按照JSON格式输出，不要输出任何其他内容或格式。
-
-  ### 输出格式：
-  ```json
-  {
-    "greeting_message": "开场白内容",
-    "example_questions": ["示例问题1", "示例问题2", "示例问题3"]
-  }
-  ```
-
-  ### 参考示例：
-  示例1（旅行规划助手，已有示例包含"帮我规划明天从上海出发去北京的行程"等场景）：
-  ```json
-  {
-    "greeting_message": "你好！我是你的旅行规划助手，可以帮你规划行程、推荐景点和安排出行路线。",
-    "example_questions": ["帮我规划一个从上海到北京的三日旅行", "推荐一些适合家庭出游的景点", "明天去杭州有什么好玩的地方？"]
-  }
-  ```
-
-  示例2（数据分析助手）：
-  ```json
-  {
-    "greeting_message": "你好！我是数据分析助手，可以帮你处理和分析各种数据，提供可视化报告和洞察。",
-    "example_questions": ["帮我分析这组销售数据的趋势", "生成一份季度业绩对比报告", "哪些产品的利润率最高？"]
-  }
-  ```
-
-USER_PROMPT: |-
-  ### 智能体名称：
-  {{display_name}}
-
-  ### 智能体职责描述：
-  {{duty_description}}
-
-  ### 业务描述：
-  {{business_description}}
-
-  {% if few_shots %}
-  ### 已有示例（请从中提炼用户提问场景作为示例问题）：
-  {{few_shots}}
-  {% endif %}
-
-  请根据以上信息生成开场白和示例问题。严格按JSON格式输出。
\ No newline at end of file
diff --git a/backend/pyproject.toml b/backend/pyproject.toml
index b8f51dd4c..dff0e8693 100644
--- a/backend/pyproject.toml
+++ b/backend/pyproject.toml
@@ -1,7 +1,7 @@
 [project]
 name = "backend"
 version = "0.1.0"
-requires-python = ">=3.11,<3.12"
+requires-python = "==3.10.*"
 dependencies = [
     "aiofiles>=0.8.0",
     "uvicorn>=0.34.0",
@@ -11,7 +11,7 @@ dependencies = [
     "aiohttp>=3.8.0",
     "authlib>=1.3.0",
     "cryptography>=42.0.0",
-    "psycopg2-binary>=2.9.9",
+    "psycopg2-binary==2.9.10",
     "PyJWT>=2.8.0",
     "sqlalchemy~=2.0.37",
     "greenlet<3.5.0",
@@ -21,14 +21,10 @@ dependencies = [
     "jsonref>=1.1.0",
     "ruamel-yaml==0.19.1",
     "redis>=5.0.0",
-    "fastmcp>=2.14.2,<3.0",
+    "fastmcp==2.12.0",
     "langchain>=0.3.26",
     "scikit-learn>=1.0.0",
     "numpy>=1.24.0",
-    "defusedxml>=0.7.1",
-    "openjiuwen>=0.1.0",
-    "pydantic-settings>=2.0.0",
-    "python-docx>=1.1.0",
 ]
 
 [project.optional-dependencies]
@@ -38,7 +34,7 @@ data-process = [
     "flower>=2.0.1",
     "nest_asyncio>=1.5.6",
     "unstructured[csv,docx,pdf,pptx,xlsx,md]==0.18.14",
-    "huggingface_hub>=0.30.0,<1.0"
+    "huggingface_hub>=0.19.0,<0.21.0"
 ]
 test = [
     "pytest",
diff --git a/backend/services/agent_repository_service.py b/backend/services/agent_repository_service.py
deleted file mode 100644
index 87649bcd1..000000000
--- a/backend/services/agent_repository_service.py
+++ /dev/null
@@ -1,306 +0,0 @@
-import logging
-from typing import Any, Dict, Optional
-
-from consts.const import ASSET_OWNER_TENANT_ID
-from consts.model import AgentRepositorySnapshot
-from database.agent_db import search_agent_info_by_agent_id
-from database.agent_version_db import search_version_by_version_no
-from database.agent_repository_db import (
-    STATUS_PENDING_REVIEW,
-    VALID_REPOSITORY_STATUSES,
-    get_agent_repository_by_agent_id,
-    get_agent_repository_by_id,
-    insert_agent_repository_record,
-    list_agent_repository_summaries,
-    update_agent_repository_by_id,
-    update_agent_repository_status_by_id,
-)
-from services.agent_service import (
-    collect_skill_zip_entries,
-    export_agent_dict_for_repository_impl,
-    import_agent_impl,
-    import_agent_with_skills_impl,
-)
-
-logger = logging.getLogger("agent_repository_service")
-
-_UPDATE_SNAPSHOT_FIELDS = (
-    "display_name",
-    "description",
-    "author",
-    "category_id",
-    "tags",
-    "tool_count",
-    "version_label",
-    "source_version_no",
-    "agent_info_json",
-    "status",
-)
-
-
-def _to_summary_item(record: Dict[str, Any]) -> Dict[str, Any]:
-    """Map a DB record to a lightweight marketplace summary item."""
-    return {
-        "agent_repository_id": record.get("agent_repository_id"),
-        "author": record.get("author"),
-        "name": record.get("name"),
-        "display_name": record.get("display_name"),
-        "description": record.get("description"),
-        "status": record.get("status"),
-    }
-
-
-def list_agent_repository_listings_impl(
-    *,
-    status: Optional[str] = None,
-) -> Dict[str, Any]:
-    """List all repository listings with optional status filter."""
-    if status is not None and status not in VALID_REPOSITORY_STATUSES:
-        raise ValueError(
-            f"Invalid status '{status}'; must be one of: "
-            f"{', '.join(sorted(VALID_REPOSITORY_STATUSES))}"
-        )
-    records = list_agent_repository_summaries(status=status)
-    return {"items": [_to_summary_item(record) for record in records]}
-
-
-def update_agent_repository_status_impl(
-    *,
-    agent_repository_id: int,
-    status: str,
-    user_id: str,
-) -> Dict[str, Any]:
-    """Update a repository listing status by primary key."""
-    if status not in VALID_REPOSITORY_STATUSES:
-        raise ValueError(
-            f"Invalid status '{status}'; must be one of: "
-            f"{', '.join(sorted(VALID_REPOSITORY_STATUSES))}"
-        )
-
-    record = get_agent_repository_by_id(agent_repository_id)
-    if not record:
-        raise ValueError("Repository listing not found")
-
-    rows_affected = update_agent_repository_status_by_id(
-        repository_id=agent_repository_id,
-        status=status,
-        user_id=user_id,
-    )
-    if rows_affected == 0:
-        raise ValueError("Repository listing not found")
-
-    updated = get_agent_repository_by_id(agent_repository_id)
-    if not updated:
-        raise ValueError("Failed to load repository listing after update")
-    return _to_summary_item(updated)
-
-
-def _to_list_item(record: Dict[str, Any]) -> Dict[str, Any]:
-    """Map a DB record to a marketplace list item (without heavy JSON blobs)."""
-    return {
-        "id": record.get("agent_repository_id"),
-        "agent_repository_id": record.get("agent_repository_id"),
-        "agent_id": record.get("agent_id"),
-        "name": record.get("name"),
-        "display_name": record.get("display_name"),
-        "description": record.get("description"),
-        "author": record.get("author"),
-        "category_id": record.get("category_id"),
-        "tags": record.get("tags") or [],
-        "tool_count": record.get("tool_count"),
-        "version_label": record.get("version_label"),
-        "status": record.get("status"),
-        "source_version_no": record.get("source_version_no"),
-        "publisher_tenant_id": record.get("publisher_tenant_id"),
-        "created_at": record.get("create_time"),
-        "updated_at": record.get("update_time"),
-    }
-
-
-def _to_detail_item(
-    record: Dict[str, Any],
-    *,
-    include_bundles: bool = True,
-    is_updated: Optional[bool] = None,
-) -> Dict[str, Any]:
-    """Map a DB record to a marketplace detail payload."""
-    detail = _to_list_item(record)
-    if include_bundles:
-        detail["agent_info_json"] = record.get("agent_info_json")
-    if is_updated is not None:
-        detail["is_updated"] = is_updated
-    return detail
-
-
-def _validate_create_payload(repository_data: Dict[str, Any]) -> None:
-    """Validate required fields before inserting a repository listing."""
-    required_fields = (
-        "agent_id",
-        "source_version_no",
-        "name",
-        "agent_info_json",
-    )
-    missing = [
-        field for field in required_fields
-        if field not in repository_data or repository_data[field] is None
-    ]
-    if missing:
-        raise ValueError(f"Missing required repository fields: {', '.join(missing)}")
-    if not repository_data.get("name"):
-        raise ValueError("name must be a non-empty string")
-
-    agent_info_json = repository_data.get("agent_info_json")
-    if not isinstance(agent_info_json, dict):
-        raise ValueError("agent_info_json must be a JSON object")
-    for key in ("agent_id", "agent_info", "mcp_info"):
-        if key not in agent_info_json:
-            raise ValueError(f"agent_info_json must contain '{key}'")
-
-
-def _validate_agent_info_json_shareable(agent_info_json: dict) -> None:
-    """Reject marketplace share when any agent in the tree belongs to ASSET_OWNER tenant."""
-    agent_info_map = agent_info_json.get("agent_info")
-    if not isinstance(agent_info_map, dict):
-        return
-    for entry in agent_info_map.values():
-        if not isinstance(entry, dict):
-            continue
-        if entry.get("tenant_id") == ASSET_OWNER_TENANT_ID:
-            raise ValueError("租户管理员智能体无法共享")
-
-
-async def _build_agent_info_json(
-    agent_id: int,
-    tenant_id: str,
-    user_id: str,
-    version_no: int,
-) -> dict:
-    """Build marketplace snapshot JSON via the agent export pipeline."""
-    export_dict = await export_agent_dict_for_repository_impl(
-        agent_id=agent_id,
-        tenant_id=tenant_id,
-        user_id=user_id,
-        version_no=version_no,
-    )
-    skills = collect_skill_zip_entries(
-        agent_id=agent_id,
-        tenant_id=tenant_id,
-        version_no=version_no,
-    )
-    snapshot = AgentRepositorySnapshot(
-        **export_dict,
-        skills=skills or None,
-    )
-    return snapshot.model_dump()
-
-
-async def _build_repository_data_from_agent(
-    agent_id: int,
-    tenant_id: str,
-    user_id: str,
-    version_no: int,
-) -> Dict[str, Any]:
-    """Build a repository upsert payload from a published agent version snapshot."""
-    agent_info = search_agent_info_by_agent_id(agent_id, tenant_id, version_no)
-    agent_info_json = await _build_agent_info_json(
-        agent_id=agent_id,
-        tenant_id=tenant_id,
-        user_id=user_id,
-        version_no=version_no,
-    )
-    _validate_agent_info_json_shareable(agent_info_json)
-
-    version_meta = search_version_by_version_no(agent_id, tenant_id, version_no)
-    version_label = (
-        version_meta.get("version_name")
-        if version_meta and version_meta.get("version_name")
-        else f"v{version_no}"
-    )
-
-    return {
-        "agent_id": agent_id,
-        "source_version_no": version_no,
-        "name": agent_info["name"],
-        "display_name": agent_info.get("display_name"),
-        "description": agent_info.get("description"),
-        "author": agent_info.get("author"),
-        "version_label": version_label,
-        "agent_info_json": agent_info_json,
-        "status": STATUS_PENDING_REVIEW,
-    }
-
-
-async def create_agent_repository_listing_impl(
-    agent_id: int,
-    tenant_id: str,
-    user_id: str,
-    version_no: int,
-) -> Dict[str, Any]:
-    """Create or update a repository listing from a published agent version.
-
-    Loads agent metadata and builds agent_info_json via the export pipeline,
-    then inserts or updates the marketplace table.
-
-    When a listing for the same agent_id already exists, snapshot fields are
-    updated via update_agent_repository_by_id.
-    """
-    if version_no < 0:
-        raise ValueError("version_no must be >= 0")
-
-    repository_data = await _build_repository_data_from_agent(
-        agent_id, tenant_id, user_id, version_no
-    )
-    _validate_create_payload(repository_data)
-
-    existing = get_agent_repository_by_agent_id(agent_id)
-    if not existing:
-        repository_id = insert_agent_repository_record(
-            repository_data=repository_data,
-            publisher_tenant_id=tenant_id,
-            publisher_user_id=user_id,
-        )
-        is_updated = False
-    else:
-        repository_id = int(existing["agent_repository_id"])
-        updates = {
-            key: repository_data[key]
-            for key in _UPDATE_SNAPSHOT_FIELDS
-            if key in repository_data
-        }
-        affected = update_agent_repository_by_id(
-            repository_id=repository_id,
-            publisher_tenant_id=tenant_id,
-            user_id=user_id,
-            updates=updates,
-        )
-        if affected == 0:
-            raise ValueError("Failed to update repository listing")
-        is_updated = True
-
-    record = get_agent_repository_by_id(repository_id)
-    if not record:
-        raise ValueError("Failed to load repository listing after write")
-    return _to_detail_item(record, is_updated=is_updated)
-
-
-async def import_agent_from_repository_impl(
-    agent_repository_id: int,
-    authorization: str,
-) -> Dict[int, int]:
-    """Import an agent tree from a marketplace repository listing into the current tenant."""
-    record = get_agent_repository_by_id(agent_repository_id)
-    if not record:
-        raise ValueError("Repository listing not found")
-
-    agent_info_json = record.get("agent_info_json")
-    if not isinstance(agent_info_json, dict):
-        raise ValueError("Repository listing has no agent snapshot")
-
-    snapshot = AgentRepositorySnapshot.model_validate(agent_info_json)
-    if snapshot.skills:
-        return await import_agent_with_skills_impl(
-            snapshot,
-            snapshot.skills,
-            authorization,
-        )
-    return await import_agent_impl(snapshot, authorization)
diff --git a/backend/services/agent_service.py b/backend/services/agent_service.py
index 643d1995e..5a340b1d6 100644
--- a/backend/services/agent_service.py
+++ b/backend/services/agent_service.py
@@ -22,8 +22,7 @@
 from utils.prompt_template_utils import normalize_prompt_generate_template_content
 from consts.const import MEMORY_SEARCH_START_MSG, MEMORY_SEARCH_DONE_MSG, MEMORY_SEARCH_FAIL_MSG, TOOL_TYPE_MAPPING, \
     LANGUAGE, MESSAGE_ROLE, MODEL_CONFIG_MAPPING, CAN_EDIT_ALL_USER_ROLES, PERMISSION_EDIT, PERMISSION_READ, PERMISSION_PRIVATE
-from consts.exceptions import AppException, MemoryPreparationException, SkillDuplicateError
-from consts.error_code import ErrorCode
+from consts.exceptions import MemoryPreparationException, SkillDuplicateError
 from consts.agent_unavailable_reasons import AgentUnavailableReason
 from consts.model import (
     AgentInfoRequest,
@@ -46,9 +45,7 @@
     delete_related_agent,
     insert_related_agent,
     query_all_agent_info_by_tenant_id,
-    query_sub_agent_relations,
     query_sub_agents_id_list,
-    resolve_sub_agent_version_no,
     search_agent_id_by_agent_name,
     search_agent_info_by_agent_id,
     search_blank_sub_agent_by_main_agent_id,
@@ -70,10 +67,8 @@
     search_tools_for_sub_agent
 )
 from database import skill_db
-from database.attachment_db import upload_fileobj
 from services.skill_service import SkillService
-from services.file_management_service import is_allowed_skill_upload_path
-from database.agent_version_db import query_version_list, query_current_version_no
+from database.agent_version_db import query_version_list
 from database.group_db import query_group_ids_by_user
 from database.user_tenant_db import get_user_tenant_by_user_id
 from database.a2a_agent_db import get_server_agent_ids, query_external_sub_agents
@@ -83,7 +78,7 @@
     get_prompt_template_summary,
 )
 from utils.str_utils import convert_list_to_string, convert_string_to_list
-from services.conversation_management_service import save_conversation_assistant, save_conversation_user, save_skill_files_to_conversation
+from services.conversation_management_service import save_conversation_assistant, save_conversation_user
 from services.memory_config_service import build_memory_context
 from utils.auth_utils import get_current_user_info, get_user_language
 from utils.config_utils import tenant_config_manager
@@ -102,139 +97,9 @@
 SAFE_AGENT_STREAM_ERROR_MESSAGE = "Agent execution failed. Please try again later."
 
 
-def _extract_json_objects_from_text(text: str) -> list[dict]:
-    """Extract all JSON objects embedded in a text blob."""
-    if not text:
-        return []
-
-    decoder = json.JSONDecoder()
-    results: list[dict] = []
-    index = 0
-
-    while index < len(text):
-        start_index = text.find("{", index)
-        if start_index < 0:
-            break
-
-        try:
-            payload, end_index = decoder.raw_decode(text, start_index)
-        except json.JSONDecodeError:
-            index = start_index + 1
-            continue
-
-        if isinstance(payload, dict):
-            results.append(payload)
-        index = max(end_index, start_index + 1)
-
-    return results
-
-
-def _extract_skill_file_upload_payloads(content: str) -> list[dict]:
-    """Extract JSON payloads containing absolute_path from streamed tool output."""
-    payloads: list[dict] = []
-    for payload in _extract_json_objects_from_text(content):
-        if payload.get("absolute_path"):
-            payloads.append(payload)
-    return payloads
-
-
-def _transform_skill_files_to_standard_format(upload_results: list[dict]) -> list[dict]:
-    """
-    Transform skill file upload results to match the frontend attachment format.
-
-    Skill upload format:
-        {file_name, absolute_path, object_name, preview_url, url, presigned_url, mime_type, file_size, status}
-    Frontend format:
-        {object_name, name, type, size, url, presigned_url, description}
-    """
-    frontend_files = []
-    for result in upload_results:
-        frontend_files.append({
-            "object_name": result.get("object_name", ""),
-            "name": result.get("file_name", result.get("name", "")),
-            "type": "file",
-            "size": result.get("file_size", result.get("size", 0)),
-            "url": result.get("url", ""),
-            "presigned_url": result.get("presigned_url", result.get("preview_url", "")),
-            "description": "",
-        })
-    return frontend_files
-
-
-async def _process_skill_file_uploads(
-    content: str,
-    user_id: str,
-    tenant_id: str,
-) -> list[dict]:
-    """Upload generated skill files to storage and return upload metadata."""
-
-    upload_results: list[dict] = []
-    for payload in _extract_skill_file_upload_payloads(content):
-        absolute_path = str(payload.get("absolute_path") or "").strip()
-        file_name = str(
-            payload.get("file_name")
-            or payload.get("file_path")
-            or os.path.basename(absolute_path)
-        )
-        mime_type = str(payload.get("mime_type") or payload.get("content_type") or "application/octet-stream")
-        if not absolute_path:
-            continue
-
-        if not is_allowed_skill_upload_path(absolute_path):
-            logger.warning(
-                "[skill-file] rejected unsafe path absolute_path=%s",
-                absolute_path,
-            )
-            continue
-
-        if not file_name:
-            file_name = os.path.basename(absolute_path)
-
-        if not os.path.exists(absolute_path):
-            continue
-
-        try:
-            file_size = os.path.getsize(absolute_path)
-            actual_prefix = f"skill-files/{user_id}" if user_id else "skill-files"
-            with open(absolute_path, "rb") as file_obj:
-                upload_result = upload_fileobj(
-                    file_obj=file_obj,
-                    file_name=file_name,
-                    prefix=actual_prefix,
-                    generate_presigned_url=True,
-                    file_size=file_size,
-                )
-
-            if upload_result.get("success"):
-                upload_results.append(
-                    {
-                        "status": "success",
-                        "file_name": file_name,
-                        "absolute_path": absolute_path,
-                        "object_name": upload_result.get("object_name"),
-                        "preview_url": upload_result.get("presigned_url") or upload_result.get("url"),
-                        "url": upload_result.get("url"),
-                        "presigned_url": upload_result.get("presigned_url"),
-                        "mime_type": mime_type,
-                        "file_size": upload_result.get("file_size", file_size),
-                    }
-                )
-            else:
-                error_message = upload_result.get("error") or "Upload failed"
-                logger.warning(
-                    "[skill-file] upload failed file_name=%s absolute_path=%s error=%s",
-                    file_name,
-                    absolute_path,
-                    error_message,
-                )
-        except Exception as exc:
-            logger.exception(
-                "[skill-file] failed to upload file file_name=%s absolute_path=%s",
-                file_name,
-                absolute_path,
-            )
-
-    return upload_results
+# -------------------------------------------------------------
+# Internal helper functions
+# -------------------------------------------------------------
 
 
 def _safe_agent_stream_error_chunk() -> str:
@@ -782,53 +647,23 @@ async def _stream_agent_chunks(
     agent_run_info,
     memory_ctx,
 ):
-    """Yield SSE chunks from agent_run while persisting messages and cleanup."""
+    """Yield SSE chunks from agent_run, then persist messages and clean up.
+
+    This utility centralizes the common streaming logic used by both
+    generate_stream_with_memory and generate_stream_no_memory so that the code
+    is easier to maintain and less error-prone.
+    """
 
     local_messages = []
     captured_final_answer = None
-    captured_skill_files: dict[str, dict] = {}
-    skill_file_uploads: list[dict] = []
     try:
         async for chunk in agent_run(agent_run_info):
             local_messages.append(chunk)
+            # Try to capture the final answer as it streams by in order to start memory addition
             try:
                 data = json.loads(chunk)
-                chunk_type = data.get("type")
-                if chunk_type == "final_answer":
+                if data.get("type") == "final_answer":
                     captured_final_answer = data.get("content")
-
-                should_parse_skill_file = chunk_type in {"execution_logs", "parse"} or data.get("role") == "tool-response"
-                if should_parse_skill_file:
-                    extracted_payload_count = 0
-                    content_value = data.get("content")
-                    if isinstance(content_value, list):
-                        content_items = content_value
-                    elif content_value:
-                        content_items = [{"type": "text", "text": str(content_value)}]
-                    else:
-                        content_items = []
-
-                    for item in content_items:
-                        if isinstance(item, dict) and item.get("type") == "text":
-                            text_value = item.get("text")
-                            if text_value:
-                                extracted_payloads = _extract_json_objects_from_text(text_value)
-                                for payload in extracted_payloads:
-                                    absolute_path = str(payload.get("absolute_path") or "").strip()
-                                    if not absolute_path:
-                                        continue
-                                    if absolute_path in captured_skill_files:
-                                        continue
-                                    if not os.path.exists(absolute_path):
-                                        continue
-                                    captured_skill_files[absolute_path] = payload
-                                    extracted_payload_count += 1
-                    if extracted_payload_count:
-                        logger.info(
-                            "[skill-file] captured payloads count=%s current_total=%s",
-                            extracted_payload_count,
-                            len(captured_skill_files),
-                        )
             except Exception:
                 pass
             yield f"data: {chunk}\n\n"
@@ -836,6 +671,7 @@ async def _stream_agent_chunks(
         logger.error("Agent run error: %r", run_exc, exc_info=True)
         yield _safe_agent_stream_error_chunk()
     finally:
+        # Persist assistant messages for non-debug runs
         if not agent_request.is_debug:
             save_messages(
                 agent_request,
@@ -844,54 +680,11 @@ async def _stream_agent_chunks(
                 tenant_id=tenant_id,
                 user_id=user_id,
             )
+        # Always unregister the run to release resources
         agent_run_manager.unregister_agent_run(
             agent_request.conversation_id, user_id)
 
-        try:
-            skill_file_content_local = "\n".join(
-                json.dumps(payload, ensure_ascii=False)
-                for payload in captured_skill_files.values()
-            )
-            if skill_file_content_local:
-                skill_file_uploads = await _process_skill_file_uploads(
-                    content=skill_file_content_local,
-                    user_id=user_id,
-                    tenant_id=tenant_id,
-                )
-                logger.info(
-                    "[skill-file] upload finished conversation=%s result_count=%s results=%s",
-                    agent_request.conversation_id,
-                    len(skill_file_uploads), skill_file_uploads
-                )
-                if skill_file_uploads:
-                    # Keep original format for real-time SSE display
-                    skill_files_payload = json.dumps(
-                        {"skill_file_uploads": skill_file_uploads},
-                        ensure_ascii=False,
-                    )
-                    try:
-                        yield f"data: {json.dumps({'type': 'skill_files', 'content': skill_files_payload}, ensure_ascii=False)}\n\n"
-                    except RuntimeError:
-                        # Stream is closing (e.g., client disconnect). Avoid raising during generator teardown.
-                        pass
-                    # Persist skill file uploads to the conversation history so they
-                    # appear in subsequent GET /conversation/{id} calls.
-                    # Transform to frontend attachment format (object_name, name, type, size, etc.)
-                    try:
-                        frontend_files = _transform_skill_files_to_standard_format(skill_file_uploads)
-                        save_skill_files_to_conversation(
-                            conversation_id=agent_request.conversation_id,
-                            skill_file_uploads=frontend_files,
-                            user_id=user_id,
-                        )
-                    except Exception:
-                        logger.exception(
-                            "[skill-file] failed to persist skill file uploads to conversation=%s",
-                            agent_request.conversation_id,
-                        )
-        except Exception:
-            logger.exception("Failed to process skill file uploads")
-
+        # Schedule memory addition in background to avoid blocking SSE termination
         async def _add_memory_background():
             try:
                 # Skip if memory recording is disabled
@@ -986,13 +779,14 @@ async def get_agent_info_impl(agent_id: int, tenant_id: str, version_no: int = 0
             user_role = str(user_tenant_record.get("user_role") or "").upper()
             can_edit_all = user_role in CAN_EDIT_ALL_USER_ROLES
 
-            # Permission logic (same as agent list, including ASSET_OWNER read-only override)
-            agent_info["permission"] = resolve_agent_list_permission(
-                user_role=user_role,
-                agent=agent_info,
-                user_id=user_id,
-                can_edit_all=can_edit_all,
-            )
+            # Permission logic (same as agent list):
+            # - If creator or can_edit_all: PERMISSION_EDIT
+            # - Otherwise: use ingroup_permission, default to PERMISSION_READ if None
+            if can_edit_all or str(agent_info.get("created_by")) == str(user_id):
+                agent_info["permission"] = PERMISSION_EDIT
+            else:
+                ingroup_permission = agent_info.get("ingroup_permission")
+                agent_info["permission"] = ingroup_permission if ingroup_permission is not None else PERMISSION_READ
         except Exception as e:
             logger.warning(f"Failed to calculate agent permission: {str(e)}")
 
@@ -1068,12 +862,6 @@ async def get_agent_info_impl(agent_id: int, tenant_id: str, version_no: int = 0
     agent_info["is_available"] = is_available
     agent_info["unavailable_reasons"] = unavailable_reasons
 
-    # Set current_version_no from draft record (version_no=0)
-    # This ensures the returned data always has the current published version info
-    if version_no > 0:
-        draft_version_no = query_current_version_no(agent_id, tenant_id)
-        agent_info["current_version_no"] = draft_version_no
-
     return agent_info
 
 
@@ -1118,10 +906,6 @@ async def get_creating_sub_agent_info_impl(authorization: str = Header(None)):
 
 async def update_agent_info_impl(request: AgentInfoRequest, authorization: str = Header(None)):
     user_id, tenant_id, _ = get_current_user_info(authorization)
-
-    if request.example_questions is not None and len(request.example_questions) > 6:
-        raise AppException(ErrorCode.COMMON_PARAMETER_INVALID, "example_questions cannot exceed 6 items")
-
     prompt_template_id, prompt_template_name = get_prompt_template_summary(
         template_id=request.prompt_template_id,
         tenant_id=tenant_id,
@@ -1148,12 +932,9 @@ async def update_agent_info_impl(request: AgentInfoRequest, authorization: str =
                 "prompt_template_name": prompt_template_name,
                 "max_steps": request.max_steps,
                 "provide_run_summary": request.provide_run_summary,
-                "verification_config": request.verification_config,
                 "duty_prompt": request.duty_prompt,
                 "constraint_prompt": request.constraint_prompt,
                 "few_shots_prompt": request.few_shots_prompt,
-                "greeting_message": request.greeting_message,
-                "example_questions": request.example_questions,
                 "enabled": request.enabled if request.enabled is not None else True,
                 "group_ids": convert_list_to_string(request.group_ids) if request.group_ids else user_group_ids,
                 "ingroup_permission": request.ingroup_permission
@@ -1421,216 +1202,76 @@ async def clear_agent_memory(agent_id: int, tenant_id: str, user_id: str):
         # Silently fail to maintain agent deletion process
 
 
-async def _export_agent_dict_core(
-    root_agent_id: int,
-    tenant_id: str,
-    user_id: str,
-    version_no: int = 0,
-) -> dict:
-    """Build ExportAndImportDataFormat dict for an agent tree at the given version."""
+async def export_agent_impl(agent_id: int, authorization: str = Header(None)) -> str:
+    """
+    Export the configuration information of the specified agent and all its sub-agents.
+
+    Args:
+        agent_id (int): The ID of the agent to export.
+        authorization (str): User authentication information, obtained from the Header.
+
+    Returns:
+        str: A JSON string (json.dumps of the ExportAndImportDataFormat model dump) containing the configuration information of the agent and all its sub-agents.
+
+    Data Structure Example:
+        See ExportAndImportDataFormat in model.py.
+
+    Note:
+        This function walks the agent and all of its managed sub-agents iteratively with a queue (each agent is visited once), exports the detailed configuration of each agent (including tools, prompts, etc.) into a dictionary, and finally returns it as a JSON string for frontend download and backup.
+    """
+
+    user_id, tenant_id, _ = get_current_user_info(authorization)
+
     export_agent_dict = {}
-    search_list: deque = deque([(root_agent_id, version_no)])
-    visited: set = set()
+    search_list = deque([agent_id])
+    agent_id_set = set()
 
     mcp_info_set = set()
 
-    while search_list:
-        current_agent_id, current_version_no = search_list.popleft()
-        visit_key = (current_agent_id, current_version_no)
-        if visit_key in visited:
+    while len(search_list):
+        left_ele = search_list.popleft()
+        if left_ele in agent_id_set:
             continue
-        visited.add(visit_key)
 
-        agent_info = await export_agent_by_agent_id(
-            agent_id=current_agent_id,
-            tenant_id=tenant_id,
-            user_id=user_id,
-            version_no=current_version_no,
-        )
+        agent_id_set.add(left_ele)
+        agent_info = await export_agent_by_agent_id(agent_id=left_ele, tenant_id=tenant_id, user_id=user_id)
 
+        # collect mcp name
         for tool in agent_info.tools:
             if tool.source == "mcp" and tool.usage:
                 mcp_info_set.add(tool.usage)
 
-        relations = query_sub_agent_relations(
-            main_agent_id=current_agent_id,
-            tenant_id=tenant_id,
-            version_no=current_version_no,
-        )
-        for rel in relations:
-            child_id = rel["selected_agent_id"]
-            child_version = resolve_sub_agent_version_no(
-                child_id,
-                rel.get("selected_agent_version_no"),
-                tenant_id,
-            )
-            search_list.append((child_id, child_version))
-
+        search_list.extend(agent_info.managed_agents)
         export_agent_dict[str(agent_info.agent_id)] = agent_info
 
+    # convert mcp info to MCPInfo list
     mcp_info_list = []
     for mcp_server_name in mcp_info_set:
+        # get mcp url by mcp_server_name and tenant_id
         mcp_url = get_mcp_server_by_name_and_tenant(mcp_server_name, tenant_id)
         mcp_info_list.append(
             MCPInfo(mcp_server_name=mcp_server_name, mcp_url=mcp_url))
 
     export_data = ExportAndImportDataFormat(
-        agent_id=root_agent_id,
-        agent_info=export_agent_dict,
-        mcp_info=mcp_info_list,
-    )
-    return export_data.model_dump()
+        agent_id=agent_id, agent_info=export_agent_dict, mcp_info=mcp_info_list)
+    return json.dumps(export_data.model_dump())
 
 
-async def export_agent_dict_impl(
-    agent_id: int,
-    authorization: str = Header(None),
-    version_no: int = 0,
-) -> dict:
+async def export_agent_by_agent_id(agent_id: int, tenant_id: str, user_id: str) -> ExportAndImportAgentInfo:
     """
-    Export the configuration information of the specified agent and all its sub-agents.
-
-    Args:
-        agent_id (int): The ID of the agent to export.
-        authorization (str): User authentication information, obtained from the Header.
-        version_no (int): Version to export. Default 0 = draft.
-
-    Returns:
-        dict: ExportAndImportDataFormat as a plain dict (via model_dump).
+    Export a single agent's information based on agent_id
     """
-    user_id, tenant_id, _ = get_current_user_info(authorization)
-    return await _export_agent_dict_core(
-        root_agent_id=agent_id,
-        tenant_id=tenant_id,
-        user_id=user_id,
-        version_no=version_no,
-    )
-
-
-async def export_agent_dict_for_repository_impl(
-    agent_id: int,
-    tenant_id: str,
-    user_id: str,
-    version_no: int,
-) -> dict:
-    """Export agent tree for marketplace repository storage (no HTTP auth header)."""
-    return await _export_agent_dict_core(
-        root_agent_id=agent_id,
-        tenant_id=tenant_id,
-        user_id=user_id,
-        version_no=version_no,
-    )
-
-
-async def export_agent_impl(
-    agent_id: int,
-    authorization: str = Header(None),
-    version_no: int = 0,
-) -> str:
-    """Serialize export_agent_dict_impl output to a JSON string for download or ZIP embedding."""
-    agent_dict = await export_agent_dict_impl(
-        agent_id, authorization, version_no=version_no
-    )
-    return json.dumps(agent_dict)
-
-
-def _collect_skill_names_from_tree(
-    agent_id: int,
-    tenant_id: str,
-    version_no: int,
-    visited: Optional[set] = None,
-) -> List[str]:
-    """Collect unique skill names from an agent tree at the given version."""
-    if visited is None:
-        visited = set()
-
-    skill_names: List[str] = []
-    seen_names: set = set()
-
-    def _walk(current_agent_id: int, current_version_no: int) -> None:
-        visit_key = (current_agent_id, current_version_no)
-        if visit_key in visited:
-            return
-        visited.add(visit_key)
-
-        skill_instances = skill_db.query_skill_instances_by_agent_id(
-            agent_id=current_agent_id,
-            tenant_id=tenant_id,
-            version_no=current_version_no,
-        )
-        for inst in skill_instances:
-            skill_id = inst.get("skill_id")
-            skill = skill_db.get_skill_by_id(skill_id, tenant_id)
-            if skill:
-                name = skill.get("name")
-                if name and name not in seen_names:
-                    seen_names.add(name)
-                    skill_names.append(name)
-
-        relations = query_sub_agent_relations(
-            main_agent_id=current_agent_id,
-            tenant_id=tenant_id,
-            version_no=current_version_no,
-        )
-        for rel in relations:
-            child_id = rel["selected_agent_id"]
-            child_version = resolve_sub_agent_version_no(
-                child_id,
-                rel.get("selected_agent_version_no"),
-                tenant_id,
-            )
-            _walk(child_id, child_version)
-
-    _walk(agent_id, version_no)
-    return skill_names
-
-
-def collect_skill_zip_entries(
-    agent_id: int,
-    tenant_id: str,
-    version_no: int = 0,
-) -> List[SkillZipEntry]:
-    """Export skill ZIP payloads for all skills in an agent tree."""
-    skill_names = _collect_skill_names_from_tree(agent_id, tenant_id, version_no)
-    if not skill_names:
-        return []
-
-    skill_service = SkillService(tenant_id=tenant_id)
-    exported = skill_service.export_skills_by_names(skill_names, tenant_id)
-    return [
-        SkillZipEntry(
-            skill_name=entry["skill_name"],
-            skill_zip_base64=entry["skill_zip_base64"],
-        )
-        for entry in exported
-    ]
-
-
-async def export_agent_by_agent_id(
-    agent_id: int,
-    tenant_id: str,
-    user_id: str,
-    version_no: int = 0,
-) -> ExportAndImportAgentInfo:
-    """Export a single agent's information based on agent_id and version_no."""
     agent_info = search_agent_info_by_agent_id(
-        agent_id=agent_id, tenant_id=tenant_id, version_no=version_no
-    )
+        agent_id=agent_id, tenant_id=tenant_id)
     agent_relation_in_db = query_sub_agents_id_list(
-        main_agent_id=agent_id, tenant_id=tenant_id, version_no=version_no
-    )
-    tool_list = await create_tool_config_list(
-        agent_id=agent_id,
-        tenant_id=tenant_id,
-        user_id=user_id,
-        version_no=version_no,
-    )
+        main_agent_id=agent_id, tenant_id=tenant_id)
+    tool_list = await create_tool_config_list(agent_id=agent_id, tenant_id=tenant_id, user_id=user_id)
 
     # Collect skill names from skill instances
     skill_names: List[str] = []
     try:
         skill_instances = skill_db.query_skill_instances_by_agent_id(
-            agent_id=agent_id, tenant_id=tenant_id, version_no=version_no
+            agent_id=agent_id, tenant_id=tenant_id, version_no=0
         )
         for inst in skill_instances:
             skill_id = inst.get("skill_id")
@@ -1666,7 +1307,6 @@ async def export_agent_by_agent_id(
             "display_name") if business_logic_model_info is not None else None
 
     agent_info = ExportAndImportAgentInfo(agent_id=agent_id,
-                                          tenant_id=agent_info["tenant_id"],
                                           name=agent_info["name"],
                                           display_name=agent_info["display_name"],
                                           description=agent_info["description"],
@@ -1674,7 +1314,6 @@ async def export_agent_by_agent_id(
                                           author=agent_info.get("author"),
                                           max_steps=agent_info["max_steps"],
                                           provide_run_summary=agent_info["provide_run_summary"],
-                                          verification_config=agent_info.get("verification_config"),
                                           duty_prompt=agent_info.get(
                                               "duty_prompt"),
                                           constraint_prompt=agent_info.get(
@@ -1829,7 +1468,6 @@ async def import_agent_by_agent_id(
                                          "prompt_template_name": import_agent_info.prompt_template_name or SYSTEM_PROMPT_TEMPLATE_NAME,
                                          "max_steps": import_agent_info.max_steps,
                                          "provide_run_summary": import_agent_info.provide_run_summary,
-                                         "verification_config": getattr(import_agent_info, "verification_config", None),
                                          "duty_prompt": import_agent_info.duty_prompt,
                                          "constraint_prompt": import_agent_info.constraint_prompt,
                                          "few_shots_prompt": import_agent_info.few_shots_prompt,
@@ -2197,7 +1835,6 @@ async def prepare_agent_run(
         is_debug=agent_request.is_debug,
         override_version_no=agent_request.version_no,
         override_model_id=agent_request.model_id,
-        tool_params=agent_request.tool_params,
     )
 
     # Mount conversation-level reusable ContextManager if enabled
@@ -2643,45 +2280,52 @@ def get_sub_agents_recursive(parent_agent_id: int, depth: int = 0, max_depth: in
         raise ValueError(f"Failed to get agent call relationship: {str(e)}")
 
 
-async def export_agent_with_skills_impl(
-    agent_id: int,
-    authorization: str,
-    version_no: int = 0,
-) -> dict:
-    """Export an agent, returning a ZIP if it has skill instances, otherwise a plain dict.
+async def export_agent_with_skills_impl(agent_id: int, authorization: str) -> dict:
+    """Export an agent, returning a ZIP if it has skill instances, otherwise plain JSON.
 
     The response is either:
       - A dict with {"_zip": True, "data": bytes, "filename": str} when the agent has skills
-      - ExportAndImportDataFormat as a plain dict when the agent has no skills
+      - A JSON string (the output of export_agent_impl) when the agent has no skills
     """
+    from services.skill_service import SkillService
+
     user_id, tenant_id, _ = get_current_user_info(authorization)
 
-    skill_zip_entries = collect_skill_zip_entries(
-        agent_id=agent_id, tenant_id=tenant_id, version_no=version_no
+    skill_instances = skill_db.query_skill_instances_by_agent_id(
+        agent_id=agent_id, tenant_id=tenant_id, version_no=0
     )
 
-    if not skill_zip_entries:
-        return await export_agent_dict_impl(
-            agent_id, authorization, version_no=version_no
-        )
+    if not skill_instances:
+        return await export_agent_impl(agent_id, authorization)
 
-    agent_json_str = await export_agent_impl(
-        agent_id, authorization, version_no=version_no
-    )
+    skill_names = []
+    for inst in skill_instances:
+        skill_id = inst.get("skill_id")
+        skill = skill_db.get_skill_by_id(skill_id, tenant_id)
+        if skill:
+            skill_names.append(skill.get("name"))
+
+    if not skill_names:
+        return await export_agent_impl(agent_id, authorization)
+
+    agent_json_str = await export_agent_impl(agent_id, authorization)
+
+    skill_service = SkillService(tenant_id=tenant_id)
+    skill_zip_entries = skill_service.export_skills_by_names(
+        skill_names, tenant_id)
 
     zip_buffer = io.BytesIO()
     with zipfile.ZipFile(zip_buffer, "w", zipfile.ZIP_DEFLATED) as zf:
         zf.writestr("agent.json", agent_json_str)
         for entry in skill_zip_entries:
-            skill_zip_bytes = base64.b64decode(entry.skill_zip_base64)
-            zf.writestr(f"skills/{entry.skill_name}.zip", skill_zip_bytes)
+            skill_zip_bytes = base64.b64decode(entry["skill_zip_base64"])
+            zf.writestr(f"skills/{entry['skill_name']}.zip", skill_zip_bytes)
 
     zip_buffer.seek(0)
     zip_data = zip_buffer.read()
 
     agent_info = search_agent_info_by_agent_id(
-        agent_id=agent_id, tenant_id=tenant_id, version_no=version_no
-    )
+        agent_id=agent_id, tenant_id=tenant_id)
     agent_name = agent_info.get(
         "name", "anonymous") if agent_info else "anonymous"
 
diff --git a/backend/services/agent_version_service.py b/backend/services/agent_version_service.py
index 8ed6e14d4..d7096727b 100644
--- a/backend/services/agent_version_service.py
+++ b/backend/services/agent_version_service.py
@@ -49,17 +49,6 @@ def _remove_audit_fields_for_insert(data: dict) -> None:
     data.pop('delete_flag', None)
 
 
-def _build_sub_agent_relations(relations: List[dict]) -> List[dict]:
-    """Map relation snapshots to sub-agent relation payloads for API responses."""
-    return [
-        {
-            'agent_id': r['selected_agent_id'],
-            'version_no': r.get('selected_agent_version_no'),
-        }
-        for r in relations
-    ]
-
-
 def publish_version_impl(
     agent_id: int,
     tenant_id: str,
@@ -103,18 +92,11 @@ def publish_version_impl(
         _remove_audit_fields_for_insert(tool_snapshot)
         insert_tool_snapshot(tool_snapshot)
 
-    # Insert relation snapshots with pinned child agent versions
+    # Insert relation snapshots
     for rel in relations_draft:
-        child_id = rel['selected_agent_id']
-        child_version = query_current_version_no(child_id, tenant_id)
-        if child_version is None:
-            raise ValueError(
-                f"Sub-agent {child_id} has no published version; publish the sub-agent first."
-            )
         rel_snapshot = rel.copy()
         rel_snapshot.pop('version_no', None)
         rel_snapshot['version_no'] = new_version_no
-        rel_snapshot['selected_agent_version_no'] = child_version
         _remove_audit_fields_for_insert(rel_snapshot)
         insert_relation_snapshot(rel_snapshot)
 
@@ -289,7 +271,6 @@ def get_version_detail_impl(
 
     # Extract sub_agent_id_list from relations
     result['sub_agent_id_list'] = [r['selected_agent_id'] for r in relations_snapshot]
-    result['sub_agent_relations'] = _build_sub_agent_relations(relations_snapshot)
 
     # Get skill instances for this version (from ag_skill_instance_t with version_no)
     from database import skill_db as skill_db_module
@@ -729,7 +710,6 @@ def _get_version_detail_or_draft(
         # Add tools (only enabled tools)
         result['tools'] = [t for t in tools_draft if t.get('enabled', True)]
         result['sub_agent_id_list'] = [r['selected_agent_id'] for r in relations_draft]
-        result['sub_agent_relations'] = _build_sub_agent_relations(relations_draft)
 
         # Get draft skill instances (version_no=0)
         skills_draft = skill_db_module.query_skill_instances_by_agent_id(
@@ -803,11 +783,12 @@ async def list_published_agents_impl(
             CAN_EDIT_ALL_USER_ROLES,
             get_user_tenant_by_user_id,
             query_group_ids_by_user,
+            PERMISSION_EDIT,
+            PERMISSION_READ,
             get_model_by_model_id,
             check_agent_availability,
             _apply_duplicate_name_availability_rules,
         )
-        from services.asset_owner_visibility import resolve_agent_list_permission
         from database.agent_version_db import query_agent_snapshot
 
         # Get user role for permission check
@@ -877,10 +858,9 @@ async def list_published_agents_impl(
 
             # Extract sub_agent_id_list from relations
             agent_info['sub_agent_id_list'] = [r['selected_agent_id'] for r in relations_snapshot]
-            agent_info['sub_agent_relations'] = _build_sub_agent_relations(relations_snapshot)
 
-            # Add current version info
-            agent_info['current_version_no'] = current_version_no
+            # Add published version info
+            agent_info['published_version_no'] = current_version_no
 
             # Check agent availability using the shared function
             _, unavailable_reasons = check_agent_availability(
@@ -913,12 +893,7 @@ async def list_published_agents_impl(
                     model_cache[model_id] = get_model_by_model_id(model_id, tenant_id)
                 model_info = model_cache.get(model_id)
 
-            permission = resolve_agent_list_permission(
-                user_role=user_role,
-                agent=agent,
-                user_id=user_id,
-                can_edit_all=can_edit_all,
-            )
+            permission = PERMISSION_EDIT if can_edit_all or str(agent.get("created_by")) == str(user_id) else PERMISSION_READ
 
             simple_agent_list.append({
                 "agent_id": agent.get("agent_id"),
@@ -934,9 +909,7 @@ async def list_published_agents_impl(
                 "is_new": agent.get("is_new", False),
                 "group_ids": agent.get("group_ids", []),
                 "permission": permission,
-                "current_version_no": agent.get("current_version_no"),
-                "greeting_message": agent.get("greeting_message"),
-                "example_questions": agent.get("example_questions"),
+                "published_version_no": agent.get("published_version_no"),
             })
 
         return simple_agent_list
diff --git a/backend/services/cas_service.py b/backend/services/cas_service.py
deleted file mode 100644
index 7db3fce1a..000000000
--- a/backend/services/cas_service.py
+++ /dev/null
@@ -1,424 +0,0 @@
-import json
-import logging
-import os
-import secrets
-import ssl
-import urllib.parse
-import urllib.request
-from xml.etree.ElementTree import Element
-from dataclasses import dataclass
-from datetime import datetime, timedelta
-from typing import Any, Dict, Optional
-
-import defusedxml.ElementTree as ET
-from defusedxml.common import DefusedXmlException
-
-from consts.const import (
-    CAS_CA_BUNDLE,
-    CAS_CALLBACK_BASE_URL,
-    CAS_EMAIL_ATTRIBUTE,
-    CAS_ENABLED,
-    CAS_LOGIN_MODE,
-    CAS_LOGOUT_URL,
-    CAS_RENEW_BEFORE_SECONDS,
-    CAS_RENEW_TIMEOUT_SECONDS,
-    CAS_ROLE_ATTRIBUTE,
-    CAS_ROLE_MAP_JSON,
-    CAS_SERVER_URL,
-    CAS_SESSION_MAX_AGE_SECONDS,
-    CAS_SSL_VERIFY,
-    CAS_SYNTHETIC_EMAIL_DOMAIN,
-    CAS_TENANT_ATTRIBUTE,
-    CAS_USER_ATTRIBUTE,
-    CAS_VALIDATE_PATH,
-    DEFAULT_TENANT_ID,
-    LOCAL_SESSION_MAX_AGE_SECONDS,
-)
-from database.cas_session_db import (
-    create_cas_session,
-    revoke_cas_session_by_index,
-    revoke_cas_sessions_by_user_id,
-)
-from database.oauth_account_db import get_oauth_account_by_provider
-from database.user_tenant_db import get_user_tenant_by_user_id, upsert_user_tenant
-from services.oauth_service import (
-    create_or_update_oauth_account,
-    find_supabase_user_id_by_email,
-)
-from services.skill_service import init_skill_list_for_tenant
-from services.tool_configuration_service import init_tool_list_for_tenant
-from utils.auth_utils import calculate_expires_at, generate_session_jwt, get_supabase_admin_client
-
-logger = logging.getLogger(__name__)
-
-CAS_PROVIDER = "cas"
-VALID_ROLES = {"SU", "ADMIN", "DEV", "USER"}
-
-
-class CasAuthenticationError(Exception):
-    pass
-
-
-@dataclass
-class CasPrincipal:
-    cas_user_id: str
-    email: str
-    username: str
-    role: str
-    tenant_id: str
-    session_index: str
-    expires_at: datetime
-
-
-def get_cas_config() -> Dict[str, Any]:
-    mode = CAS_LOGIN_MODE if CAS_LOGIN_MODE in {"button", "force", "disabled"} else "disabled"
-    enabled = CAS_ENABLED and bool(CAS_SERVER_URL)
-    if not enabled:
-        mode = "disabled"
-    return {
-        "enabled": enabled,
-        "login_mode": mode,
-        "renew_before_seconds": CAS_RENEW_BEFORE_SECONDS,
-        "renew_timeout_seconds": CAS_RENEW_TIMEOUT_SECONDS,
-        "display_name": "CAS",
-    }
-
-
-def build_login_url(redirect: str = "/") -> str:
-    _ensure_enabled()
-    service_url = _build_callback_url("/api/user/cas/callback", {"redirect": _normalize_redirect(redirect)})
-    return f"{CAS_SERVER_URL}/login?service={service_url}"
-
-
-def build_renew_url() -> str:
-    _ensure_enabled()
-    service_url = _build_callback_url("/api/user/cas/renew_callback", {})
-    return f"{CAS_SERVER_URL}/login?service={service_url}&gateway=true"
-
-
-def build_logout_url() -> str:
-    _ensure_enabled()
-    configured_logout_url = CAS_LOGOUT_URL.strip()
-    if not configured_logout_url:
-        return ""
-
-    parsed_config = urllib.parse.urlsplit(configured_logout_url)
-    if parsed_config.scheme and parsed_config.netloc:
-        logout_url = configured_logout_url
-    else:
-        logout_url = f"{CAS_SERVER_URL}/{configured_logout_url.lstrip('/')}"
-
-    parsed = urllib.parse.urlsplit(logout_url)
-    if parsed.query:
-        return logout_url
-
-    query = f"service={CAS_CALLBACK_BASE_URL}"
-    return urllib.parse.urlunsplit((parsed.scheme, parsed.netloc, parsed.path, query, parsed.fragment))
-
-
-async def login_with_ticket(ticket: str, redirect: str = "/") -> Dict[str, Any]:
-    redirect = _normalize_redirect(redirect)
-    service_url = _build_callback_url("/api/user/cas/callback", {"redirect": redirect})
-    principal = validate_service_ticket(ticket, service_url)
-    return await _create_project_session(principal, redirect=redirect)
-
-
-async def renew_with_ticket(ticket: str) -> Dict[str, Any]:
-    service_url = _build_callback_url("/api/user/cas/renew_callback", {})
-    principal = validate_service_ticket(ticket, service_url)
-    return await _create_project_session(principal, redirect="/", renew=True)
-
-
-def validate_service_ticket(ticket: str, service_url: str) -> CasPrincipal:
-    _ensure_enabled()
-    if not ticket:
-        raise CasAuthenticationError("CAS ticket is missing")
-
-    validate_path = CAS_VALIDATE_PATH if CAS_VALIDATE_PATH.startswith("/") else f"/{CAS_VALIDATE_PATH}"
-    validate_url = f"{CAS_SERVER_URL}{validate_path}"
-    xml_text = _http_get_text(f"{validate_url}?service={service_url}&ticket={ticket}")
-    logger.info("CAS serviceValidate response: %s", xml_text)
-    return parse_service_validate_response(xml_text, fallback_session_index=ticket)
-
-
-def parse_service_validate_response(xml_text: str, fallback_session_index: str = "") -> CasPrincipal:
-    try:
-        root = ET.fromstring(xml_text)
-    except (ET.ParseError, DefusedXmlException) as exc:
-        raise CasAuthenticationError("Invalid CAS validation response") from exc
-
-    failure = _find_first(root, "authenticationFailure")
-    if failure is not None:
-        raise CasAuthenticationError((failure.text or "CAS authentication failed").strip())
-
-    success = _find_first(root, "authenticationSuccess")
-    if success is None:
-        raise CasAuthenticationError("CAS authentication failed")
-
-    user = _get_child_text(success, "user")
-    attrs_node = _find_first(success, "attributes")
-    attrs = _extract_attributes(attrs_node) if attrs_node is not None else {}
-
-    cas_user_id = _attribute_or_default(attrs, CAS_USER_ATTRIBUTE, user) or user
-    if not cas_user_id:
-        raise CasAuthenticationError("CAS user id is missing")
-
-    email = _attribute_or_default(attrs, CAS_EMAIL_ATTRIBUTE, "")
-    username = attrs.get("displayName") or attrs.get("name") or cas_user_id
-    role = _map_role(_attribute_or_default(attrs, CAS_ROLE_ATTRIBUTE, "USER"))
-    tenant_id = _attribute_or_default(attrs, CAS_TENANT_ATTRIBUTE, DEFAULT_TENANT_ID) or DEFAULT_TENANT_ID
-    session_index = attrs.get("SessionIndex") or attrs.get("sessionIndex") or fallback_session_index
-    expires_at = _resolve_expires_at(attrs)
-
-    if not email:
-        safe_user = "".join(c if c.isalnum() or c in ("-", "_", ".") else "_" for c in cas_user_id)
-        email = f"{safe_user}@{CAS_SYNTHETIC_EMAIL_DOMAIN}"
-
-    return CasPrincipal(
-        cas_user_id=str(cas_user_id),
-        email=str(email).lower(),
-        username=str(username),
-        role=role,
-        tenant_id=str(tenant_id),
-        session_index=str(session_index or ""),
-        expires_at=expires_at,
-    )
-
-
-def parse_logout_request(logout_request: str) -> Dict[str, str]:
-    if not logout_request:
-        return {"cas_user_id": "", "session_index": ""}
-    try:
-        root = ET.fromstring(logout_request)
-    except (ET.ParseError, DefusedXmlException):
-        logger.warning("Invalid CAS logoutRequest XML")
-        return {"cas_user_id": "", "session_index": ""}
-
-    session_index = _get_child_text(root, "SessionIndex")
-    cas_user_id = (
-        _get_child_text(root, "NameID")
-        or _get_child_text(root, "nameID")
-        or _get_child_text(root, "user")
-        or _get_child_text(root, "casUserId")
-    )
-    return {"cas_user_id": cas_user_id or "", "session_index": session_index or ""}
-
-
-def revoke_from_logout_request(logout_request: str) -> Dict[str, Any]:
-    parsed = parse_logout_request(logout_request)
-    revoked = 0
-    if parsed["cas_user_id"]:
-        revoked = revoke_cas_sessions_by_user_id(parsed["cas_user_id"])
-        logger.info(
-            "CAS SLO revoke by cas_user_id: cas_user_id=%s revoked=%s",
-            parsed["cas_user_id"],
-            revoked,
-        )
-    if revoked == 0 and parsed["session_index"]:
-        revoked = revoke_cas_session_by_index(parsed["session_index"])
-        logger.info(
-            "CAS SLO revoke by session_index: session_index=%s revoked=%s",
-            parsed["session_index"],
-            revoked,
-        )
-    if revoked == 0:
-        logger.warning("CAS SLO did not revoke any session: %s", parsed)
-    return {"revoked": revoked, **parsed}
-
-
-async def _create_project_session(principal: CasPrincipal, redirect: str = "/", renew: bool = False) -> Dict[str, Any]:
-    user_id = _resolve_project_user(principal)
-    existing_tenant = get_user_tenant_by_user_id(user_id)
-    user_tenant = upsert_user_tenant(
-        user_id=user_id,
-        tenant_id=principal.tenant_id,
-        user_role=principal.role,
-        user_email=principal.email,
-    )
-    if not existing_tenant:
-        await init_tool_list_for_tenant(principal.tenant_id, user_id)
-        await init_skill_list_for_tenant(principal.tenant_id, user_id)
-
-    now = datetime.now()
-    max_local_expiry = now + timedelta(seconds=LOCAL_SESSION_MAX_AGE_SECONDS)
-    expires_at_dt = min(principal.expires_at, max_local_expiry)
-    expires_in_seconds = max(1, int((expires_at_dt - now).total_seconds()))
-
-    session_id = secrets.token_urlsafe(32)
-    create_cas_session(
-        session_id=session_id,
-        user_id=user_id,
-        cas_user_id=principal.cas_user_id,
-        cas_session_index=principal.session_index,
-        expires_at=expires_at_dt,
-    )
-
-    jwt_token = generate_session_jwt(user_id, expires_in=expires_in_seconds, session_id=session_id)
-
-    return {
-        "user": {
-            "id": str(user_id),
-            "email": principal.email,
-            "role": user_tenant.get("user_role", principal.role),
-        },
-        "session": {
-            "access_token": jwt_token,
-            "refresh_token": "",
-            "expires_at": calculate_expires_at(jwt_token),
-            "expires_in_seconds": expires_in_seconds,
-        },
-        "redirect_url": redirect,
-        "renew": renew,
-    }
-
-
-def _resolve_project_user(principal: CasPrincipal) -> str:
-    existing = get_oauth_account_by_provider(CAS_PROVIDER, principal.cas_user_id)
-    if existing:
-        create_or_update_oauth_account(
-            user_id=existing["user_id"],
-            provider=CAS_PROVIDER,
-            provider_user_id=principal.cas_user_id,
-            email=principal.email,
-            username=principal.username,
-            tenant_id=principal.tenant_id,
-        )
-        return existing["user_id"]
-
-    admin_client = get_supabase_admin_client()
-    if not admin_client:
-        raise RuntimeError("Supabase admin client not available")
-
-    user_id = find_supabase_user_id_by_email(admin_client, principal.email)
-    if not user_id:
-        create_resp = admin_client.auth.admin.create_user(
-            {
-                "email": principal.email,
-                "password": secrets.token_urlsafe(32),
-                "email_confirm": True,
-                "user_metadata": {
-                    "full_name": principal.username,
-                    "provider": CAS_PROVIDER,
-                    "cas_user_id": principal.cas_user_id,
-                },
-            }
-        )
-        user_id = create_resp.user.id
-
-    create_or_update_oauth_account(
-        user_id=user_id,
-        provider=CAS_PROVIDER,
-        provider_user_id=principal.cas_user_id,
-        email=principal.email,
-        username=principal.username,
-        tenant_id=principal.tenant_id,
-    )
-    return user_id
-
-
-def _ensure_enabled() -> None:
-    if not CAS_ENABLED or not CAS_SERVER_URL:
-        raise CasAuthenticationError("CAS is not configured")
-
-
-def _build_callback_url(path: str, params: Dict[str, str]) -> str:
-    if not CAS_CALLBACK_BASE_URL:
-        raise CasAuthenticationError("CAS callback base URL is not configured")
-    query = _build_callback_query(params)
-    suffix = f"?{query}" if query else ""
-    return f"{CAS_CALLBACK_BASE_URL}{path}{suffix}"
-
-
-def _build_callback_query(params: Dict[str, str]) -> str:
-    return "&".join(f"{key}={value}" for key, value in params.items())
-
-
-def _normalize_redirect(redirect: str) -> str:
-    if not redirect or not redirect.startswith("/") or redirect.startswith("//"):
-        return "/"
-    return redirect
-
-
-def _build_ssl_context() -> ssl.SSLContext:
-    if CAS_CA_BUNDLE and os.path.isfile(CAS_CA_BUNDLE):
-        return ssl.create_default_context(cafile=CAS_CA_BUNDLE)
-    if not CAS_SSL_VERIFY:
-        ctx = ssl.create_default_context()
-        ctx.check_hostname = False
-        ctx.verify_mode = ssl.CERT_NONE
-        return ctx
-    return ssl.create_default_context()
-
-
-def _http_get_text(url: str) -> str:
-    req = urllib.request.Request(url, headers={"Accept": "application/xml,text/xml,*/*"})
-    with urllib.request.urlopen(req, timeout=15, context=_build_ssl_context()) as resp:
-        return resp.read().decode("utf-8")
-
-
-def _local_name(tag: str) -> str:
-    return tag.rsplit("}", 1)[-1]
-
-
-def _find_first(node: Element, name: str) -> Optional[Element]:
-    for child in node.iter():
-        if _local_name(child.tag) == name:
-            return child
-    return None
-
-
-def _get_child_text(node: Element, name: str) -> str:
-    found = _find_first(node, name)
-    return (found.text or "").strip() if found is not None else ""
-
-
-def _extract_attributes(attrs_node: Element) -> Dict[str, str]:
-    attrs: Dict[str, str] = {}
-    for child in list(attrs_node):
-        value = (child.text or "").strip()
-        if value:
-            attrs[_local_name(child.tag)] = value
-    return attrs
-
-
-def _attribute_or_default(attrs: Dict[str, str], key: str, default: str) -> str:
-    if key and key in attrs:
-        return attrs[key]
-    return default
-
-
-def _map_role(raw_role: str) -> str:
-    role = (raw_role or "USER").upper()
-    try:
-        role_map = json.loads(CAS_ROLE_MAP_JSON) if CAS_ROLE_MAP_JSON else {}
-        role = str(role_map.get(raw_role, role_map.get(role, role))).upper()
-    except Exception:
-        logger.warning("Invalid CAS_ROLE_MAP_JSON; falling back to raw role")
-    return role if role in VALID_ROLES else "USER"
-
-
-def _resolve_expires_at(attrs: Dict[str, str]) -> datetime:
-    for key in ("expiresAt", "expirationDate", "validUntil", "notOnOrAfter"):
-        value = attrs.get(key)
-        if not value:
-            continue
-        parsed = _parse_datetime(value)
-        if parsed:
-            return parsed
-    return datetime.now() + timedelta(seconds=CAS_SESSION_MAX_AGE_SECONDS)
-
-
-def _parse_datetime(value: str) -> Optional[datetime]:
-    try:
-        if value.isdigit():
-            timestamp = int(value)
-            if timestamp > 10_000_000_000:
-                timestamp = timestamp / 1000
-            return datetime.fromtimestamp(timestamp)
-        normalized = value.replace("Z", "+00:00")
-        parsed = datetime.fromisoformat(normalized)
-        if parsed.tzinfo:
-            parsed = parsed.astimezone().replace(tzinfo=None)
-        return parsed
-    except Exception:
-        return None
diff --git a/backend/services/conversation_management_service.py b/backend/services/conversation_management_service.py
index 0b7345461..302ec63a8 100644
--- a/backend/services/conversation_management_service.py
+++ b/backend/services/conversation_management_service.py
@@ -8,7 +8,6 @@
 
 from consts.const import LANGUAGE, MODEL_CONFIG_MAPPING, MESSAGE_ROLE, DEFAULT_EN_TITLE, DEFAULT_ZH_TITLE
 from consts.model import AgentRequest, ConversationResponse, MessageRequest, MessageUnit
-from consts.exceptions import ConversationNotFoundError
 from database.conversation_db import (
     create_conversation,
     create_conversation_message,
@@ -19,14 +18,12 @@
     get_conversation,
     get_conversation_history,
     get_conversation_list,
-    get_latest_assistant_message_id,
     get_message_id_by_index,
     get_source_images_by_conversation,
     get_source_images_by_message,
     get_source_searches_by_conversation,
     get_source_searches_by_message,
     rename_conversation,
-    update_message_minio_files,
     update_message_opinion
 )
 from nexent.core.utils.observer import MessageObserver, ProcessType
@@ -227,7 +224,7 @@ def save_conversation_assistant(request: AgentRequest, messages: List[str], user
             message_list.append(message)
 
     conversation_req = MessageRequest(conversation_id=request.conversation_id, message_idx=user_role_count * 2 + 1,
-                                      role=MESSAGE_ROLE["ASSISTANT"], message=message_list, minio_files=None)
+                                      role=MESSAGE_ROLE["ASSISTANT"], message=message_list, minio_files=request.minio_files)
     save_message(conversation_req, user_id=user_id, tenant_id=tenant_id)
 
 
@@ -299,9 +296,7 @@ def update_conversation_title(conversation_id: int, title: str, user_id: str = N
     """
     success = rename_conversation(conversation_id, title, user_id)
     if not success:
-        raise ConversationNotFoundError(
-            f"Conversation {conversation_id} does not exist or has been deleted"
-        )
+        raise Exception(f"Conversation {conversation_id} does not exist or has been deleted")
     return success
 
 
@@ -514,10 +509,6 @@ def get_conversation_history_service(conversation_id: int, user_id: str) -> List
                     'opinion_flag': msg['opinion_flag']
                 }
 
-                # Add minio_files field (if any, e.g., skill-generated attachments)
-                if 'minio_files' in msg and msg['minio_files']:
-                    message_item['minio_files'] = msg['minio_files']
-
             # Add image content (if any)
             if message_id in image_by_message:
                 message_item['picture'] = image_by_message[message_id]
@@ -710,52 +701,3 @@ async def get_message_id_by_index_impl(conversation_id: int, message_index: int)
     if message_id is None:
         raise Exception("Message not found.")
     return message_id
-
-
-def save_skill_files_to_conversation(
-    conversation_id: int,
-    skill_file_uploads: List[Dict[str, Any]],
-    user_id: str,
-) -> bool:
-    """
-    Append skill file upload records to the latest assistant message in a conversation.
-
-    This persists generated documents (e.g., DOCX, XLSX created by skills) to the
-    conversation history so they appear in subsequent GET /conversation/{id} calls.
-
-    Args:
-        conversation_id: Target conversation ID
-        skill_file_uploads: List of upload metadata dicts (e.g., from upload_fileobj)
-        user_id: User ID for ownership validation
-
-    Returns:
-        bool: True if files were saved, False if no assistant message was found
-    """
-    if not skill_file_uploads:
-        return False
-
-    try:
-        message_id = get_latest_assistant_message_id(conversation_id, user_id)
-        if message_id is None:
-            logging.warning(
-                "[skill-file] no assistant message found for conversation=%s, "
-                "cannot persist skill file uploads",
-                conversation_id,
-            )
-            return False
-
-        success = update_message_minio_files(message_id, skill_file_uploads)
-        if success:
-            logging.info(
-                "[skill-file] persisted %d file(s) to message_id=%s conversation=%s",
-                len(skill_file_uploads),
-                message_id,
-                conversation_id,
-            )
-        return success
-    except Exception as exc:
-        logging.exception(
-            "[skill-file] failed to persist skill file uploads for conversation=%s",
-            conversation_id,
-        )
-        return False
diff --git a/backend/services/data_process_service.py b/backend/services/data_process_service.py
index a7529127c..ae3d35dcd 100644
--- a/backend/services/data_process_service.py
+++ b/backend/services/data_process_service.py
@@ -15,7 +15,7 @@
 import redis
 import torch
 from PIL import Image
-from celery import states
+from celery import states, chain
 from transformers import CLIPProcessor, CLIPModel
 from nexent.data_process.core import DataProcessCore
 
@@ -25,7 +25,7 @@
 from database.attachment_db import delete_file, file_exists, get_file_size_from_minio, get_file_stream, upload_file
 from utils.file_management_utils import convert_office_to_pdf
 from data_process.app import app as celery_app
-from data_process.tasks import submit_process_forward_chain
+from data_process.tasks import process, forward
 from data_process.utils import get_task_info, get_all_task_ids_from_redis
 
 # Limit concurrent LibreOffice processes to avoid resource exhaustion
@@ -54,8 +54,7 @@ def __init__(self):
 
         self._inspector = None
         self._inspector_last_time = 0
-        # 5 minutes - inspector is expensive to create (ping all workers)
-        self._inspector_ttl = 300
+        self._inspector_ttl = 300  # 5 minutes - inspector is expensive to create (ping all workers)
         self._inspector_lock = None
         self._inspector_lock = threading.Lock()
 
@@ -153,8 +152,7 @@ async def get_all_tasks(self, filter: bool = True) -> List[Dict[str, Any]]:
 
             def _normalize_runtime_meta(task: Dict[str, Any]) -> Dict[str, Any]:
                 task_name_full = task.get('name', '') or ''
-                task_name = task_name_full.split(
-                    '.')[-1] if task_name_full else ''
+                task_name = task_name_full.split('.')[-1] if task_name_full else ''
                 kwargs = task.get('kwargs') or {}
                 if isinstance(kwargs, str):
                     try:
@@ -180,43 +178,35 @@ def _normalize_runtime_meta(task: Dict[str, Any]) -> Dict[str, Any]:
             def get_active():
                 t = time.time()
                 # Create fresh inspector with short timeout for each call
-                short_inspector = celery_app.control.inspect(
-                    timeout=short_timeout)
+                short_inspector = celery_app.control.inspect(timeout=short_timeout)
                 result = short_inspector.active()
                 elapsed = time.time() - t
-                logger.info(
-                    f"[get_all_tasks] inspector.active() took {elapsed:.3f}s")
+                logger.info(f"[get_all_tasks] inspector.active() took {elapsed:.3f}s")
                 return result if result else {}
 
             def get_reserved():
                 t = time.time()
-                short_inspector = celery_app.control.inspect(
-                    timeout=short_timeout)
+                short_inspector = celery_app.control.inspect(timeout=short_timeout)
                 result = short_inspector.reserved()
                 elapsed = time.time() - t
-                logger.info(
-                    f"[get_all_tasks] inspector.reserved() took {elapsed:.3f}s")
+                logger.info(f"[get_all_tasks] inspector.reserved() took {elapsed:.3f}s")
                 return result if result else {}
 
             with concurrent.futures.ThreadPoolExecutor(max_workers=2) as executor:
                 future_active = executor.submit(get_active)
                 future_reserved = executor.submit(get_reserved)
-                active_tasks_dict = future_active.result(
-                    timeout=short_timeout + 0.5)
-                reserved_tasks_dict = future_reserved.result(
-                    timeout=short_timeout + 0.5)
+                active_tasks_dict = future_active.result(timeout=short_timeout + 0.5)
+                reserved_tasks_dict = future_reserved.result(timeout=short_timeout + 0.5)
             celery_duration = time.time() - celery_start
             if celery_duration > 0.5:
-                logger.warning(
-                    f"[get_all_tasks] Inspector took {celery_duration:.3f}s (expected <0.5s)")
+                logger.warning(f"[get_all_tasks] Inspector took {celery_duration:.3f}s (expected <0.5s)")
             if active_tasks_dict:
                 for worker, tasks in active_tasks_dict.items():
                     for task in tasks:
                         task_id = task.get('id')
                         if task_id:
                             task_ids.add(task_id)
-                            runtime_task_meta[task_id] = _normalize_runtime_meta(
-                                task)
+                            runtime_task_meta[task_id] = _normalize_runtime_meta(task)
             if reserved_tasks_dict:
                 for worker, tasks in reserved_tasks_dict.items():
                     for task in tasks:
@@ -224,8 +214,7 @@ def get_reserved():
                         if task_id:
                             task_ids.add(task_id)
                             # Keep active metadata if already present
-                            runtime_task_meta.setdefault(
-                                task_id, _normalize_runtime_meta(task))
+                            runtime_task_meta.setdefault(task_id, _normalize_runtime_meta(task))
 
             # Get task IDs from Redis backend (covers completed/failed tasks within expiry)
             try:
@@ -252,14 +241,11 @@ def get_reserved():
                     if not task_info.get('task_name') and runtime_meta.get('task_name'):
                         task_info['task_name'] = runtime_meta.get('task_name')
                     if not task_info.get('index_name') and runtime_meta.get('index_name'):
-                        task_info['index_name'] = runtime_meta.get(
-                            'index_name')
+                        task_info['index_name'] = runtime_meta.get('index_name')
                     if not task_info.get('path_or_url') and runtime_meta.get('path_or_url'):
-                        task_info['path_or_url'] = runtime_meta.get(
-                            'path_or_url')
+                        task_info['path_or_url'] = runtime_meta.get('path_or_url')
                     if not task_info.get('original_filename') and runtime_meta.get('original_filename'):
-                        task_info['original_filename'] = runtime_meta.get(
-                            'original_filename')
+                        task_info['original_filename'] = runtime_meta.get('original_filename')
 
                 if filter and not (task_info.get('index_name') and task_info.get('task_name')):
                     # Keep user-visible queued tasks even before worker updates task meta.
@@ -552,23 +538,30 @@ async def create_batch_tasks_impl(self, authorization: Optional[str], request: B
                     f"Missing required field 'index_name' in source config: {source_config}")
                 continue
 
-            chain_id = submit_process_forward_chain(
-                source=source,
-                source_type=source_type,
-                chunking_strategy=chunking_strategy,
-                index_name=index_name,
-                original_filename=original_filename,
-                authorization=authorization,
-                embedding_model_id=embedding_model_id,
-                tenant_id=tenant_id,
+            # Create and submit a chain: process -> forward
+            task_chain = chain(
+                process.s(
+                    source=source,
+                    source_type=source_type,
+                    chunking_strategy=chunking_strategy,
+                    index_name=index_name,
+                    original_filename=original_filename,
+                    embedding_model_id=embedding_model_id,
+                    tenant_id=tenant_id
+                ).set(queue='process_q'),
+                forward.s(
+                    index_name=index_name,
+                    source=source,
+                    source_type=source_type,
+                    original_filename=original_filename,
+                    authorization=authorization
+                ).set(queue='forward_q')
             )
-            if not chain_id:
-                logger.error(
-                    f"Failed to enqueue process-forward chain for source: {source}")
-                continue
 
-            task_ids.append(chain_id)
-            logger.debug(f"Created task {chain_id} for source: {source}")
+            task_result = task_chain.apply_async()
+
+            task_ids.append(task_result.id)
+            logger.debug(f"Created task {task_result.id} for source: {source}")
         logger.info(
             f"Created {len(task_ids)} individual tasks for batch processing")
         return task_ids
@@ -600,7 +593,7 @@ async def process_uploaded_text_file(self, file_content: bytes, filename: str, c
             f"Processing uploaded file: {filename} using SDK DataProcessCore")
 
         data_processor = DataProcessCore()
-        chunks, _ = data_processor.file_process(
+        chunks = data_processor.file_process(
             file_data=file_content,
             filename=filename,
             chunking_strategy=chunking_strategy
@@ -649,8 +642,7 @@ async def convert_office_to_pdf_impl(self, object_name: str, pdf_object_name: st
                 # Step 1: Download original Office file from MinIO
                 original_stream = get_file_stream(object_name)
                 if original_stream is None:
-                    raise OfficeConversionException(
-                        f"Source file not found in storage: {object_name}")
+                    raise OfficeConversionException(f"Source file not found in storage: {object_name}")
 
                 original_filename = os.path.basename(object_name)
                 input_path = os.path.join(temp_dir, original_filename)
@@ -662,12 +654,10 @@ async def convert_office_to_pdf_impl(self, object_name: str, pdf_object_name: st
                 try:
                     pdf_path = await convert_office_to_pdf(input_path, temp_dir, timeout=30)
                 except Exception as exc:
-                    raise OfficeConversionException(
-                        f"LibreOffice conversion failed: {exc}") from exc
+                    raise OfficeConversionException(f"LibreOffice conversion failed: {exc}") from exc
 
                 # Step 3: Upload converted PDF to MinIO
-                result = upload_file(file_path=pdf_path,
-                                     object_name=pdf_object_name)
+                result = upload_file(file_path=pdf_path, object_name=pdf_object_name)
                 if not result.get('success'):
                     raise OfficeConversionException(
                         f"Failed to upload PDF to MinIO: {result.get('error', 'Unknown error')}"
@@ -676,16 +666,14 @@ async def convert_office_to_pdf_impl(self, object_name: str, pdf_object_name: st
                 # Step 4: Validate the uploaded PDF (header check + minimum size)
                 remote_size = get_file_size_from_minio(pdf_object_name)
                 if remote_size <= 0:
-                    raise OfficeConversionException(
-                        "PDF validation failed: cannot read remote file size")
+                    raise OfficeConversionException("PDF validation failed: cannot read remote file size")
                 if remote_size < 100:
                     raise OfficeConversionException(
                         f"PDF validation failed: file too small ({remote_size} bytes)"
                     )
                 remote_stream = get_file_stream(pdf_object_name)
                 if remote_stream is None:
-                    raise OfficeConversionException(
-                        "PDF validation failed: cannot read uploaded file")
+                    raise OfficeConversionException("PDF validation failed: cannot read uploaded file")
                 try:
                     header = remote_stream.read(5)
                 finally:
@@ -694,8 +682,7 @@ async def convert_office_to_pdf_impl(self, object_name: str, pdf_object_name: st
                     except Exception:
                         pass
                 if not header.startswith(b'%PDF-'):
-                    raise OfficeConversionException(
-                        "PDF validation failed: invalid PDF header")
+                    raise OfficeConversionException("PDF validation failed: invalid PDF header")
 
             except OfficeConversionException:
                 # Clean up any partially-uploaded remote PDF so a future retry starts clean
@@ -703,16 +690,14 @@ async def convert_office_to_pdf_impl(self, object_name: str, pdf_object_name: st
                     delete_file(pdf_object_name)
                 raise
             except Exception as exc:
-                raise OfficeConversionException(
-                    f"Unexpected error during conversion: {exc}") from exc
+                raise OfficeConversionException(f"Unexpected error during conversion: {exc}") from exc
             finally:
                 # Step 5: Clean up local temporary directory
                 if temp_dir and os.path.exists(temp_dir):
                     try:
                         shutil.rmtree(temp_dir)
                     except Exception as cleanup_err:
-                        logger.warning(
-                            f"Failed to cleanup temp dir '{temp_dir}': {cleanup_err}")
+                        logger.warning(f"Failed to cleanup temp dir '{temp_dir}': {cleanup_err}")
 
     def convert_celery_states_to_custom(self, process_celery_state: Optional[str], forward_celery_state: Optional[str]) -> str:
         """Map Celery task states to a custom frontend state string.
diff --git a/backend/services/file_management_service.py b/backend/services/file_management_service.py
index 585669c0c..b2850403d 100644
--- a/backend/services/file_management_service.py
+++ b/backend/services/file_management_service.py
@@ -52,27 +52,6 @@
 
 logger = logging.getLogger("file_management_service")
 
-ALLOWED_SKILL_UPLOAD_ROOT = Path("/mnt/nexent").resolve()
-
-
-def is_allowed_skill_upload_path(file_path: str) -> bool:
-    """Return True when a local file path is under the allowed skill upload root."""
-    if not file_path:
-        return False
-
-    try:
-        candidate_path = Path(file_path).resolve()
-    except Exception:
-        return False
-
-    try:
-        candidate_path.relative_to(ALLOWED_SKILL_UPLOAD_ROOT)
-        return True
-    except ValueError:
-        return False
-
-
-
 
 def resolve_minio_upload_folder(
     folder: Optional[str],
@@ -104,11 +83,6 @@ def resolve_minio_upload_folder(
     if folder == "knowledge_base":
         return "knowledge_base"
 
-    if folder == "skill-files":
-        if user_id:
-            return f"skill-files/{user_id}"
-        return "skill-files"
-
     if user_id:
         return f"attachments/{user_id}"
 
@@ -127,6 +101,7 @@ def check_file_access(
     - knowledge_base/*: All authenticated users can access
     - attachments/{user_id}/*: Only the owner (user_id) can access
     - images_in_attachments/*: All authenticated users can access
+    - preview/*: Accessible if the original file is accessible
 
     Args:
         object_name: File object name in storage
@@ -150,10 +125,6 @@ def check_file_access(
         # Keep them readable for authenticated users to avoid broken image citations.
         return True
 
-    if object_name.startswith("skill-files/"):
-        # Generated documents are private to the uploader and must stay user-scoped.
-        return object_name.startswith(f"skill-files/{user_id}/")
-
     # Check if file is in user's attachments folder
     # Pattern: attachments/{user_id}/*
     if object_name.startswith(f"attachments/{user_id}/"):
@@ -386,20 +357,14 @@ async def upload_to_minio(
             # Convert file content to BytesIO object
             file_obj = BytesIO(file_content)
 
-            # Store original filename before upload
-            original_filename = f.filename or ""
-
             # Upload file
             result = upload_fileobj(
                 file_obj=file_obj,
-                file_name=original_filename,
+                file_name=f.filename or "",
                 prefix=actual_folder,
                 file_size=len(file_content)
             )
 
-            # Preserve original filename in result (upload_fileobj uses it for object name generation)
-            result["original_file_name"] = original_filename
-
             # Reset file pointer for potential re-reading
             await f.seek(0)
             results.append(result)
@@ -411,7 +376,6 @@ async def upload_to_minio(
             results.append({
                 "success": False,
                 "file_name": f.filename,
-                "original_file_name": f.filename,
                 "error": "An error occurred while processing the file."
             })
     return results
diff --git a/backend/services/northbound_service.py b/backend/services/northbound_service.py
index c5493a551..a6eaed77d 100644
--- a/backend/services/northbound_service.py
+++ b/backend/services/northbound_service.py
@@ -1,40 +1,31 @@
 import asyncio
 import hashlib
-import json
 import logging
 import time
 from dataclasses import dataclass
-from os.path import basename
-from typing import Any, Dict, List, Optional
+from typing import Any, Dict, Optional
 
-from fastapi import HTTPException, UploadFile
 from fastapi.responses import StreamingResponse
 
-
-from consts.const import ASSET_OWNER_TENANT_ID
 from consts.exceptions import (
     LimitExceededError,
     UnauthorizedError,
-    ConversationNotFoundError,
 )
-from consts.model import AgentRequest, ToolParamsRequest
-from database.conversation_db import get_conversation_messages, get_source_searches_by_message
+from consts.model import AgentRequest
+from database.conversation_db import get_conversation_messages
 from database.token_db import log_token_usage, get_latest_usage_metadata
 from services.agent_service import (
     run_agent_stream,
     stop_agent_tasks,
+    list_all_agent_info_impl,
     get_agent_id_by_name
 )
-from services.agent_version_service import list_published_agents_impl
 from services.conversation_management_service import (
     save_conversation_user,
     get_conversation_list_service,
     create_new_conversation,
     update_conversation_title as update_conversation_title_service,
 )
-from services.file_management_service import upload_to_minio, resolve_minio_upload_folder, validate_urls_access
-from database.attachment_db import get_file_url, get_file_size_from_minio
-from nexent.multi_modal.utils import parse_s3_url
 
 logger = logging.getLogger("northbound_service")
 
@@ -48,188 +39,6 @@ class NorthboundContext:
     token_id: int = 0
 
 
-def _build_northbound_file_descriptor(
-    upload_result: Dict[str, Any],
-    original_file_name: str = "",
-    file_type: Optional[str] = None,
-    file_size: Optional[int] = None,
-) -> Dict[str, Any]:
-    """Normalize upload metadata for northbound API consumers."""
-    object_name = str(upload_result.get("object_name") or "").strip()
-    # Use original filename if provided, otherwise fall back to upload result or object name
-    if original_file_name:
-        file_name = original_file_name
-    else:
-        file_name = str(upload_result.get("file_name") or basename(object_name) or "")
-    # Frontend-compatible field order
-    descriptor = {
-        "object_name": object_name,
-        "name": file_name,
-        "type": file_type or "file",
-        # Use provided file_size, or from upload_result, or 0 as fallback
-        "size": file_size if file_size is not None else upload_result.get("file_size", 0),
-        # Use relative URL format matching frontend: /nexent/{object_name}
-        "url": f"/nexent/{object_name}",
-        "description": "",
-    }
-    presigned_url = upload_result.get("presigned_url")
-    if presigned_url:
-        descriptor["presigned_url"] = presigned_url
-    return descriptor
-
-
-async def upload_files_for_northbound(
-    ctx: NorthboundContext,
-    files: List[UploadFile],
-    folder: str = "attachments",
-) -> Dict[str, Any]:
-    """Upload files for northbound callers and return reusable storage references."""
-    if not files:
-        raise ValueError("No files in the request")
-
-    actual_folder = resolve_minio_upload_folder(folder, ctx.user_id, ctx.tenant_id)
-    results = await upload_to_minio(files=files, folder=actual_folder)
-    normalized_files = []
-    for result, upload_file in zip(results, files):
-        if result.get("success") and result.get("object_name"):
-            content_type = result.get("content_type", "")
-            file_type = "image" if content_type.startswith("image/") else "file"
-            # Extract original filename - use upload result first, then fallback to UploadFile
-            # The upload result contains the original filename passed to upload_fileobj
-            original_file_name = result.get("original_file_name") or upload_file.filename or ""
-            file_size = result.get("file_size", 0)
-            # If file_size is 0 but we have the UploadFile, try to get size from headers
-            if file_size == 0 and hasattr(upload_file, 'size') and upload_file.size:
-                file_size = upload_file.size
-            descriptor = _build_northbound_file_descriptor(
-                result,
-                original_file_name=original_file_name,
-                file_type=file_type,
-                file_size=file_size,
-            )
-            normalized_files.append(descriptor)
-
-    if not normalized_files:
-        raise ValueError("No valid files uploaded")
-
-    success_count = sum(1 for result in results if result.get("success", False))
-    failed_count = sum(1 for result in results if not result.get("success", False))
-
-    return {
-        "message": f"Processed {len(results)} files",
-        "requestId": ctx.request_id,
-        "summary": {
-            "total": len(results),
-            "uploaded": success_count,
-            "failed": failed_count,
-        },
-        "files": normalized_files,
-    }
-
-
-def _normalize_northbound_attachments(
-    attachments: Optional[List[Any]],
-    user_id: str,
-    tenant_id: str,
-) -> Optional[List[Dict[str, Any]]]:
-    """Convert northbound attachment references into internal minio_files objects.
-    
-    Supports two formats:
-    1. List of S3 URL strings (backward compatible): ["s3://nexent/...", "/nexent/...", "attachments/..."]
-    2. List of attachment objects (full metadata): [{"object_name": "...", "name": "...", ...}]
-    """
-    from database.attachment_db import _build_mcp_presigned_url
-
-    if attachments is None:
-        return None
-    if not isinstance(attachments, list):
-        raise ValueError("attachments must be an array")
-
-    normalized_files: List[Dict[str, Any]] = []
-    for attachment in attachments:
-        # Handle dict format (full attachment object)
-        if isinstance(attachment, dict):
-            # Use the attachment dict directly, just ensure required fields
-            normalized_file = {
-                "object_name": attachment.get("object_name", ""),
-                "name": attachment.get("name", basename(attachment.get("object_name", ""))),
-                "type": attachment.get("type", "file"),
-                "size": attachment.get("size", 0),
-                "url": attachment.get("url", ""),
-                "description": attachment.get("description", ""),
-            }
-            # Add presigned_url if available, or generate one if we have object_name
-            if "presigned_url" in attachment:
-                normalized_file["presigned_url"] = attachment["presigned_url"]
-            elif normalized_file.get("object_name"):
-                try:
-                    presigned_result = get_file_url(object_name=normalized_file["object_name"], expires=86400)
-                    if presigned_result.get("success") and presigned_result.get("url"):
-                        normalized_file["presigned_url"] = _build_mcp_presigned_url(presigned_result["url"])
-                except Exception:
-                    pass
-            normalized_files.append(normalized_file)
-            continue
-
-        # Handle string format (S3 URL)
-        if not isinstance(attachment, str) or not attachment.strip():
-            raise ValueError("attachments must contain non-empty S3 URLs or object paths")
-
-        attachment_url = attachment.strip()
-
-        # Support multiple URL formats:
-        # 1. s3://nexent/attachments/xxx.md
-        # 2. /nexent/attachments/xxx.md
-        # 3. attachments/xxx.md (relative path)
-        if attachment_url.startswith("s3://"):
-            try:
-                _, object_name = parse_s3_url(attachment_url)
-            except ValueError as exc:
-                raise ValueError(f"Invalid S3 URL format: {attachment_url}") from exc
-            validate_url = attachment_url
-        elif attachment_url.startswith("/nexent/"):
-            object_name = attachment_url[len("/nexent/"):]
-            validate_url = f"s3://nexent/{object_name}"
-        elif attachment_url.startswith("attachments/") or attachment_url.startswith("nexent/"):
-            object_name = attachment_url if attachment_url.startswith("nexent/") else attachment_url
-            validate_url = f"s3://nexent/{object_name}"
-        else:
-            raise ValueError(f"Invalid attachment format: {attachment_url}. Expected s3:// URL, /nexent/ path, or attachments/ path")
-
-        try:
-            validate_urls_access([validate_url], user_id, tenant_id)
-            presigned_result = get_file_url(object_name=object_name, expires=86400)
-        except PermissionError as exc:
-            detail = str(exc)
-            if "Invalid S3 URL format" in detail:
-                raise ValueError(detail) from exc
-            raise PermissionError(detail) from exc
-
-        # Get file size from MinIO
-        try:
-            file_size = get_file_size_from_minio(object_name)
-        except Exception:
-            file_size = 0
-
-        # Build frontend-compatible minio_files format
-        file_name = basename(object_name.rstrip("/"))
-        normalized_file = {
-            "object_name": object_name,
-            "name": file_name,
-            "type": "file",
-            "size": file_size,
-            # Use relative URL format matching frontend: /nexent/{object_name}
-            "url": f"/nexent/{object_name}",
-            "description": "",
-        }
-        # Use MCP proxy URL for presigned_url (same as frontend format)
-        if presigned_result.get("success") and presigned_result.get("url"):
-            normalized_file["presigned_url"] = _build_mcp_presigned_url(presigned_result["url"])
-        normalized_files.append(normalized_file)
-
-    return normalized_files
-
-
 # -----------------------------
 # In-memory idempotency and rate limit placeholders
 # -----------------------------
@@ -302,12 +111,6 @@ def _build_idempotency_key(*parts: Any) -> str:
     return ":".join(processed)
 
 
-def _build_title_update_idempotency_key(tenant_id: str, conversation_id: int, title: str) -> str:
-    """Build an ASCII-safe idempotency key for title updates."""
-    title_hash = hashlib.sha256(title.encode("utf-8")).hexdigest()
-    return _build_idempotency_key(tenant_id, str(conversation_id), title_hash)
-
-
 # -----------------------------
 # Agent resolver
 # -----------------------------
@@ -323,9 +126,7 @@ async def start_streaming_chat(
     conversation_id: Optional[int],
     agent_name: str,
     query: str,
-    attachments: Optional[List[Any]] = None,
     meta_data: Optional[Dict[str, Any]] = None,
-    tool_params: Optional[ToolParamsRequest] = None,
     idempotency_key: Optional[str] = None
 ) -> StreamingResponse:
     try:
@@ -344,11 +145,6 @@ async def start_streaming_chat(
         # Get history according to internal_conversation_id
         history_resp = await get_conversation_history_internal(ctx, internal_conversation_id)
         agent_id = await get_agent_id_by_name(agent_name=agent_name, tenant_id=ctx.tenant_id)
-        normalized_attachments = _normalize_northbound_attachments(
-            attachments=attachments,
-            user_id=ctx.user_id,
-            tenant_id=ctx.tenant_id,
-        )
         # Idempotency: only prevent concurrent duplicate starts
         composed_key = idempotency_key or _build_idempotency_key(ctx.tenant_id, str(conversation_id), agent_id, query)
         await idempotency_start(composed_key)
@@ -357,9 +153,8 @@ async def start_streaming_chat(
             agent_id=agent_id,
             query=query,
             history=(history_resp.get("data", {})).get("history", []),
-            minio_files=normalized_attachments,
+            minio_files=None,
             is_debug=False,
-            tool_params=tool_params,
         )
 
         # Synchronously persist the user message before starting the stream to avoid race conditions
@@ -462,58 +257,15 @@ async def list_conversations(ctx: NorthboundContext) -> Dict[str, Any]:
     return {"message": "success", "data": conversations, "requestId": ctx.request_id}
 
 
-def _format_search_record(record: Dict[str, Any]) -> Dict[str, Any]:
-    """Format a search source record for API response."""
-    search_item = {
-        "title": record.get("source_title", ""),
-        "text": record.get("source_content", ""),
-        "source_type": record.get("source_type", ""),
-        "url": record.get("source_location", ""),
-        "filename": record.get("source_title", "") if record.get("source_type") == "file" else None,
-        "published_date": None,
-        "score": float(record["score_overall"]) if record.get("score_overall") is not None else None,
-        "tool_sign": record.get("tool_sign", ""),
-        "cite_index": record.get("cite_index")
-    }
-
-    if record.get("published_date"):
-        if hasattr(record["published_date"], "strftime"):
-            search_item["published_date"] = record["published_date"].strftime("%Y-%m-%d")
-        else:
-            search_item["published_date"] = str(record["published_date"])[:10]
-
-    return search_item
-
-
 async def get_conversation_history_internal(ctx: NorthboundContext, conversation_id: int) -> Dict[str, Any]:
     """Internal helper to get conversation history without logging."""
     history = get_conversation_messages(conversation_id)
+    # Remove unnecessary fields
     result = []
     for message in history:
-        # Parse minio_files from database (stored as JSON string)
-        minio_files = []
-        raw_minio_files = message.get("minio_files")
-        if raw_minio_files:
-            try:
-                minio_files = json.loads(raw_minio_files) if isinstance(raw_minio_files, str) else raw_minio_files
-            except (json.JSONDecodeError, TypeError):
-                logger.warning(f"Failed to parse minio_files for message {message.get('message_id')}")
-
-        # Fetch search results for this message
-        message_id = message.get("message_id")
-        search_results = []
-        if message_id:
-            try:
-                search_records = get_source_searches_by_message(message_id, user_id=ctx.user_id)
-                search_results = [_format_search_record(r) for r in search_records]
-            except Exception as e:
-                logger.warning(f"Failed to get search records for message {message_id}: {str(e)}")
-
         result.append({
             "role": message["message_role"],
-            "content": message["message_content"],
-            "minio_files": minio_files,
-            "search": search_results
+            "content": message["message_content"]
         })
 
     response = {
@@ -532,18 +284,7 @@ async def get_conversation_history(ctx: NorthboundContext, conversation_id: int)
 
 async def get_agent_info_list(ctx: NorthboundContext) -> Dict[str, Any]:
     try:
-        agent_info_list = await list_published_agents_impl(
-            tenant_id=ctx.tenant_id,
-            user_id=ctx.user_id,
-        )
-        # Match the same scope as /agent/published_list: non-asset-owner tenants
-        # also get the asset owner's published agents merged in.
-        if ctx.tenant_id != ASSET_OWNER_TENANT_ID:
-            asset_agent_list = await list_published_agents_impl(
-                tenant_id=ASSET_OWNER_TENANT_ID,
-                user_id=ctx.user_id,
-            )
-            agent_info_list.extend(asset_agent_list)
+        agent_info_list = await list_all_agent_info_impl(tenant_id=ctx.tenant_id, user_id=ctx.user_id)
         # Remove internal information that partner don't need
         for agent_info in agent_info_list:
             agent_info.pop("agent_id", None)
@@ -557,11 +298,7 @@ async def update_conversation_title(ctx: NorthboundContext, conversation_id: int
     composed_key: Optional[str] = None
     try:
         # Idempotency: avoid concurrent duplicate title update for same conversation
-        composed_key = idempotency_key or _build_title_update_idempotency_key(
-            ctx.tenant_id,
-            conversation_id,
-            title,
-        )
+        composed_key = idempotency_key or _build_idempotency_key(ctx.tenant_id, str(conversation_id), title)
         await idempotency_start(composed_key)
 
         update_conversation_title_service(conversation_id, title, ctx.user_id)
@@ -587,8 +324,6 @@ async def update_conversation_title(ctx: NorthboundContext, conversation_id: int
         }
     except LimitExceededError as _:
         raise LimitExceededError("Duplicate request is still running, please wait.")
-    except ConversationNotFoundError:
-        raise
     except Exception as e:
         raise Exception(f"Failed to update conversation title for conversation_id {conversation_id}: {str(e)}")
     finally:
diff --git a/backend/services/prompt_service.py b/backend/services/prompt_service.py
index f1564cdbc..ee9704302 100644
--- a/backend/services/prompt_service.py
+++ b/backend/services/prompt_service.py
@@ -1,17 +1,15 @@
 import json
 import logging
 import queue
-import sys
 import threading
 from typing import Optional, List
 
 from jinja2 import StrictUndefined, Template
 
-from consts.const import LANGUAGE, ENABLE_JIUWEN_SDK
+from consts.const import LANGUAGE
 from consts.error_code import ErrorCode
 from consts.error_message import ErrorMessage
 from consts.exceptions import AppException
-from consts.model import AgentInfoRequest
 from database.agent_db import search_agent_info_by_agent_id, query_all_agent_info_by_tenant_id, \
     query_sub_agents_id_list
 from database.model_management_db import get_model_by_model_id
@@ -24,31 +22,15 @@
     _regenerate_agent_name_with_llm,
     _regenerate_agent_display_name_with_llm,
     _generate_unique_agent_name_with_suffix,
-    _generate_unique_display_name_with_suffix,
-    update_agent,
+    _generate_unique_display_name_with_suffix
 )
 from services.prompt_template_service import resolve_prompt_generate_template
 from utils.llm_utils import call_llm_for_system_prompt
 from utils.prompt_template_utils import (
+    get_prompt_generate_prompt_template,
     get_prompt_optimize_prompt_template,
-    get_prompt_template,
 )
 
-from dataclasses import dataclass, field
-from typing import Optional as Opt
-
-from adapters.exception import JiuwenSDKError, NexentCapabilityError
-
-
-def _get_jiuwen_adapter_class():
-    """Import Jiuwen adapter only when optimization paths need it."""
-    try:
-        from adapters import JiuwenSDKAdapter
-    except ModuleNotFoundError:
-        return None
-    return JiuwenSDKAdapter
-
-
 # Configure logging
 logger = logging.getLogger("prompt_service")
 
@@ -123,16 +105,14 @@ def generate_and_save_system_prompt_impl(agent_id: int,
     # Get knowledge base display names for few-shot examples
     # Priority: frontend-provided > database query
     if knowledge_base_display_names:
-        logger.debug(
-            f"Using frontend-provided knowledge base display names: {knowledge_base_display_names}")
+        logger.debug(f"Using frontend-provided knowledge base display names: {knowledge_base_display_names}")
     else:
         knowledge_base_display_names = get_knowledge_base_display_names(
             tool_info_list=tool_info_list,
             agent_id=agent_id,
             tenant_id=tenant_id
         )
-        logger.debug(
-            f"Using database query for knowledge base display names: {knowledge_base_display_names}")
+        logger.debug(f"Using database query for knowledge base display names: {knowledge_base_display_names}")
 
     # Handle sub-agent IDs
     if sub_agent_ids and len(sub_agent_ids) > 0:
@@ -166,7 +146,7 @@ def generate_and_save_system_prompt_impl(agent_id: int,
 
     # 1. Real-time streaming push
     final_results = {"duty": "", "constraint": "", "few_shots": "", "agent_var_name": "", "agent_display_name": "",
-                     "agent_description": "", "greeting_message": "", "example_questions": ""}
+                     "agent_description": ""}
 
     # Get all existing agent names and display names for duplicate checking (only if not in create mode)
     all_agents = query_all_agent_info_by_tenant_id(tenant_id)
@@ -212,8 +192,7 @@ def generate_and_save_system_prompt_impl(agent_id: int,
                         exclude_agent_id=agent_id,
                         agents_cache=all_agents
                     ):
-                        logger.info(
-                            f"Agent name '{agent_name}' already exists, regenerating with LLM")
+                        logger.info(f"Agent name '{agent_name}' already exists, regenerating with LLM")
                         try:
                             agent_name = _regenerate_agent_name_with_llm(
                                 original_name=agent_name,
@@ -227,12 +206,10 @@ def generate_and_save_system_prompt_impl(agent_id: int,
                                 prompt_template_id=prompt_template_id,
                                 user_id=user_id,
                             )
-                            logger.info(
-                                f"Regenerated agent name: '{agent_name}'")
+                            logger.info(f"Regenerated agent name: '{agent_name}'")
                             final_results["agent_var_name"] = agent_name
                         except Exception as e:
-                            logger.error(
-                                f"Failed to regenerate agent name with LLM: {str(e)}, using fallback")
+                            logger.error(f"Failed to regenerate agent name with LLM: {str(e)}, using fallback")
                             # Fallback: add suffix
                             agent_name = _generate_unique_agent_name_with_suffix(
                                 agent_name,
@@ -258,8 +235,7 @@ def generate_and_save_system_prompt_impl(agent_id: int,
                         exclude_agent_id=agent_id,
                         agents_cache=all_agents
                     ):
-                        logger.info(
-                            f"Agent display_name '{agent_display_name}' already exists, regenerating with LLM")
+                        logger.info(f"Agent display_name '{agent_display_name}' already exists, regenerating with LLM")
                         try:
                             agent_display_name = _regenerate_agent_display_name_with_llm(
                                 original_display_name=agent_display_name,
@@ -273,12 +249,10 @@ def generate_and_save_system_prompt_impl(agent_id: int,
                                 prompt_template_id=prompt_template_id,
                                 user_id=user_id,
                             )
-                            logger.info(
-                                f"Regenerated agent display_name: '{agent_display_name}'")
+                            logger.info(f"Regenerated agent display_name: '{agent_display_name}'")
                             final_results["agent_display_name"] = agent_display_name
                         except Exception as e:
-                            logger.error(
-                                f"Failed to regenerate agent display_name with LLM: {str(e)}, using fallback")
+                            logger.error(f"Failed to regenerate agent display_name with LLM: {str(e)}, using fallback")
                             # Fallback: add suffix
                             agent_display_name = _generate_unique_display_name_with_suffix(
                                 agent_display_name,
@@ -311,68 +285,6 @@ def generate_and_save_system_prompt_impl(agent_id: int,
     if not has_content:
         raise Exception("Failed to generate prompt content.")
 
-    # 3. Generate greeting message and example questions
-    try:
-        greeting_template = get_prompt_template('greeting_generate', language)
-        greeting_system_prompt = greeting_template.get("GREETING_SYSTEM_PROMPT", "")
-        greeting_user_prompt_template = greeting_template.get("USER_PROMPT", "")
-
-        greeting_user_prompt = Template(greeting_user_prompt_template, undefined=StrictUndefined).render({
-            "display_name": final_results.get("agent_display_name", ""),
-            "duty_description": final_results.get("duty", ""),
-            "business_description": task_description,
-            "few_shots": final_results.get("few_shots", ""),
-        })
-
-        greeting_result = call_llm_for_system_prompt(
-            model_id=model_id,
-            user_prompt=greeting_user_prompt,
-            system_prompt=greeting_system_prompt,
-            tenant_id=tenant_id,
-        )
-
-        parsed = None
-        try:
-            json_start = greeting_result.find("{")
-            json_end = greeting_result.rfind("}") + 1
-            if json_start >= 0 and json_end > json_start:
-                parsed = json.loads(greeting_result[json_start:json_end])
-        except json.JSONDecodeError:
-            logger.warning(f"Failed to parse greeting JSON from LLM output: {greeting_result}")
-
-        if parsed and "greeting_message" in parsed and "example_questions" in parsed:
-            greeting_message = parsed["greeting_message"]
-            example_questions = parsed["example_questions"]
-            if isinstance(example_questions, list) and len(example_questions) > 6:
-                example_questions = example_questions[:6]
-        else:
-            greeting_message = greeting_result.strip() if greeting_result else ""
-            example_questions = []
-
-        yield {
-            "type": "greeting_message",
-            "content": greeting_message,
-            "is_complete": True
-        }
-        yield {
-            "type": "example_questions",
-            "content": json.dumps(example_questions, ensure_ascii=False),
-            "is_complete": True
-        }
-
-        final_results["greeting_message"] = greeting_message
-        final_results["example_questions"] = json.dumps(example_questions, ensure_ascii=False)
-
-        # Update agent with greeting (skip in create mode)
-        if agent_id != 0:
-            update_agent(agent_id, AgentInfoRequest(
-                agent_id=agent_id,
-                greeting_message=greeting_message,
-                example_questions=example_questions,
-            ), user_id)
-    except Exception as e:
-        logger.warning(f"Greeting generation failed: {str(e)}, skipping greeting")
-
 def optimize_prompt_section_impl(
     agent_id: int,
     model_id: int,
@@ -427,8 +339,7 @@ def optimize_prompt_section_impl(
     prompt_context = join_info_for_optimize_prompt_section(
         prompt_for_optimize=prompt_template,
         section_type=normalized_section_type,
-        section_title=section_title or _default_prompt_section_title(
-            normalized_section_type, language),
+        section_title=section_title or _default_prompt_section_title(normalized_section_type, language),
         task_description=task_description,
         current_content=current_content,
         feedback=feedback,
@@ -487,8 +398,7 @@ def generate_system_prompt(sub_agent_info_list, task_description, tool_info_list
     # If None or >= 6, no limit (all 6 calls run concurrently)
     # If < 6, use semaphore to limit concurrent calls
     model_config = get_model_by_model_id(model_id, tenant_id)
-    concurrency_limit = model_config.get(
-        "concurrency_limit") if model_config else None
+    concurrency_limit = model_config.get("concurrency_limit") if model_config else None
 
     # Start all generation threads with concurrency control
     threads, error_holder = _start_generation_threads(
@@ -533,8 +443,7 @@ def _resolve_knowledge_base_display_names(
         agent_id=agent_id,
         tenant_id=tenant_id
     )
-    logger.debug(
-        f"Using database query for knowledge base display names: {resolved_names}")
+    logger.debug(f"Using database query for knowledge base display names: {resolved_names}")
     return resolved_names
 
 
@@ -562,9 +471,8 @@ def _resolve_prompt_generation_sub_agents(
         tenant_id=tenant_id, agent_id=agent_id
     )
 
-
 def _start_generation_threads(content, prompt_for_generate, produce_queue, latest, stop_flags, tenant_id, model_id,
-                              has_selected_resources=True, concurrency_limit: Optional[int] = None):
+                                has_selected_resources = True, concurrency_limit: Optional[int] = None):
     """Start all prompt generation threads with optional concurrency control."""
     # Shared error tracking across threads
     error_holder = {"error": None}
@@ -580,11 +488,9 @@ def _start_generation_threads(content, prompt_for_generate, produce_queue, lates
         effective_limit = concurrency_limit
 
     # Use semaphore if concurrency is limited
-    semaphore = threading.Semaphore(
-        effective_limit) if effective_limit else None
+    semaphore = threading.Semaphore(effective_limit) if effective_limit else None
     if semaphore:
-        logger.info(
-            f"Using concurrency limit of {effective_limit} for prompt generation (total tasks: {total_tasks})")
+        logger.info(f"Using concurrency limit of {effective_limit} for prompt generation (total tasks: {total_tasks})")
     else:
         logger.info("Using unlimited concurrency for prompt generation")
 
@@ -633,8 +539,7 @@ def run_and_flag(tag, sys_prompt):
             ("few_shots", prompt_for_generate["few_shots_system_prompt"]),
         ])
     else:
-        logger.info(
-            "Skipping constraint and few_shots generation: no tools or sub-agents selected")
+        logger.info("Skipping constraint and few_shots generation: no tools or sub-agents selected")
         # Mark these sections as already complete with empty content
         stop_flags["constraint"] = True
         stop_flags["few_shots"] = True
@@ -733,15 +638,13 @@ def join_info_for_generate_system_prompt(prompt_for_generate, sub_agent_info_lis
     # This is necessary because Jinja2 StrictUndefined raises an error for any
     # undefined variable, even inside an {% if %} block.
     if knowledge_base_display_names:
-        kb_names_str = ", ".join(
-            f'"{name}"' for name in knowledge_base_display_names)
+        kb_names_str = ", ".join(f'"{name}"' for name in knowledge_base_display_names)
     else:
         kb_names_str = ""
     template_context["knowledge_base_names"] = kb_names_str
 
     # Generate content using template
-    content = Template(
-        prompt_for_generate["user_prompt"], undefined=StrictUndefined).render(template_context)
+    content = Template(prompt_for_generate["user_prompt"], undefined=StrictUndefined).render(template_context)
     return content
 
 
@@ -769,8 +672,7 @@ def join_info_for_optimize_prompt_section(
     )
 
     if knowledge_base_display_names:
-        kb_names_str = ", ".join(
-            f'"{name}"' for name in knowledge_base_display_names)
+        kb_names_str = ", ".join(f'"{name}"' for name in knowledge_base_display_names)
     else:
         kb_names_str = ""
 
@@ -822,8 +724,7 @@ def get_knowledge_base_display_names(tool_info_list: List[dict], agent_id: int,
         List of knowledge base display names if knowledge_base_search tool is configured, None otherwise
     """
     # Check if knowledge_base_search tool is in the list
-    kb_tool_ids = [tool['tool_id'] for tool in tool_info_list if tool.get(
-        'name') == 'knowledge_base_search']
+    kb_tool_ids = [tool['tool_id'] for tool in tool_info_list if tool.get('name') == 'knowledge_base_search']
     if not kb_tool_ids:
         logger.debug("No knowledge_base_search tool found in tool list")
         return None
@@ -846,23 +747,19 @@ def get_knowledge_base_display_names(tool_info_list: List[dict], agent_id: int,
                     try:
                         all_index_names.extend(json.loads(index_names))
                     except json.JSONDecodeError:
-                        logger.warning(
-                            f"Failed to parse index_names JSON: {index_names}")
+                        logger.warning(f"Failed to parse index_names JSON: {index_names}")
         except Exception as e:
-            logger.warning(
-                f"Failed to get tool instance for tool_id {kb_tool_id}: {e}")
+            logger.warning(f"Failed to get tool instance for tool_id {kb_tool_id}: {e}")
 
     if not all_index_names:
-        logger.debug(
-            "No index_names configured for knowledge_base_search tool")
+        logger.debug("No index_names configured for knowledge_base_search tool")
         return None
 
     # Remove duplicates while preserving order
     unique_index_names = list(dict.fromkeys(all_index_names))
 
     # Convert to display names
-    knowledge_name_map = get_knowledge_name_map_by_index_names(
-        unique_index_names)
+    knowledge_name_map = get_knowledge_name_map_by_index_names(unique_index_names)
 
     # Return list of display names (knowledge_name) for each configured index_name
     display_names = []
@@ -871,8 +768,7 @@ def get_knowledge_base_display_names(tool_info_list: List[dict], agent_id: int,
         if display_name and display_name not in display_names:
             display_names.append(display_name)
 
-    logger.debug(
-        f"Converted index_names {unique_index_names} to display_names: {display_names}")
+    logger.debug(f"Converted index_names {unique_index_names} to display_names: {display_names}")
     return display_names if display_names else None
 
 
@@ -889,299 +785,3 @@ def get_enabled_sub_agent_description_for_generate_prompt(agent_id: int, tenant_
 
         sub_agent_info_list.append(sub_agent_info)
     return sub_agent_info_list
-
-
-# ── Jiuwen SDK 集成 ───────────────────────────────────────────────────────────
-
-
-@dataclass
-class OptimizeRequest:
-    """优化请求的统一数据结构"""
-    agent_id: int
-    model_id: int
-    task_description: str
-    section_type: str
-    section_title: str
-    current_content: str
-    feedback: str
-    mode: str = "general"
-    start_pos: Opt[int] = None
-    end_pos: Opt[int] = None
-    tool_ids: Opt[list[int]] = None
-    sub_agent_ids: Opt[list[int]] = None
-    knowledge_base_display_names: Opt[list[str]] = None
-
-
-@dataclass
-class OptimizeResult:
-    """优化结果的统一数据结构"""
-    optimized_content: str
-    source: str
-    section_type: str = ""
-    section_title: str = ""
-    original_content: str = ""
-
-
-class PromptOptimizationService:
-    """提示词优化服务 — 统一入口，模式二选一"""
-
-    def optimize_from_debug(self, agent_id: int, feedback: str, selected, history=None) -> OptimizeResult:
-        """基于调试对话自动优化整个 system prompt（完整模板）。
-
-        Args:
-            selected: OptimizeFromDebugSelected (pydantic model) or any object with user_question/assistant_answer.
-            history: Optional[List[HistoryItem]]
-        """
-        if not (feedback or "").strip():
-            raise AppException(
-                ErrorCode.COMMON_MISSING_REQUIRED_FIELD,
-                "Optimization feedback is required.",
-            )
-
-        if not self.is_jiuwen_mode_available():
-            raise NexentCapabilityError(
-                "Auto optimize from debug requires Jiuwen SDK to be enabled."
-            )
-
-        agent_info = search_agent_info_by_agent_id(
-            agent_id=agent_id, tenant_id=self.tenant_id, version_no=0)
-
-        duty = (agent_info.get("duty_prompt") or "").strip()
-        constraint = (agent_info.get("constraint_prompt") or "").strip()
-        few_shots = (agent_info.get("few_shots_prompt") or "").strip()
-
-        original_full_prompt = "\n\n".join(
-            [
-                "# Duty\n" + duty,
-                "# Constraint\n" + constraint,
-                "# FewShots\n" + few_shots,
-            ]
-        ).strip()
-
-        if not original_full_prompt:
-            raise AppException(
-                ErrorCode.COMMON_MISSING_REQUIRED_FIELD,
-                "Agent system prompt is empty.",
-            )
-
-        user_question = getattr(selected, "user_question", None) or (
-            selected.get("user_question") if isinstance(selected, dict) else "")
-        assistant_answer = getattr(selected, "assistant_answer", None) or (
-            selected.get("assistant_answer") if isinstance(selected, dict) else "")
-
-        bad_case_obj = type("_BadCase", (), {})
-        bc = bad_case_obj()
-        bc.question = user_question or ""
-        bc.answer = assistant_answer or ""
-        bc.label = ""
-        bc.reason = feedback
-
-        adapter_cls = _get_jiuwen_adapter_class()
-        if adapter_cls is None:
-            raise JiuwenSDKError("Jiuwen SDK adapter is unavailable")
-
-        adapter = adapter_cls(
-            model_id=self.model_id, tenant_id=self.tenant_id)
-
-        optimized_full_prompt = adapter.optimize_badcase(
-            prompt=original_full_prompt,
-            bad_cases=[bc],
-            language=self.language,
-        )
-
-        return OptimizeResult(
-            optimized_content=optimized_full_prompt,
-            source="jiuwen",
-            section_type="full_prompt",
-            section_title="system_prompt",
-            original_content=original_full_prompt,
-        )
-
-    def __init__(self, model_id: int, tenant_id: str, language: str):
-        self.model_id = model_id
-        self.tenant_id = tenant_id
-        self.language = language
-
-    def is_jiuwen_mode_available(self) -> bool:
-        """判断 Jiuwen SDK 模式是否可用"""
-        if not ENABLE_JIUWEN_SDK:
-            return False
-
-        return _get_jiuwen_adapter_class() is not None
-
-    def optimize(self, request: OptimizeRequest) -> OptimizeResult:
-        """统一优化入口 — 优先 Jiuwen SDK，失败则降级 nexent 原生"""
-        if self.is_jiuwen_mode_available():
-            logger.info(
-                f"[prompt-optimize] mode={request.mode}, using Jiuwen SDK")
-            try:
-                return self._optimize_with_jiuwen(request)
-            except JiuwenSDKError as e:
-                logger.warning(f"Jiuwen SDK 模式失败，降级到 nexent 原生: {e}")
-                return self._optimize_with_nexent(request)
-        else:
-            return self._optimize_with_nexent(request)
-
-    def _optimize_with_jiuwen(self, request: OptimizeRequest) -> OptimizeResult:
-        """Jiuwen SDK 模式"""
-        logger.info(
-            f"[jiuwen-optimize] mode={request.mode}, start_pos={request.start_pos}, "
-            f"end_pos={request.end_pos}, prompt_len={len(request.current_content)}, "
-            f"feedback_len={len(request.feedback)}"
-        )
-        adapter_cls = _get_jiuwen_adapter_class()
-        if adapter_cls is None:
-            raise JiuwenSDKError("Jiuwen SDK adapter is unavailable")
-
-        adapter = adapter_cls(
-            model_id=self.model_id,
-            tenant_id=self.tenant_id,
-        )
-        result = adapter.optimize(
-            prompt=request.current_content,
-            feedback=request.feedback,
-            mode=request.mode,
-            start_pos=request.start_pos,
-            end_pos=request.end_pos,
-            language=self.language,
-        )
-
-        # Jiuwen insert/select mode returns a fragment by design.
-        # We reassemble the full prompt here so frontend always receives full optimized content.
-        if request.mode == "insert":
-            if request.start_pos is None or not isinstance(request.start_pos, int):
-                raise JiuwenSDKError("insert mode requires start_pos")
-            if request.start_pos < 0 or request.start_pos > len(request.current_content):
-                raise JiuwenSDKError("insert mode start_pos out of bounds")
-            optimized_full = (
-                request.current_content[: request.start_pos]
-                + result
-                + request.current_content[request.start_pos:]
-            )
-        elif request.mode == "select":
-            if request.start_pos is None or request.end_pos is None:
-                raise JiuwenSDKError(
-                    "select mode requires start_pos and end_pos")
-            if not isinstance(request.start_pos, int) or not isinstance(request.end_pos, int):
-                raise JiuwenSDKError(
-                    "select mode start_pos/end_pos must be int")
-            if request.start_pos < 0 or request.end_pos < 0 or request.start_pos >= request.end_pos:
-                raise JiuwenSDKError("select mode start_pos/end_pos invalid")
-            if request.end_pos > len(request.current_content):
-                raise JiuwenSDKError("select mode end_pos out of bounds")
-            optimized_full = (
-                request.current_content[: request.start_pos]
-                + result
-                + request.current_content[request.end_pos:]
-            )
-        else:
-            optimized_full = result
-
-        return OptimizeResult(
-            optimized_content=optimized_full,
-            source="jiuwen",
-            section_type=request.section_type,
-            section_title=request.section_title,
-            original_content=request.current_content,
-        )
-
-    def _optimize_with_nexent(self, request: OptimizeRequest) -> OptimizeResult:
-        """nexent 原生模式 — 只支持 general 模式"""
-        if request.mode != "general":
-            raise NexentCapabilityError(
-                f"nexent 原生模式只支持 general 模式，"
-                f"当前请求 mode={request.mode} 不支持，请启用 Jiuwen SDK"
-            )
-
-        result = optimize_prompt_section_impl(
-            agent_id=request.agent_id,
-            model_id=self.model_id,
-            task_description=request.task_description,
-            tenant_id=self.tenant_id,
-            language=self.language,
-            section_type=request.section_type,
-            section_title=request.section_title,
-            current_content=request.current_content,
-            feedback=request.feedback,
-            tool_ids=request.tool_ids,
-            sub_agent_ids=request.sub_agent_ids,
-            knowledge_base_display_names=request.knowledge_base_display_names,
-        )
-        return OptimizeResult(
-            optimized_content=result["optimized_content"],
-            source="nexent",
-            section_type=result["section_type"],
-            section_title=result["section_title"],
-            original_content=result["original_content"],
-        )
-
-    def optimize_badcase(
-        self,
-        current_content: str,
-        bad_cases: list,
-        agent_id: int,
-        section_type: str,
-        section_title: str,
-        tool_ids: Opt[list[int]] = None,
-        sub_agent_ids: Opt[list[int]] = None,
-        knowledge_base_display_names: Opt[list[str]] = None,
-    ) -> OptimizeResult:
-        """坏案例优化入口 — 优先 Jiuwen SDK，失败则降级"""
-        if self.is_jiuwen_mode_available():
-            logger.info("[prompt-badcase] using Jiuwen SDK")
-            try:
-                return self._optimize_badcase_with_jiuwen(
-                    current_content, bad_cases, section_type, section_title
-                )
-            except JiuwenSDKError as e:
-                logger.warning(f"Jiuwen SDK badcase 模式失败，降级到 nexent 原生: {e}")
-                return self._optimize_badcase_with_nexent(
-                    current_content, bad_cases, agent_id, section_type, section_title,
-                    tool_ids, sub_agent_ids, knowledge_base_display_names,
-                )
-        else:
-            return self._optimize_badcase_with_nexent(
-                current_content, bad_cases, agent_id, section_type, section_title,
-                tool_ids, sub_agent_ids, knowledge_base_display_names,
-            )
-
-    def _optimize_badcase_with_jiuwen(
-        self, current_content: str, bad_cases: list, section_type: str, section_title: str
-    ) -> OptimizeResult:
-        """Jiuwen SDK 坏案例优化"""
-        adapter_cls = _get_jiuwen_adapter_class()
-        if adapter_cls is None:
-            raise JiuwenSDKError("Jiuwen SDK adapter is unavailable")
-
-        adapter = adapter_cls(
-            model_id=self.model_id,
-            tenant_id=self.tenant_id,
-        )
-        result = adapter.optimize_badcase(
-            prompt=current_content,
-            bad_cases=bad_cases,
-            language=self.language,
-        )
-        return OptimizeResult(
-            optimized_content=result,
-            source="jiuwen",
-            section_type=section_type,
-            section_title=section_title,
-            original_content=current_content,
-        )
-
-    def _optimize_badcase_with_nexent(
-        self,
-        current_content: str,
-        bad_cases: list,
-        agent_id: int,
-        section_type: str,
-        section_title: str,
-        tool_ids: Opt[list[int]] = None,
-        sub_agent_ids: Opt[list[int]] = None,
-        knowledge_base_display_names: Opt[list[str]] = None,
-    ) -> OptimizeResult:
-        """nexent 原生模式不支持坏案例优化"""
-        raise NexentCapabilityError(
-            "nexent 原生模式不支持 badcase 优化，请启用 Jiuwen SDK"
-        )
diff --git a/backend/services/remote_mcp_service.py b/backend/services/remote_mcp_service.py
index 7e77a9c43..56a73fb4b 100644
--- a/backend/services/remote_mcp_service.py
+++ b/backend/services/remote_mcp_service.py
@@ -230,7 +230,7 @@ async def add_mcp_service(
     server_url: str,
     tags: list | None,
     authorization_token: str | None,
-    custom_headers: dict | None = None,
+    custom_headers: dict | None,
     container_config: dict | None,
     registry_json: dict | None,
     enabled: bool = False,
diff --git a/backend/services/tool_configuration_service.py b/backend/services/tool_configuration_service.py
index 3cbf5edc5..ba51567dc 100644
--- a/backend/services/tool_configuration_service.py
+++ b/backend/services/tool_configuration_service.py
@@ -782,8 +782,6 @@ def _validate_local_tool(
                 'embedding_model': embedding_model,
                 'rerank_model': rerank_model,
                 'display_name_to_index_map': display_name_to_index_map,
-                # Internal access control: restrict results to specific document paths (path_or_urls)
-                'document_paths': instantiation_params.get('document_paths'),
             }
             tool_instance = tool_class(**params)
         elif tool_name in ["dify_search", "datamate_search"]:
@@ -984,7 +982,6 @@ def import_openapi_service(
     tenant_id: str,
     user_id: str,
     service_description: str = None,
-    headers_template: Dict[str, Any] = None,
     force_update: bool = False
 ) -> Dict[str, Any]:
     """
@@ -998,7 +995,6 @@ def import_openapi_service(
         tenant_id: Tenant ID for multi-tenancy
         user_id: User ID for audit
         service_description: Optional service description (if not provided, reads from openapi_json.info.description)
-        headers_template: Optional default headers template
         force_update: If True, replace all existing tools for this service
 
     Returns:
@@ -1019,8 +1015,7 @@ def import_openapi_service(
         server_url=server_url,
         tenant_id=tenant_id,
         user_id=user_id,
-        description=service_description,
-        headers_template=headers_template,
+        description=service_description
     )
 
     logger.info(f"Imported service '{service_name}' for tenant {tenant_id}")
diff --git a/backend/services/user_management_service.py b/backend/services/user_management_service.py
index 0b38a76bc..a983b25d3 100644
--- a/backend/services/user_management_service.py
+++ b/backend/services/user_management_service.py
@@ -18,7 +18,6 @@
     get_supabase_admin_client,
     calculate_expires_at,
     get_jwt_expiry_seconds,
-    ensure_cas_session_active_from_authorization,
     resolve_tenant_id_from_user_tenant_record,
 )
 from consts.const import (
@@ -108,7 +107,6 @@ def validate_token(token: str) -> Tuple[bool, Optional[Any]]:
     try:
         user = get_current_user_from_client(client, token)
         if user:
-            ensure_cas_session_active_from_authorization(token)
             return True, user
         return False, None
     except Exception as e:
diff --git a/backend/services/vectordatabase_service.py b/backend/services/vectordatabase_service.py
index dd2f6e51a..11c5fd9bf 100644
--- a/backend/services/vectordatabase_service.py
+++ b/backend/services/vectordatabase_service.py
@@ -10,7 +10,6 @@
 4. Health check interface
 """
 import asyncio
-import hashlib
 import json
 import logging
 import os
@@ -29,7 +28,7 @@
 
 from consts.const import DATAMATE_URL, ES_API_KEY, ES_HOST, LANGUAGE, VectorDatabaseType, IS_SPEED_MODE, PERMISSION_EDIT, PERMISSION_READ, ASSET_OWNER_TENANT_ID
 from consts.model import ChunkCreateRequest, ChunkUpdateRequest
-from database.attachment_db import delete_file, file_exists, get_file_stream
+from database.attachment_db import delete_file, get_file_stream
 from database.knowledge_db import (
     create_knowledge_record,
     delete_knowledge_record,
@@ -354,18 +353,15 @@ def get_embedding_model(
         tenant_id: Tenant ID
         model_name: Optional display name of the embedding model to use.
                    If provided, will find the model by display_name in the tenant's model list.
-        model_type: Optional model type filter. When model_name is omitted, queries tenant
-                   model records by this type; when model_type is also omitted, prefers
-                   embedding models, then multi_embedding models.
 
     Returns:
         Tuple of (embedding model instance or None, model_id or None)
     """
     if model_name:
         try:
-            model_type = _normalize_model_type(model_type)
-            if model_type:
-                model = get_model_by_display_name(model_name, tenant_id, model_type)
+            normalized_model_type = _normalize_model_type(model_type)
+            if normalized_model_type:
+                model = get_model_by_display_name(model_name, tenant_id, normalized_model_type)
             else:
                 model = get_model_by_display_name(model_name, tenant_id)
 
@@ -376,25 +372,8 @@ def get_embedding_model(
             return _create_embedding_model(model), model.get("model_id")
         except Exception as e:
             logger.warning(f"Failed to get embedding model by name {model_name}: {e}")
-    else:
-        try:
-            if model_type:
-                records = get_model_records({"model_type": model_type}, tenant_id)
-            else:
-                records = get_model_records({"model_type": "embedding"}, tenant_id)
-                if not records:
-                    records = get_model_records({"model_type": "multi_embedding"}, tenant_id)
-
-            if records:
-                model = records[0]
-                if model.get("model_type") in ["embedding", "multi_embedding"]:
-                    return _create_embedding_model(model), model.get("model_id")
-                logger.warning(
-                    f"Resolved model is not an embedding model: {model.get('model_type')}"
-                )
-        except Exception as e:
-            logger.warning(f"Failed to get default embedding model for tenant {tenant_id}: {e}")
 
+    # No default fallback - return None, None when no model is specified or found
     return None, None
 
 
@@ -657,7 +636,6 @@ def create_knowledge_base(
             group_ids: Optional[List[int]] = None,
             embedding_model_name: Optional[str] = None,
             is_multimodal: Optional[bool] = None,
-            preserve_source_file: Optional[bool] = None,
     ):
         """
         Create a new knowledge base with a user-facing name and an internal Elasticsearch index name.
@@ -677,8 +655,6 @@ def create_knowledge_base(
             group_ids: List of group IDs (optional)
             embedding_model_name: Specific embedding model name to use (optional).
                                    If provided, will use this model instead of tenant default.
-            preserve_source_file: Whether to preserve uploaded source documents after
-                                   vectorization (optional; defaults to True when omitted).
 
         For backward compatibility, legacy callers can still use create_index() directly
         with an explicit index_name.
@@ -718,8 +694,6 @@ def create_knowledge_base(
                 knowledge_data["ingroup_permission"] = ingroup_permission
             if group_ids is not None:
                 knowledge_data["group_ids"] = group_ids
-            if preserve_source_file is not None:
-                knowledge_data["preserve_source_file"] = preserve_source_file
 
             record_info = create_knowledge_record(knowledge_data)
             index_name = record_info["index_name"]
@@ -1117,7 +1091,6 @@ def list_indices(
                         # Auto-summary settings
                         "summary_frequency": record.get("summary_frequency"),
                         "last_summary_time": record.get("last_summary_time"),
-                        "preserve_source_file": record.get("preserve_source_file", True),
                         "stats": index_stats,
                     })
 
@@ -1515,11 +1488,6 @@ async def list_files(
                     # chunk_count is already set from ES aggregation (doc_count)
                     file_data['chunk_count'] = file_data.get('chunk_count', 0)
 
-            for file_data in files:
-                file_data["source_available"] = (
-                    ElasticSearchService._compute_source_available(file_data)
-                )
-
             total_duration = time.time() - total_start_time
             logger.info(f"[list_files:complete] index={index_name}, total_files={len(files)}, "
                        f"total_duration={total_duration:.3f}s")
@@ -1530,100 +1498,6 @@ async def list_files(
             raise Exception(
                 f"Error getting file list for index {index_name}: {str(e)}")
 
-    DOCUMENT_DELETE_SCOPES = ("source_only", "full")
-
-    @staticmethod
-    def _preview_pdf_cache_object_name(object_name: str) -> str:
-        """Object key for Office-to-PDF preview cache (matches file_management_service)."""
-        name_without_ext = (
-            object_name.rsplit(".", 1)[0] if "." in object_name else object_name
-        )
-        hash_suffix = hashlib.md5(object_name.encode()).hexdigest()[:8]
-        return f"preview/converted/{name_without_ext}_{hash_suffix}.pdf"
-
-    @staticmethod
-    def _compute_source_available(file_data: Dict[str, Any]) -> bool:
-        path_or_url = file_data.get("path_or_url") or ""
-        status = file_data.get("status", "")
-        if status != "COMPLETED":
-            return True
-        if path_or_url.startswith("knowledge_base/"):
-            return file_exists(path_or_url)
-        return True
-
-    @staticmethod
-    def delete_source_file(path_or_url: str) -> Dict[str, Any]:
-        """Remove MinIO source (and preview cache); does not touch Elasticsearch."""
-        minio_result = delete_file(path_or_url)
-        deleted_minio = bool(minio_result.get("success"))
-
-        if path_or_url.startswith("knowledge_base/"):
-            preview_key = ElasticSearchService._preview_pdf_cache_object_name(
-                path_or_url
-            )
-            try:
-                if file_exists(preview_key):
-                    delete_file(preview_key)
-            except Exception as exc:
-                logger.warning(
-                    "Failed to delete preview cache for '%s': %s",
-                    path_or_url,
-                    exc,
-                )
-
-        return {"deleted_minio": deleted_minio}
-
-    @staticmethod
-    async def _assert_source_only_deletable(
-            index_name: str, path_or_url: str
-    ) -> None:
-        celery_task_files = await get_all_files_status(index_name)
-        status_info = celery_task_files.get(path_or_url)
-        if not status_info or not isinstance(status_info, dict):
-            return
-        state = status_info.get("state") or ""
-        if state and state != "COMPLETED":
-            raise ValueError(
-                f"Cannot delete source file while document is in state '{state}'. "
-                "Wait until processing completes or use scope=full to remove the document."
-            )
-
-    @staticmethod
-    async def delete_document_by_scope(
-            index_name: str,
-            path_or_url: str,
-            scope: str,
-            vdb_core: VectorDatabaseCore,
-    ) -> Dict[str, Any]:
-        if scope not in ElasticSearchService.DOCUMENT_DELETE_SCOPES:
-            raise ValueError(
-                f"Invalid scope '{scope}'. "
-                f"Must be one of: {ElasticSearchService.DOCUMENT_DELETE_SCOPES}"
-            )
-
-        if scope == "source_only":
-            await ElasticSearchService._assert_source_only_deletable(
-                index_name, path_or_url
-            )
-            minio_part = ElasticSearchService.delete_source_file(path_or_url)
-            return {
-                "status": "success",
-                "scope": scope,
-                "deleted_es_count": 0,
-                "deleted_minio": minio_part.get("deleted_minio", False),
-                "source_available": False,
-                "message": (
-                    "Source file deleted; index chunks and vectors preserved."
-                ),
-            }
-
-        result = ElasticSearchService.delete_documents(
-            index_name, path_or_url, vdb_core
-        )
-        result["scope"] = scope
-        result["source_available"] = False
-        return result
-
     @staticmethod
     def delete_documents(
             index_name: str = Path(..., description="Name of the index"),
diff --git a/backend/utils/auth_utils.py b/backend/utils/auth_utils.py
index a7194f050..04e81e6e3 100644
--- a/backend/utils/auth_utils.py
+++ b/backend/utils/auth_utils.py
@@ -326,13 +326,16 @@ def calculate_expires_at(token: Optional[str] = None) -> int:
     return int((datetime.now() + timedelta(seconds=expiry_seconds)).timestamp())
 
 
-def _decode_jwt_token(authorization: str) -> dict:
+def _extract_user_id_from_jwt_token(authorization: str) -> Optional[str]:
     """
     Extract user ID from JWT token after verifying signature and expiration.
 
     Args:
         authorization: Authorization header value
 
+    Returns:
+        Optional[str]: User ID from the "sub" claim, or None if the claim is absent
+
     Raises:
         UnauthorizedError: If token is invalid, expired, or signature verification fails
     """
@@ -352,12 +355,17 @@ def _decode_jwt_token(authorization: str) -> dict:
 
         # Decode and verify JWT (signature + expiration)
         # verify_aud=False: allow tokens with aud claim (e.g. test JWT, Supabase) without strict audience check
-        return jwt.decode(
+        decoded = jwt.decode(
             token,
             SUPABASE_JWT_SECRET,
             algorithms=["HS256"],
             options={"verify_exp": True, "verify_aud": False},
         )
+
+        # Extract user ID from JWT claims
+        user_id = decoded.get("sub")
+
+        return user_id
     except jwt.ExpiredSignatureError:
         logging.warning("Token expired")
         raise UnauthorizedError("Token has expired")
@@ -370,47 +378,10 @@ def _decode_jwt_token(authorization: str) -> dict:
     except UnauthorizedError:
         raise
     except Exception as e:
-        logging.error(f"Failed to decode token: {str(e)}")
+        logging.error(f"Failed to extract user ID from token: {str(e)}")
         raise UnauthorizedError("Invalid or expired authentication token")
 
 
-def _extract_user_id_from_jwt_token(authorization: str) -> Optional[str]:
-    """
-    Extract user ID from JWT token after verifying signature and expiration.
-    """
-    decoded = _decode_jwt_token(authorization)
-    return decoded.get("sub")
-
-
-def extract_session_id_from_authorization(authorization: Optional[str]) -> Optional[str]:
-    """Extract the sid claim without enforcing token validity, for idempotent logout."""
-    if not authorization:
-        return None
-    try:
-        token = (
-            authorization.replace("Bearer ", "")
-            if authorization.startswith("Bearer ")
-            else authorization
-        )
-        decoded = jwt.decode(token, options={"verify_signature": False})
-        sid = decoded.get("sid")
-        return str(sid) if sid else None
-    except Exception:
-        return None
-
-
-def ensure_cas_session_active_from_authorization(authorization: Optional[str]) -> None:
-    """Reject CAS-issued JWTs whose server-side session is expired or revoked."""
-    session_id = extract_session_id_from_authorization(authorization)
-    if not session_id:
-        return
-
-    from database.cas_session_db import is_cas_session_active
-
-    if not is_cas_session_active(str(session_id)):
-        raise UnauthorizedError("CAS session has expired or been revoked")
-
-
 def get_current_user_id(authorization: Optional[str] = None) -> tuple[str, str]:
     """
     Get current user ID and tenant ID from authorization token
@@ -434,13 +405,10 @@ def get_current_user_id(authorization: Optional[str] = None) -> tuple[str, str]:
         raise UnauthorizedError("No authorization header provided")
 
     try:
-        decoded = _decode_jwt_token(authorization)
-        user_id = decoded.get("sub")
+        user_id = _extract_user_id_from_jwt_token(authorization)
         if not user_id:
             raise UnauthorizedError("Invalid or expired authentication token")
 
-        ensure_cas_session_active_from_authorization(authorization)
-
         user_tenant_record = get_user_tenant_by_user_id(user_id)
         if user_tenant_record and user_tenant_record.get("tenant_id"):
             tenant_id = user_tenant_record["tenant_id"]
@@ -453,8 +421,6 @@ def get_current_user_id(authorization: Optional[str] = None) -> tuple[str, str]:
 
         return user_id, tenant_id
 
-    except UnauthorizedError:
-        raise
     except Exception as e:
         logging.error(f"Failed to get user ID and tenant ID: {str(e)}")
         raise UnauthorizedError("Invalid or expired authentication token")
@@ -506,7 +472,7 @@ def generate_test_jwt(user_id: str, expires_in: int = 3600) -> str:
     return jwt.encode(payload, MOCK_JWT_SECRET_KEY, algorithm="HS256")
 
 
-def generate_session_jwt(user_id: str, expires_in: int = 3600, session_id: str = None) -> str:
+def generate_session_jwt(user_id: str, expires_in: int = 3600) -> str:
     """Generate a signed JWT compatible with the existing auth verification flow."""
     now = int(time.time())
     payload = {
@@ -517,8 +483,6 @@ def generate_session_jwt(user_id: str, expires_in: int = 3600, session_id: str =
         "exp": now + expires_in,
         "iss": SUPABASE_URL,
     }
-    if session_id:
-        payload["sid"] = session_id
     return jwt.encode(payload, SUPABASE_JWT_SECRET, algorithm="HS256")
 
 
diff --git a/backend/utils/context_utils.py b/backend/utils/context_utils.py
index 0c3af8915..740bf66df 100644
--- a/backend/utils/context_utils.py
+++ b/backend/utils/context_utils.py
@@ -8,6 +8,7 @@
 allowing ContextManager to assemble them in the correct order.
 """
 
+from datetime import datetime
 from typing import TYPE_CHECKING, Any, Dict, List, Optional
 
 if TYPE_CHECKING:
@@ -507,12 +508,13 @@ def _format_agent_fallback(
     return "- 当前没有可用的助手" if language == "zh" else "- No agents are currently available"
 
 
-def _format_app_context(app_name: str, app_description: str, user_id: str) -> str:
+def _format_app_context(app_name: str, app_description: str, user_id: str, time_str: str) -> str:
     """Format application context for system prompt injection."""
     lines = [
         f"Application: {app_name}",
         f"Description: {app_description}",
         f"Current user: {user_id}",
+        f"Current time: {time_str}",
     ]
     return "\n".join(lines)
 
@@ -526,6 +528,7 @@ def _format_app_context(app_name: str, app_description: str, user_id: str) -> st
 def build_skeleton_header_component(
     app_name: str,
     app_description: str,
+    time_str: str,
     user_id: str,
     language: str = "zh",
     priority: int = 100,
@@ -533,17 +536,14 @@ def build_skeleton_header_component(
     """Build SystemPromptComponent for the header section.
 
     Section: "### 基本信息" / "### Basic Information"
-    Content: Agent identity, app name/description, user_id.
-    Note: Current time is intentionally excluded from the system prompt so the
-    static system prefix can hit the LLM KV/prompt cache across requests. The
-    current time is injected on the user-message side instead (see CoreAgent.run).
+    Content: Agent identity, app name/description, time, user_id (user_id only in the zh text)
     """
     from nexent.core.agents.agent_model import SystemPromptComponent
 
     if language == "zh":
-        content = f"### 基本信息\n你是{app_name}，{app_description}，用户ID为{user_id}"
+        content = f"### 基本信息\n你是{app_name}，{app_description}，现在是{time_str}，用户ID为{user_id}"
     else:
-        content = f"### Basic Information\nYou are {app_name}, {app_description}"
+        content = f"### Basic Information\nYou are {app_name}, {app_description}, it is {time_str} now"
 
     return SystemPromptComponent(
         content=content,
@@ -611,11 +611,6 @@ def build_skeleton_execution_flow_component(
         lines.append("   - 注意运行的代码不会被用户看到，所以如果用户需要看到代码，你需要使用'<DISPLAY:语言类型>代码</DISPLAY>'表达展示代码。")
         lines.append("   - **重要**：代码执行后，系统会返回 \"Observation:\" 标记的内容（这是真实的执行结果）。请基于这些真实结果继续下一步思考，**不要在代码执行前自行编造观察结果**。")
         lines.append("")
-        lines.append("3. 自验证：")
-        lines.append("   - 关键事件（工具调用、检索结果、代码执行、助手返回、准备最终回答）后，系统会进行显式自验证。")
-        lines.append("   - 如果自验证提示存在错误、证据不足、参数不完整或结果不可靠，必须优先修正、补充证据、重新调用工具，或清晰说明无法完成的部分。")
-        lines.append("   - 最终回答只有在自验证通过后才会展示给用户；如果系统返回 Verification feedback，请把它视为真实观察结果继续修正，不要忽略。")
-        lines.append("")
         lines.append("在思考结束后，当你认为可以回答用户问题，那么可以不生成代码，直接生成最终回答给到用户并停止循环。")
         lines.append("")
         lines.append("生成最终回答时，你需要遵循以下规范：")
@@ -657,11 +652,6 @@ def build_skeleton_execution_flow_component(
         lines.append("   - Note that executed code is not visible to users. If users need to see the code, use '<DISPLAY:language_type>code</DISPLAY>' for displaying code.")
         lines.append("   - **IMPORTANT**: After code execution, the system will return content with \"Observation:\" marker (this is the real execution result). Please continue your next thinking based on these real results. **Do NOT fabricate observation results before code execution.**")
         lines.append("")
-        lines.append("3. Self-verification:")
-        lines.append("   - After critical events (tool calls, retrieval results, code execution, agent handoffs, and final-answer preparation), the system may run explicit verification.")
-        lines.append("   - If verification reports errors, insufficient evidence, incomplete parameters, or unreliable results, you must repair the issue, gather more evidence, call tools again, or clearly state what cannot be completed.")
-        lines.append("   - The final answer is shown to the user only after verification passes. If the system returns Verification feedback, treat it as a real observation and continue revising.")
-        lines.append("")
         lines.append("After thinking, when you believe you can answer the user's question, you can generate a final answer directly to the user without generating code and stop the loop.")
         lines.append("")
         lines.append("When generating the final answer, you need to follow these specifications:")
@@ -1122,6 +1112,7 @@ def build_context_components(
     few_shots: Optional[str] = None,
     app_name: Optional[str] = None,
     app_description: Optional[str] = None,
+    time_str: Optional[str] = None,
     user_id: Optional[str] = None,
     language: str = "zh",
     is_manager: bool = True,
@@ -1176,6 +1167,7 @@ def build_context_components(
         few_shots: Example templates text
         app_name: Application name
         app_description: Application description
+        time_str: Current time string
         user_id: Current user ID
         language: Language code ('zh' or 'en')
         is_manager: Whether this is a manager agent
@@ -1196,11 +1188,12 @@ def build_context_components(
     components: List = []
 
     # 1. Header
-    if app_name and app_description and user_id:
+    if app_name and app_description and time_str and user_id:
         components.append(
             build_skeleton_header_component(
                 app_name=app_name,
                 app_description=app_description,
+                time_str=time_str,
                 user_id=user_id,
                 language=language,
             )
@@ -1335,4 +1328,5 @@ def build_app_context_string(
     Returns:
         Formatted app context string
     """
-    return _format_app_context(app_name, app_description, user_id)
+    time_str = datetime.now().strftime("%Y-%m-%d %H:%M:%S")
+    return _format_app_context(app_name, app_description, user_id, time_str)
\ No newline at end of file
diff --git a/backend/utils/http_client_utils.py b/backend/utils/http_client_utils.py
index 262c0a593..1c1d14af6 100644
--- a/backend/utils/http_client_utils.py
+++ b/backend/utils/http_client_utils.py
@@ -8,7 +8,6 @@ def create_httpx_client(
     headers: dict[str, str] | None = None,
     timeout: httpx.Timeout | None = None,
     auth: httpx.Auth | None = None,
-    **kwargs,
 ) -> AsyncClient:
     return AsyncClient(
         headers=headers,
@@ -16,5 +15,4 @@ def create_httpx_client(
         auth=auth,
         trust_env=False,
         verify=False,
-        **kwargs,
     )
diff --git a/backend/utils/memory_utils.py b/backend/utils/memory_utils.py
index e3ba01d6d..ada7019a1 100644
--- a/backend/utils/memory_utils.py
+++ b/backend/utils/memory_utils.py
@@ -1,5 +1,4 @@
 import logging
-import re
 from typing import Dict, Any
 from urllib.parse import urlparse
 
@@ -10,11 +9,6 @@
 logger = logging.getLogger("memory_utils")
 
 
-def _sanitize_index_component(value: str) -> str:
-    """Convert arbitrary text into an Elasticsearch-safe index component."""
-    return re.sub(r"[^a-z0-9_.-]", "_", value.lower())
-
-
 def build_memory_config(tenant_id: str) -> Dict[str, Any]:
     """Return a fully-validated configuration dictionary for *mem0* ``Memory``.
     """
@@ -36,8 +30,9 @@ def build_memory_config(tenant_id: str) -> Dict[str, Any]:
     es_host = f"{parsed.scheme}://{parsed.hostname}"
     es_port = parsed.port
     # Normalize repo/name to avoid problematic characters in index names
-    safe_repo = _sanitize_index_component(embed_raw["model_repo"]) if embed_raw["model_repo"] else ""
-    safe_name = _sanitize_index_component(embed_raw["model_name"])
+    safe_repo = embed_raw["model_repo"].lower().replace(
+        "/", "_") if embed_raw["model_repo"] else ""
+    safe_name = embed_raw["model_name"].lower().replace("/", "_")
     index_name = (
         f"mem0_{safe_repo}_{safe_name}_{embed_raw['max_tokens']}"
         if embed_raw["model_repo"]
@@ -78,4 +73,4 @@ def build_memory_config(tenant_id: str) -> Dict[str, Any]:
         },
         "telemetry": {"enabled": False},
     }
-    return memory_config
+    return memory_config 
\ No newline at end of file
diff --git a/backend/utils/prompt_template_utils.py b/backend/utils/prompt_template_utils.py
index 299d3bf94..8822e5fd4 100644
--- a/backend/utils/prompt_template_utils.py
+++ b/backend/utils/prompt_template_utils.py
@@ -99,10 +99,6 @@ def get_prompt_template(template_type: str, language: str = LANGUAGE["ZH"], **kw
             LANGUAGE["ZH"]: 'backend/prompts/utils/generate_title_zh.yaml',
             LANGUAGE["EN"]: 'backend/prompts/utils/generate_title_en.yaml'
         },
-        'greeting_generate': {
-            LANGUAGE["ZH"]: 'backend/prompts/utils/greeting_generate_zh.yaml',
-            LANGUAGE["EN"]: 'backend/prompts/utils/greeting_generate_en.yaml'
-        },
         'document_summary': {
             LANGUAGE["ZH"]: 'backend/prompts/document_summary_agent_zh.yaml',
             LANGUAGE["EN"]: 'backend/prompts/document_summary_agent_en.yaml'
diff --git a/doc/docs/en/quick-start/installation.md b/doc/docs/en/quick-start/installation.md
index 7b6a9cb76..0b1544819 100644
--- a/doc/docs/en/quick-start/installation.md
+++ b/doc/docs/en/quick-start/installation.md
@@ -273,114 +273,6 @@ Provider enablement rules:
 
 For local Docker, a GitHub callback example is `http://localhost:3000/api/user/oauth/callback?provider=github`. In production, use a public HTTPS domain such as `https://nexent.example.com/api/user/oauth/callback?provider=github` and register the exact same URL in the OAuth provider console.
 
-### CAS Login Configuration
-
-CAS SSO does not require the `supabase` component. Set `CAS_CALLBACK_BASE_URL` to the browser-accessible Nexent Web URL without a trailing `/`. `CAS_SERVER_URL` is the CAS Server root URL and should also not include a trailing `/`.
-
-For Docker, configure CAS in `docker/.env`:
-
-```bash
-CAS_ENABLED=true
-CAS_SERVER_URL=http://localhost:8080/cas
-CAS_VALIDATE_PATH=/p3/serviceValidate
-CAS_CALLBACK_BASE_URL=http://localhost:3000
-
-# disabled: disable the CAS login entry and automatic redirects
-# button: show CAS as an optional login button
-# force: redirect unauthenticated Nexent users to CAS automatically
-CAS_LOGIN_MODE=force
-
-# Empty means use <cas:user>; set userName to read <cas:attributes><cas:userName>
-CAS_USER_ATTRIBUTE=
-CAS_EMAIL_ATTRIBUTE=email
-CAS_ROLE_ATTRIBUTE=role
-CAS_TENANT_ATTRIBUTE=tenant_id
-CAS_ROLE_MAP_JSON={"cas-admin":"ADMIN","cas-user":"USER"}
-CAS_SESSION_MAX_AGE_SECONDS=3600
-LOCAL_SESSION_MAX_AGE_SECONDS=3600
-CAS_RENEW_BEFORE_SECONDS=300
-CAS_RENEW_TIMEOUT_SECONDS=10
-CAS_SYNTHETIC_EMAIL_DOMAIN=cas.local
-
-# Empty means Nexent logout will not call the CAS Server logout endpoint.
-# /logout is resolved against CAS_SERVER_URL.
-CAS_LOGOUT_URL=/logout
-CAS_SSL_VERIFY=true
-CAS_CA_BUNDLE=
-```
-
-Common CAS URLs:
-
-| Purpose | URL |
-|---------|-----|
-| Nexent login entry | `{CAS_CALLBACK_BASE_URL}/api/user/cas/login?redirect=/` |
-| CAS service callback | `{CAS_CALLBACK_BASE_URL}/api/user/cas/callback` |
-| CAS silent renewal callback | `{CAS_CALLBACK_BASE_URL}/api/user/cas/renew_callback` |
-| CAS single logout callback | `POST {CAS_CALLBACK_BASE_URL}/api/user/cas/logout_callback` |
-
-For Apereo CAS JSON Service Registry, create a service registration file such as `Nexent-10001.json` in the service registry directory configured by your CAS deployment. The `id` must be globally unique. This is a local Docker example:
-
-```json
-{
-  "@class": "org.apereo.cas.services.RegexRegisteredService",
-  "serviceId": "http://localhost:3000.*",
-  "name": "Nexent CAS Client",
-  "id": 10001,
-  "description": "Nexent CAS SSO client",
-  "evaluationOrder": 1,
-  "logoutType": "BACK_CHANNEL",
-  "logoutUrl": "http://localhost:3000/api/user/cas/logout_callback"
-}
-```
-
-In production, keep `CAS_SSL_VERIFY=true`; for self-signed certificates, prefer `CAS_CA_BUNDLE` and only use `CAS_SSL_VERIFY=false` for local testing.
-
-#### CAS Integration with ModelEngine
-
-When integrating with ModelEngine through the CAS protocol, deploy Nexent with the following configuration:
-
-```bash
-CAS_ENABLED=true
-CAS_SERVER_URL=https://<ModelEngine IP>:5443/SSOSvr
-CAS_VALIDATE_PATH=/p3/serviceValidate
-CAS_CALLBACK_BASE_URL=http://<Nexent IP>:3000
-CAS_LOGIN_MODE=force
-CAS_USER_ATTRIBUTE=userName
-CAS_EMAIL_ATTRIBUTE=email
-CAS_ROLE_ATTRIBUTE=userType
-CAS_TENANT_ATTRIBUTE=tenant_id
-CAS_ROLE_MAP_JSON={"1":"ADMIN","3":"DEV"}
-CAS_SESSION_MAX_AGE_SECONDS=3600
-LOCAL_SESSION_MAX_AGE_SECONDS=3600
-CAS_RENEW_BEFORE_SECONDS=300
-CAS_RENEW_TIMEOUT_SECONDS=10
-CAS_SYNTHETIC_EMAIL_DOMAIN=cas.local
-CAS_LOGOUT_URL=/logout?service=http://<Nexent IP>:3000
-CAS_SSL_VERIFY=false
-CAS_CA_BUNDLE=
-```
-
-You also need to add a CAS client service registration file in the OMS container. Use the following steps as a reference:
-
-```bash
-# Create the registration file, paste the JSON content into it, and save it.
-vim Nexent-10000001.json
-{
-  "@class": "org.apereo.cas.services.CasRegisteredService",
-  "serviceId": "http://<Nexent IP>:3000.*",
-  "name": "Nexent CAS Client",
-  "id": 1000001,
-  "description": "Nexent CAS SSO client",
-  "evaluationOrder": 1,
-  "logoutType": "BACK_CHANNEL",
-  "logoutUrl": "http://<Nexent IP>:3000/api/user/cas/logout_callback"
-}
-
-# Run the following command to copy the registration file into the container.
-kubectl cp Nexent-10000001.json model-engine/$(kubectl get pods -n model-engine -l app=oms --no-headers | awk '{print $1}'):/opt/huawei/fce/apps/platform/webapps/SSOSvr/WEB-INF/classes/services/Nexent-10000001.json
-kubectl exec -i -n model-engine $(kubectl get pods -n model-engine -l app=oms --no-headers | awk '{print $1}') -- chown tomcat:fusioncube /opt/huawei/fce/apps/platform/webapps/SSOSvr/WEB-INF/classes/services/Nexent-10000001.json
-```
-
 ### Northbound Interface Configuration (NORTHBOUND_EXTERNAL_URL)
 
 If you need to use any of the following features, configure the `NORTHBOUND_EXTERNAL_URL` environment variable:
diff --git a/doc/docs/en/quick-start/kubernetes-installation.md b/doc/docs/en/quick-start/kubernetes-installation.md
index a10873c7c..8253c411f 100644
--- a/doc/docs/en/quick-start/kubernetes-installation.md
+++ b/doc/docs/en/quick-start/kubernetes-installation.md
@@ -291,122 +291,6 @@ Provider callback URLs:
 
 For local NodePort, a GitHub callback example is `http://localhost:30000/api/user/oauth/callback?provider=github`. In production, use a public HTTPS domain and register the exact same URL in the OAuth provider console.
 
-### CAS Login Configuration
-
-CAS SSO does not require the `supabase` component. Set `nexent-common.config.cas.callbackBaseUrl` to the browser-accessible Nexent Web URL without a trailing `/`. `nexent-common.config.cas.serverUrl` is the CAS Server root URL and should also not include a trailing `/`.
-
-Kubernetes writes CAS settings into backend environment variables through `nexent-common` `config.cas.*` values:
-
-```bash
-helm upgrade --install nexent nexent \
-  --namespace nexent --create-namespace \
-  --set nexent-common.config.cas.enabled=true \
-  --set nexent-common.config.cas.serverUrl=https://cas.example.com/cas \
-  --set nexent-common.config.cas.callbackBaseUrl=https://nexent.example.com \
-  --set nexent-common.config.cas.loginMode=force \
-  --set nexent-common.config.cas.logoutUrl=/logout
-```
-
-Configurable CAS values:
-
-| Value | Environment variable | Description |
-|-------|----------------------|-------------|
-| `nexent-common.config.cas.enabled` | `CAS_ENABLED` | Enables CAS |
-| `nexent-common.config.cas.serverUrl` | `CAS_SERVER_URL` | CAS Server root URL |
-| `nexent-common.config.cas.validatePath` | `CAS_VALIDATE_PATH` | serviceValidate path, default `/p3/serviceValidate` |
-| `nexent-common.config.cas.callbackBaseUrl` | `CAS_CALLBACK_BASE_URL` | Web entry URL; CAS callback paths are appended automatically |
-| `nexent-common.config.cas.loginMode` | `CAS_LOGIN_MODE` | `disabled`, `button`, or `force` |
-| `nexent-common.config.cas.userAttribute` | `CAS_USER_ATTRIBUTE` | User identifier attribute. Empty means use `<cas:user>` |
-| `nexent-common.config.cas.emailAttribute` | `CAS_EMAIL_ATTRIBUTE` | Email attribute |
-| `nexent-common.config.cas.roleAttribute` | `CAS_ROLE_ATTRIBUTE` | Role attribute |
-| `nexent-common.config.cas.tenantAttribute` | `CAS_TENANT_ATTRIBUTE` | Tenant attribute |
-| `nexent-common.config.cas.roleMapJson` | `CAS_ROLE_MAP_JSON` | JSON mapping from CAS roles to Nexent roles |
-| `nexent-common.config.cas.sessionMaxAgeSeconds` | `CAS_SESSION_MAX_AGE_SECONDS` | Maximum local CAS session lifetime |
-| `nexent-common.config.cas.localSessionMaxAgeSeconds` | `LOCAL_SESSION_MAX_AGE_SECONDS` | Nexent local session lifetime |
-| `nexent-common.config.cas.renewBeforeSeconds` | `CAS_RENEW_BEFORE_SECONDS` | Trigger silent renewal within this many seconds before expiry |
-| `nexent-common.config.cas.renewTimeoutSeconds` | `CAS_RENEW_TIMEOUT_SECONDS` | Silent renewal timeout |
-| `nexent-common.config.cas.syntheticEmailDomain` | `CAS_SYNTHETIC_EMAIL_DOMAIN` | Domain used when CAS does not return an email |
-| `nexent-common.config.cas.logoutUrl` | `CAS_LOGOUT_URL` | CAS logout URL. Empty means Nexent logout will not call the CAS Server logout endpoint |
-| `nexent-common.config.cas.sslVerify` | `CAS_SSL_VERIFY` | Whether to verify CAS Server TLS certificates |
-| `nexent-common.config.cas.caBundle` | `CAS_CA_BUNDLE` | Custom CA bundle path |
-
-Common CAS URLs:
-
-| Purpose | URL |
-|---------|-----|
-| Nexent login entry | `{CAS_CALLBACK_BASE_URL}/api/user/cas/login?redirect=/` |
-| CAS service callback | `{CAS_CALLBACK_BASE_URL}/api/user/cas/callback` |
-| CAS silent renewal callback | `{CAS_CALLBACK_BASE_URL}/api/user/cas/renew_callback` |
-| CAS single logout callback | `POST {CAS_CALLBACK_BASE_URL}/api/user/cas/logout_callback` |
-
-For Apereo CAS JSON Service Registry, create a service registration file such as `Nexent-10001.json` in the service registry directory configured by your CAS deployment. The `id` must be globally unique. This is a local NodePort example:
-
-```json
-{
-  "@class": "org.apereo.cas.services.RegexRegisteredService",
-  "serviceId": "http://localhost:30000.*",
-  "name": "Nexent CAS Client",
-  "id": 10001,
-  "description": "Nexent CAS SSO client",
-  "evaluationOrder": 1,
-  "logoutType": "BACK_CHANNEL",
-  "logoutUrl": "http://localhost:30000/api/user/cas/logout_callback"
-}
-```
-
-In production, keep `CAS_SSL_VERIFY=true`; for self-signed certificates, prefer `CAS_CA_BUNDLE` and only use `CAS_SSL_VERIFY=false` for local testing.
-
-#### CAS Integration with ModelEngine
-
-When integrating with ModelEngine through the CAS protocol, use a values file to configure Nexent. This avoids complex command-line escaping for `CAS_ROLE_MAP_JSON`.
-
-Create `cas-modelengine-values.yaml`:
-
-```yaml
-nexent-common:
-  config:
-    cas:
-      enabled: true
-      serverUrl: "https://<ModelEngine IP>:5443/SSOSvr"
-      validatePath: "/p3/serviceValidate"
-      callbackBaseUrl: "http://<Nexent IP>:30000"
-      loginMode: "force"
-      userAttribute: "userName"
-      emailAttribute: "email"
-      roleAttribute: "userType"
-      tenantAttribute: "tenant_id"
-      roleMapJson: '{"1":"ADMIN","3":"DEV"}'
-      sessionMaxAgeSeconds: 3600
-      localSessionMaxAgeSeconds: 3600
-      renewBeforeSeconds: 300
-      renewTimeoutSeconds: 10
-      syntheticEmailDomain: "cas.local"
-      logoutUrl: "/logout?service=http://<Nexent IP>:30000"
-      sslVerify: false
-      caBundle: ""
-```
-
-You also need to add a CAS client service registration file in the OMS container. Use the following steps as a reference:
-
-```bash
-# Create the registration file, paste the JSON content into it, and save it.
-vim Nexent-10000001.json
-{
-  "@class": "org.apereo.cas.services.CasRegisteredService",
-  "serviceId": "http://<Nexent IP>:30000.*",
-  "name": "Nexent CAS Client",
-  "id": 1000001,
-  "description": "Nexent CAS SSO client",
-  "evaluationOrder": 1,
-  "logoutType": "BACK_CHANNEL",
-  "logoutUrl": "http://<Nexent IP>:30000/api/user/cas/logout_callback"
-}
-
-# Run the following command to copy the registration file into the container.
-kubectl cp Nexent-10000001.json model-engine/$(kubectl get pods -n model-engine -l app=oms --no-headers | awk '{print $1}'):/opt/huawei/fce/apps/platform/webapps/SSOSvr/WEB-INF/classes/services/Nexent-10000001.json
-kubectl exec -i -n model-engine $(kubectl get pods -n model-engine -l app=oms --no-headers | awk '{print $1}') -- chown tomcat:fusioncube /opt/huawei/fce/apps/platform/webapps/SSOSvr/WEB-INF/classes/services/Nexent-10000001.json
-```
-
 ## 🔍 Troubleshooting
 
 ### Check Pod Status
diff --git a/doc/docs/en/user-guide/agent-development.md b/doc/docs/en/user-guide/agent-development.md
index 8e6b47d4f..7637cd620 100644
--- a/doc/docs/en/user-guide/agent-development.md
+++ b/doc/docs/en/user-guide/agent-development.md
@@ -111,18 +111,6 @@ In the External A2A Agent list, you can view and manage all discovered external
 > - Batch integrate all agents from the same service registry through Nacos discovery
 > - Configure protocols to meet the requirements of different agent service providers
 
-###### Integrate [DataAgent](https://gitcode.com/datagallery/dataagent) A2A Agent via URL
-
-1. Refer to the [DataAgent documentation](https://gitcode.com/datagallery/dataagent#%F0%9F%8C%90-a2a-10-%E6%9C%8D%E5%8A%A1%E6%A8%A1%E5%BC%8F) and start DataAgent in A2A service mode.
-   > Nexent does not currently support agents that require authentication. Do not set `auth-token` when starting DataAgent.
-
-<div style="display: flex; justify-content: left;">
-  <img src="./assets/agent-development/dataagent_deploy.png" style="width: 80%; height: auto;" />
-</div>
-
-2. Refer to [Discover Agent via URL](#discover-agent-via-url) to integrate the agent. The URL is `http://<IP>:9999/.well-known/agent-card.json`.
-3. Refer to [Manage Discovered External Agents](#manage-discovered-external-agents) to configure the invocation protocol, and select HTTP + JSON for integration.
-
 ### 🛠️ Select Agent Tools
 
 Agents can use various tools to complete tasks, such as knowledge base search, file parsing, image parsing, email sending/receiving, file management, and other local tools. They can also integrate third-party MCP tools or custom tools.
diff --git a/doc/docs/en/user-guide/assets/agent-development/dataagent_deploy.png b/doc/docs/en/user-guide/assets/agent-development/dataagent_deploy.png
deleted file mode 100644
index 46fa9fde3..000000000
Binary files a/doc/docs/en/user-guide/assets/agent-development/dataagent_deploy.png and /dev/null differ
diff --git a/doc/docs/zh/quick-start/installation.md b/doc/docs/zh/quick-start/installation.md
index 6d3538b90..871cae0cc 100644
--- a/doc/docs/zh/quick-start/installation.md
+++ b/doc/docs/zh/quick-start/installation.md
@@ -269,111 +269,6 @@ Provider 启用规则：
 
 本地默认回调示例为 `http://localhost:3000/api/user/oauth/callback?provider=github`。生产环境应改为公网 HTTPS 域名，例如 `https://nexent.example.com/api/user/oauth/callback?provider=github`，并在 OAuth provider 控制台中登记相同地址。
 
-### CAS 登录配置
-
-CAS SSO 不依赖 `supabase`。启用 CAS 时，请将 `CAS_CALLBACK_BASE_URL` 设置为浏览器可访问的 Nexent Web 地址，且不要带结尾 `/`。`CAS_SERVER_URL` 是 CAS Server 根地址，也不要带结尾 `/`。
-
-Docker 部署在 `docker/.env` 中配置 CAS：
-
-```bash
-CAS_ENABLED=true
-CAS_SERVER_URL=http://localhost:8080/cas
-CAS_VALIDATE_PATH=/p3/serviceValidate
-CAS_CALLBACK_BASE_URL=http://localhost:3000
-
-# disabled: 禁用 CAS 登录入口和自动跳转
-# button: 在登录页显示 CAS 登录按钮
-# force: 未登录访问 Nexent 时自动跳转到 CAS
-CAS_LOGIN_MODE=force
-
-# 为空时使用 <cas:user>；填写 userName 时从 <cas:attributes><cas:userName> 取用户标识
-CAS_USER_ATTRIBUTE=
-CAS_EMAIL_ATTRIBUTE=email
-CAS_ROLE_ATTRIBUTE=role
-CAS_TENANT_ATTRIBUTE=tenant_id
-CAS_ROLE_MAP_JSON={"cas-admin":"ADMIN","cas-user":"USER"}
-CAS_SESSION_MAX_AGE_SECONDS=3600
-LOCAL_SESSION_MAX_AGE_SECONDS=3600
-CAS_RENEW_BEFORE_SECONDS=300
-CAS_RENEW_TIMEOUT_SECONDS=10
-CAS_SYNTHETIC_EMAIL_DOMAIN=cas.local
-
-# 为空时 Nexent 主动退出不会调用 CAS Server 登出接口。
-# 可配置为 /logout，系统会基于 CAS_SERVER_URL 拼接。
-CAS_LOGOUT_URL=/logout
-CAS_SSL_VERIFY=true
-CAS_CA_BUNDLE=
-```
-
-常用 CAS 地址：
-
-| 用途 | 地址 |
-|------|------|
-| Nexent 登录入口 | `{CAS_CALLBACK_BASE_URL}/api/user/cas/login?redirect=/` |
-| CAS service 回调 | `{CAS_CALLBACK_BASE_URL}/api/user/cas/callback` |
-| CAS 无感续期回调 | `{CAS_CALLBACK_BASE_URL}/api/user/cas/renew_callback` |
-| CAS 单点登出回调 | `POST {CAS_CALLBACK_BASE_URL}/api/user/cas/logout_callback` |
-
-Apereo CAS 使用 JSON Service Registry 时，可以新增一个服务注册文件，例如 `Nexent-10001.json`。文件需要放到 CAS 部署配置的 service registry 目录中，`id` 必须全局唯一。下面是本地 Docker 示例：
-
-```json
-{
-  "@class": "org.apereo.cas.services.RegexRegisteredService",
-  "serviceId": "http://localhost:3000.*",
-  "name": "Nexent CAS Client",
-  "id": 10001,
-  "description": "Nexent CAS SSO client",
-  "evaluationOrder": 1,
-  "logoutType": "BACK_CHANNEL",
-  "logoutUrl": "http://localhost:3000/api/user/cas/logout_callback"
-}
-```
-
-生产环境建议保持 `CAS_SSL_VERIFY=true`；自签名证书优先配置 `CAS_CA_BUNDLE`，仅本地验证时再临时设置 `CAS_SSL_VERIFY=false`。
-
-#### CAS对接ModelEngine
-当使用CAS协议对接ModelEngine时，可以使用如下配置部署Nexent：
-```bash
-CAS_ENABLED=true
-CAS_SERVER_URL=https://<ModelEngine IP>:5443/SSOSvr
-CAS_VALIDATE_PATH=/p3/serviceValidate
-CAS_CALLBACK_BASE_URL=http://<Nexent IP>:3000
-CAS_LOGIN_MODE=force
-CAS_USER_ATTRIBUTE=userName
-CAS_EMAIL_ATTRIBUTE=email
-CAS_ROLE_ATTRIBUTE=userType
-CAS_TENANT_ATTRIBUTE=tenant_id
-CAS_ROLE_MAP_JSON={"1":"ADMIN","3":"DEV"}
-CAS_SESSION_MAX_AGE_SECONDS=3600
-LOCAL_SESSION_MAX_AGE_SECONDS=3600
-CAS_RENEW_BEFORE_SECONDS=300
-CAS_RENEW_TIMEOUT_SECONDS=10
-CAS_SYNTHETIC_EMAIL_DOMAIN=cas.local
-CAS_LOGOUT_URL=/logout?service=http://<Nexent IP>:3000
-CAS_SSL_VERIFY=false
-CAS_CA_BUNDLE=
-```
-
-同时，需要进入oms容器添加cas client的注册配置文件，参考如下步骤：
-```bash
-# 创建注册配置文件，将json部分输入文件并保存
-vim Nexent-10000001.json
-{
-  "@class": "org.apereo.cas.services.CasRegisteredService",
-  "serviceId": "http://<Nexent IP>:3000.*",
-  "name": "Nexent CAS Client",
-  "id": 1000001,
-  "description": "Nexent CAS SSO client",
-  "evaluationOrder": 1,
-  "logoutType": "BACK_CHANNEL",
-  "logoutUrl": "http://<Nexent IP>:3000/api/user/cas/logout_callback"
-}
-
-# 执行如下命令，将配置文件拷贝到容器中
-kubectl cp Nexent-10000001.json model-engine/$(kubectl get pods -n model-engine -l app=oms --no-headers | awk '{print $1}'):/opt/huawei/fce/apps/platform/webapps/SSOSvr/WEB-INF/classes/services/Nexent-10000001.json
-kubectl exec -i -n model-engine $(kubectl get pods -n model-engine -l app=oms --no-headers | awk '{print $1}') -- chown tomcat:fusioncube /opt/huawei/fce/apps/platform/webapps/SSOSvr/WEB-INF/classes/services/Nexent-10000001.json
-```
-
 ### 北向接口配置 (NORTHBOUND_EXTERNAL_URL)
 
 如果您需要使用以下功能，需要配置 `NORTHBOUND_EXTERNAL_URL` 环境变量：
diff --git a/doc/docs/zh/quick-start/kubernetes-installation.md b/doc/docs/zh/quick-start/kubernetes-installation.md
index 7229f1ea8..47d2af816 100644
--- a/doc/docs/zh/quick-start/kubernetes-installation.md
+++ b/doc/docs/zh/quick-start/kubernetes-installation.md
@@ -291,122 +291,6 @@ Provider 回调地址：
 
 本地 NodePort 默认回调示例为 `http://localhost:30000/api/user/oauth/callback?provider=github`。生产环境应改为公网 HTTPS 域名，并在 OAuth provider 控制台中登记相同地址。
 
-### CAS 登录配置
-
-CAS SSO 不依赖 `supabase`。启用 CAS 时，请将 `nexent-common.config.cas.callbackBaseUrl` 设置为浏览器可访问的 Nexent Web 地址，且不要带结尾 `/`。`nexent-common.config.cas.serverUrl` 是 CAS Server 根地址，也不要带结尾 `/`。
-
-Kubernetes 部署通过 `nexent-common` 的 `config.cas.*` values 写入后端环境变量：
-
-```bash
-helm upgrade --install nexent nexent \
-  --namespace nexent --create-namespace \
-  --set nexent-common.config.cas.enabled=true \
-  --set nexent-common.config.cas.serverUrl=https://cas.example.com/cas \
-  --set nexent-common.config.cas.callbackBaseUrl=https://nexent.example.com \
-  --set nexent-common.config.cas.loginMode=force \
-  --set nexent-common.config.cas.logoutUrl=/logout
-```
-
-可配置的 CAS values：
-
-| Values | 对应环境变量 | 说明 |
-|--------|--------------|------|
-| `nexent-common.config.cas.enabled` | `CAS_ENABLED` | 是否启用 CAS |
-| `nexent-common.config.cas.serverUrl` | `CAS_SERVER_URL` | CAS Server 根地址 |
-| `nexent-common.config.cas.validatePath` | `CAS_VALIDATE_PATH` | serviceValidate 路径，默认 `/p3/serviceValidate` |
-| `nexent-common.config.cas.callbackBaseUrl` | `CAS_CALLBACK_BASE_URL` | Web 入口地址，CAS 回调路径会自动拼接 |
-| `nexent-common.config.cas.loginMode` | `CAS_LOGIN_MODE` | `disabled`、`button` 或 `force` |
-| `nexent-common.config.cas.userAttribute` | `CAS_USER_ATTRIBUTE` | 用户标识属性。为空时使用 `<cas:user>` |
-| `nexent-common.config.cas.emailAttribute` | `CAS_EMAIL_ATTRIBUTE` | 邮箱属性 |
-| `nexent-common.config.cas.roleAttribute` | `CAS_ROLE_ATTRIBUTE` | 角色属性 |
-| `nexent-common.config.cas.tenantAttribute` | `CAS_TENANT_ATTRIBUTE` | 租户属性 |
-| `nexent-common.config.cas.roleMapJson` | `CAS_ROLE_MAP_JSON` | CAS 角色到 Nexent 角色的 JSON 映射 |
-| `nexent-common.config.cas.sessionMaxAgeSeconds` | `CAS_SESSION_MAX_AGE_SECONDS` | CAS 本地会话最长有效期 |
-| `nexent-common.config.cas.localSessionMaxAgeSeconds` | `LOCAL_SESSION_MAX_AGE_SECONDS` | Nexent 本地会话有效期 |
-| `nexent-common.config.cas.renewBeforeSeconds` | `CAS_RENEW_BEFORE_SECONDS` | 距离过期多少秒内触发无感续期 |
-| `nexent-common.config.cas.renewTimeoutSeconds` | `CAS_RENEW_TIMEOUT_SECONDS` | 无感续期等待超时时间 |
-| `nexent-common.config.cas.syntheticEmailDomain` | `CAS_SYNTHETIC_EMAIL_DOMAIN` | CAS 未返回邮箱时生成邮箱使用的域名 |
-| `nexent-common.config.cas.logoutUrl` | `CAS_LOGOUT_URL` | CAS 登出地址。为空时 Nexent 主动退出不调用 CAS Server 登出接口 |
-| `nexent-common.config.cas.sslVerify` | `CAS_SSL_VERIFY` | 访问 CAS Server 时是否校验证书 |
-| `nexent-common.config.cas.caBundle` | `CAS_CA_BUNDLE` | 自定义 CA bundle 路径 |
-
-常用 CAS 地址：
-
-| 用途 | 地址 |
-|------|------|
-| Nexent 登录入口 | `{CAS_CALLBACK_BASE_URL}/api/user/cas/login?redirect=/` |
-| CAS service 回调 | `{CAS_CALLBACK_BASE_URL}/api/user/cas/callback` |
-| CAS 无感续期回调 | `{CAS_CALLBACK_BASE_URL}/api/user/cas/renew_callback` |
-| CAS 单点登出回调 | `POST {CAS_CALLBACK_BASE_URL}/api/user/cas/logout_callback` |
-
-Apereo CAS 使用 JSON Service Registry 时，可以新增一个服务注册文件，例如 `Nexent-10001.json`。文件需要放到 CAS 部署配置的 service registry 目录中，`id` 必须全局唯一。本地 NodePort 示例：
-
-```json
-{
-  "@class": "org.apereo.cas.services.RegexRegisteredService",
-  "serviceId": "http://localhost:30000.*",
-  "name": "Nexent CAS Client",
-  "id": 10001,
-  "description": "Nexent CAS SSO client",
-  "evaluationOrder": 1,
-  "logoutType": "BACK_CHANNEL",
-  "logoutUrl": "http://localhost:30000/api/user/cas/logout_callback"
-}
-```
-
-生产环境建议保持 `CAS_SSL_VERIFY=true`；自签名证书优先配置 `CAS_CA_BUNDLE`，仅本地验证时再临时设置 `CAS_SSL_VERIFY=false`。
-
-#### CAS 对接 ModelEngine
-
-当使用 CAS 协议对接 ModelEngine 时，建议通过 values 文件配置 Nexent，避免 `CAS_ROLE_MAP_JSON` 在命令行中转义复杂。
-
-创建 `cas-modelengine-values.yaml`：
-
-```yaml
-nexent-common:
-  config:
-    cas:
-      enabled: true
-      serverUrl: "https://<ModelEngine IP>:5443/SSOSvr"
-      validatePath: "/p3/serviceValidate"
-      callbackBaseUrl: "http://<Nexent IP>:30000"
-      loginMode: "force"
-      userAttribute: "userName"
-      emailAttribute: "email"
-      roleAttribute: "userType"
-      tenantAttribute: "tenant_id"
-      roleMapJson: '{"1":"ADMIN","3":"DEV"}'
-      sessionMaxAgeSeconds: 3600
-      localSessionMaxAgeSeconds: 3600
-      renewBeforeSeconds: 300
-      renewTimeoutSeconds: 10
-      syntheticEmailDomain: "cas.local"
-      logoutUrl: "/logout?service=http://<Nexent IP>:30000"
-      sslVerify: false
-      caBundle: ""
-```
-
-同时，需要进入 OMS 容器添加 CAS client 的注册配置文件，参考如下步骤：
-
-```bash
-# 创建注册配置文件，将 JSON 部分输入文件并保存
-vim Nexent-10000001.json
-{
-  "@class": "org.apereo.cas.services.CasRegisteredService",
-  "serviceId": "http://<Nexent IP>:30000.*",
-  "name": "Nexent CAS Client",
-  "id": 1000001,
-  "description": "Nexent CAS SSO client",
-  "evaluationOrder": 1,
-  "logoutType": "BACK_CHANNEL",
-  "logoutUrl": "http://<Nexent IP>:30000/api/user/cas/logout_callback"
-}
-
-# 执行如下命令，将配置文件拷贝到容器中
-kubectl cp Nexent-10000001.json model-engine/$(kubectl get pods -n model-engine -l app=oms --no-headers | awk '{print $1}'):/opt/huawei/fce/apps/platform/webapps/SSOSvr/WEB-INF/classes/services/Nexent-10000001.json
-kubectl exec -i -n model-engine $(kubectl get pods -n model-engine -l app=oms --no-headers | awk '{print $1}') -- chown tomcat:fusioncube /opt/huawei/fce/apps/platform/webapps/SSOSvr/WEB-INF/classes/services/Nexent-10000001.json
-```
-
 ## 🔍 故障排查
 
 ### 查看 Pod 状态
diff --git a/doc/docs/zh/sdk/vector-database.md b/doc/docs/zh/sdk/vector-database.md
index b940400fd..940af9c33 100644
--- a/doc/docs/zh/sdk/vector-database.md
+++ b/doc/docs/zh/sdk/vector-database.md
@@ -579,11 +579,7 @@ python -m nexent.service.vectordatabase_service
   - 参数:
     - `index_name`: 索引名称 (路径参数)
     - `path_or_url`: 文档路径或URL (查询参数)
-    - `scope`: 删除范围 (查询参数，默认 `full`)
-      - `source_only`: 仅删除 MinIO 源文件，保留 ES 中的切片与向量（检索仍可用，预览不可用）
-      - `full`: 删除 ES 文档、MinIO 源文件，并清理相关 Redis 任务记录
-  - 返回示例 (`source_only`): `{"status": "success", "scope": "source_only", "deleted_es_count": 0, "deleted_minio": true, "source_available": false}`
-  - 返回示例 (`full`): `{"status": "success", "scope": "full", "deleted_es_count": 5, "deleted_minio": true}`
+  - 返回示例: `{"status": "success", "deleted_count": 1}`
 
 #### 搜索操作
 
@@ -732,11 +728,8 @@ curl -X POST "http://localhost:8000/indices/search/hybrid" \
     "weight_accurate": 0.3
   }'
 
-# 删除源文件（保留索引）
-curl -X DELETE "http://localhost:8000/indices/my_documents/documents?path_or_url=knowledge_base/doc1.pdf&scope=source_only"
-
-# 从知识库彻底移除文档
-curl -X DELETE "http://localhost:8000/indices/my_documents/documents?path_or_url=knowledge_base/doc1.pdf&scope=full"
+# 删除文档
+curl -X DELETE "http://localhost:8000/indices/my_documents/documents?path_or_url=https://example.com/doc1"
 
 # 创建索引
 curl -X POST "http://localhost:8000/indices/my_documents"
diff --git a/doc/docs/zh/user-guide/agent-development.md b/doc/docs/zh/user-guide/agent-development.md
index 40805aeea..3edf31de7 100644
--- a/doc/docs/zh/user-guide/agent-development.md
+++ b/doc/docs/zh/user-guide/agent-development.md
@@ -113,17 +113,6 @@ Nexent 支持通过 A2A 协议与第三方 Agent 进行通信。您可以通过
 > - 通过 Nacos 发现批量接入同一服务注册中心的所有 Agent
 > - 配置协议以兼容不同 Agent 服务提供商的要求
 
-
-###### 通过URL对接[DataAgent](https://gitcode.com/datagallery/dataagent) A2A Agent
-1. 参考[DataAgent文档](https://gitcode.com/datagallery/dataagent#%F0%9F%8C%90-a2a-10-%E6%9C%8D%E5%8A%A1%E6%A8%A1%E5%BC%8F)以A2A服务模式启动DataAgent
-   >当前Nexent不支持带认证的agent，启动DataAgent时请勿设置auth-token
-<div style="display: flex; justify-content: left;">
-  <img src="./assets/agent-development/dataagent_deploy.png" style="width: 80%; height: auto;" />
-</div>
-
-2. 参考[通过 URL 发现 Agent](#通过-url-发现-agent)接入agent，url为http://\<IP\>:9999/.well-known/agent-card.json
-3. 参考[管理已发现的外部 Agent](#管理已发现的外部-agent)配置调用协议，选择HTTP+JSON方式接入
-
 ### 🛠️ 选择智能体的工具
 
 智能体可以使用各种工具来完成任务，如知识库检索、文件解析、图片解析、收发邮件、文件管理等本地工具，也可接入第三方 MCP 工具，或自定义工具。
diff --git a/doc/docs/zh/user-guide/assets/agent-development/dataagent_deploy.png b/doc/docs/zh/user-guide/assets/agent-development/dataagent_deploy.png
deleted file mode 100644
index 46fa9fde3..000000000
Binary files a/doc/docs/zh/user-guide/assets/agent-development/dataagent_deploy.png and /dev/null differ
diff --git a/doc/procedural-memory-verification.md b/doc/procedural-memory-verification.md
deleted file mode 100644
index ea9f53290..000000000
--- a/doc/procedural-memory-verification.md
+++ /dev/null
@@ -1,315 +0,0 @@
-# Procedural Memory Verification Report
-
-## Summary
-**Status: ⚠️ FULLY SUPPORTED but REQUIRES OPTIONAL DEPENDENCY**
-
-Procedural memory is a fully implemented feature in mem0ai version 0.1.117, **BUT it requires `langchain-core` to be installed separately**. Without this dependency, the feature will fail at runtime.
-
----
-
-## ⚠️ CRITICAL FINDING: Optional Dependency Required
-
-**Your colleague is partially correct.** The procedural memory code is NOT empty (it's 50 lines of real implementation), but it has a critical dependency issue:
-
-### The Problem
-
-The `_create_procedural_memory()` method contains:
-
-```python
-try:
-    from langchain_core.messages.utils import convert_to_messages
-except Exception:
-    logger.error(
-        "Import error while loading langchain-core. "
-        "Please install 'langchain-core' to use procedural memory."
-    )
-    raise  # ← Fails here if langchain-core not installed
-```
-
-### Reality Check
-
-| Aspect | Status |
-|--------|--------|
-| Code exists? | ✅ Yes, 50 lines of real implementation |
-| Code is empty/stub? | ❌ No, it's fully implemented |
-| Works out of the box? | ❌ **NO** - requires `langchain-core` package |
-| Documented requirement? | ⚠️ Only in error message, not in main docs |
-
-### Why Your Colleague Thought It Was Empty
-
-1. They called `memory.add(..., memory_type="procedural_memory")`
-2. Got `ImportError: No module named 'langchain_core'`
-3. Saw the error and concluded "it doesn't work" or "it's empty"
-4. This is understandable - the feature exists but is **disabled by default**
-
----
-
-## Verification Results
-
-### 1. API Support ✅
-The `memory_type` parameter is available in both `AsyncMemory.add()` and `Memory.add()`:
-
-```python
-async def add(
-    self,
-    messages,
-    *,
-    user_id: Optional[str] = None,
-    agent_id: Optional[str] = None,
-    run_id: Optional[str] = None,
-    metadata: Optional[Dict[str, Any]] = None,
-    infer: bool = True,
-    memory_type: Optional[str] = None,  # ✅ SUPPORTED
-    prompt: Optional[str] = None,
-    llm=None
-)
-```
-
-### 2. MemoryType Enum ✅
-Located in `mem0.configs.enums.MemoryType`:
-
-```python
-class MemoryType(Enum):
-    SEMANTIC = "semantic_memory"
-    EPISODIC = "episodic_memory"
-    PROCEDURAL = "procedural_memory"  # ✅ AVAILABLE
-```
-
-### 3. Implementation ✅
-The `_create_procedural_memory()` method exists in both `AsyncMemory` and `Memory` classes:
-
-**AsyncMemory signature:**
-```python
-async def _create_procedural_memory(
-    self,
-    messages,
-    metadata=None,
-    llm=None,
-    prompt=None
-)
-```
-
-**Memory (sync) signature:**
-```python
-def _create_procedural_memory(
-    self,
-    messages,
-    metadata=None,
-    prompt=None
-)
-```
-
-### 4. Validation Logic ✅
-The `add()` method validates `memory_type` and enforces constraints:
-
-```python
-# Only "procedural_memory" is accepted
-if memory_type is not None and memory_type != MemoryType.PROCEDURAL.value:
-    raise ValueError(
-        f"Invalid 'memory_type'. Please pass {MemoryType.PROCEDURAL.value} "
-        "to create procedural memories."
-    )
-
-# agent_id is REQUIRED for procedural memory
-if agent_id is not None and memory_type == MemoryType.PROCEDURAL.value:
-    results = await self._create_procedural_memory(
-        messages, metadata=processed_metadata, prompt=prompt, llm=llm
-    )
-    return results
-```
-
-### 5. System Prompt ✅
-A comprehensive 5,100-character system prompt exists in `mem0.configs.prompts.PROCEDURAL_MEMORY_SYSTEM_PROMPT`:
-
-**Purpose:** Records and preserves complete interaction history between human and AI agent
-
-**Structure:**
-- Overview (Global Metadata)
-  - Task Objective
-  - Progress Status
-- Sequential Agent Actions (Numbered Steps)
-  - Agent Action
-  - Action Result (Mandatory, Unmodified)
-  - Embedded Metadata (Key Findings, Navigation History, Errors, Current Context)
-
-**Key Guidelines:**
-1. Preserve every output verbatim
-2. Maintain chronological order
-3. Include exact data (URLs, element indexes, error messages, JSON responses)
-4. Output only the structured summary
-
----
-
-## Usage Example
-
-```python
-from mem0 import AsyncMemory
-
-# Initialize memory
-memory = await AsyncMemory.from_config(config)
-
-# Create procedural memory
-messages = [
-    {"role": "user", "content": "Search for AI news"},
-    {"role": "assistant", "content": "I'll search for recent AI news..."},
-    # ... more conversation history
-]
-
-result = await memory.add(
-    messages=messages,
-    user_id="user_123",
-    agent_id="research_agent",  # ⚠️ REQUIRED for procedural memory
-    memory_type="procedural_memory",
-    metadata={
-        "task": "AI news research",
-        "session_id": "session_456"
-    }
-)
-
-# Result format:
-# {
-#     "results": [
-#         {
-#             "id": "memory_id_here",
-#             "memory": "## Summary of the agent's execution history...",
-#             "event": "ADD"
-#         }
-#     ]
-# }
-```
-
----
-
-## Requirements & Constraints
-
-### Required Parameters
-- ✅ `agent_id`: **MUST** be provided when using `memory_type="procedural_memory"`
-- ✅ `metadata`: **MUST** be provided (cannot be None)
-- ✅ `messages`: List of conversation messages to summarize
-
-### Optional Parameters
-- `prompt`: Custom prompt to override default `PROCEDURAL_MEMORY_SYSTEM_PROMPT`
-- `llm`: Custom LangChain ChatModel (async version only)
-
-### Validation Rules
-1. `memory_type` must be exactly `"procedural_memory"` (or None)
-2. If `memory_type="procedural_memory"` is set, `agent_id` must be provided
-3. `metadata` cannot be None for procedural memories
-
----
-
-## Implementation Details
-
-### How It Works
-1. **Validation**: Checks `memory_type` and required parameters
-2. **Prompt Construction**: Uses default or custom system prompt
-3. **LLM Summarization**: Calls LLM to generate comprehensive execution summary
-4. **Embedding**: Generates embedding for the summary
-5. **Storage**: Stores in vector database with `metadata["memory_type"] = "procedural_memory"`
-6. **Return**: Returns memory ID and summary text
-
-### Async vs Sync
-- **AsyncMemory**: Supports custom LangChain `llm` parameter
-- **Memory**: Uses internal LLM from config only
-
----
-
-## Integration with Nexent
-
-### Current Status
-The Nexent codebase does **NOT** currently use procedural memory. The `memory_type` parameter is not passed in any `add_memory()` calls.
-
-### Recommended Integration Points
-
-1. **Agent Service** (`backend/services/agent_service.py`):
-   - Detect when agent completes a multi-step task
-   - Call `add_memory_in_levels()` with `memory_type="procedural_memory"`
-   - Pass the full conversation history as messages
-
-2. **Memory Service** (`sdk/nexent/memory/memory_service.py`):
-   - Add `memory_type` parameter to `add_memory()` and `add_memory_in_levels()`
-   - Pass through to mem0's `add()` method
-
-3. **Agent Run Info** (`sdk/nexent/core/agents/agent_model.py`):
-   - Add `memory_type` field to track if current run should create procedural memory
-
-### Example Integration
-
-```python
-# In agent_service.py, after agent completes a complex task
-if task_complexity >= threshold:  # Your logic here
-    await add_memory_in_levels(
-        messages=conversation_history,
-        memory_config=memory_ctx.memory_config,
-        tenant_id=memory_ctx.tenant_id,
-        user_id=memory_ctx.user_id,
-        agent_id=memory_ctx.agent_id,
-        memory_levels=["agent", "user_agent"],
-        memory_type="procedural_memory",  # ✅ NEW PARAMETER
-        metadata={
-            "task_type": "complex_research",
-            "duration_seconds": duration,
-            "steps_completed": step_count
-        }
-    )
-```
-
----
-
-## Conclusion
-
-Procedural memory is a **fully functional feature** in mem0ai==0.1.117, **BUT it requires an optional dependency**. It provides:
-
-- ✅ Complete API support
-- ✅ Comprehensive system prompt (5,100 characters)
-- ✅ Proper validation and error handling
-- ✅ Both sync and async implementations
-- ✅ Integration with existing memory infrastructure
-- ⚠️ **REQUIRES `langchain-core` package to be installed**
-
-### The Truth About "Empty Function" Claims
-
-**The code is NOT empty.** It's a 50-line implementation that:
-1. Calls LLM to generate execution summary
-2. Creates embeddings
-3. Stores in vector database
-4. Returns proper results
-
-**However, it fails at runtime** if `langchain-core` is not installed, which is why your colleague might have thought it was a no-op.
-
-### How to Enable
-
-**Option 1: Install the dependency**
-```bash
-pip install langchain-core
-```
-
-**Option 2: Add to Nexent's dependencies**
-```toml
-# In sdk/pyproject.toml
-dependencies = [
-    # ... existing deps ...
-    "langchain-core>=0.1.0",  # Required for procedural memory
-]
-```
-
-**Option 3: Make it optional with fallback**
-```python
-try:
-    result = await memory.add(..., memory_type="procedural_memory")
-except ImportError as e:
-    if "langchain-core" in str(e):
-        logger.warning("Procedural memory requires langchain-core. Using regular memory.")
-        result = await memory.add(...)  # Fallback
-    else:
-        raise
-```
-
-### Final Recommendation
-
-This feature **can be integrated into Nexent**, but you must:
-1. Add `langchain-core` to dependencies, OR
-2. Implement graceful fallback when dependency is missing, OR
-3. Document it as an optional feature requiring extra installation
-
-Without addressing the dependency issue, procedural memory will fail at runtime despite having complete implementation code.
diff --git a/docker/.env.example b/docker/.env.example
index 3970efb95..c34300523 100644
--- a/docker/.env.example
+++ b/docker/.env.example
@@ -226,27 +226,3 @@ OAUTH_CALLBACK_BASE_URL=http://localhost:3000
 
 # Asset owner role (opt-in; default false). Set true to enable ASSET_OWNER.
 ENABLE_ASSET_OWNER_ROLE=false
-
-# ===== CAS SSO Configuration =====
-CAS_ENABLED=false
-CAS_SERVER_URL=
-CAS_VALIDATE_PATH=/p3/serviceValidate
-CAS_CALLBACK_BASE_URL=http://localhost:3000
-# Supported values:
-# - disabled: disable CAS login entry and automatic CAS redirects.
-# - button: show CAS as an optional login entry.
-# - force: automatically redirect unauthenticated users to CAS login.
-CAS_LOGIN_MODE=disabled
-CAS_USER_ATTRIBUTE=
-CAS_EMAIL_ATTRIBUTE=email
-CAS_ROLE_ATTRIBUTE=role
-CAS_TENANT_ATTRIBUTE=tenant_id
-CAS_ROLE_MAP_JSON=
-CAS_SESSION_MAX_AGE_SECONDS=3600
-LOCAL_SESSION_MAX_AGE_SECONDS=3600
-CAS_RENEW_BEFORE_SECONDS=300
-CAS_RENEW_TIMEOUT_SECONDS=10
-CAS_SYNTHETIC_EMAIL_DOMAIN=cas.local
-CAS_LOGOUT_URL=/logout
-CAS_SSL_VERIFY=true
-CAS_CA_BUNDLE=
diff --git a/docker/deploy.sh b/docker/deploy.sh
index fbf3664b5..2069330d1 100755
--- a/docker/deploy.sh
+++ b/docker/deploy.sh
@@ -1367,7 +1367,7 @@ main_deploy() {
   echo "--------------------------------"
   echo ""
 
-  APP_VERSION="$(get_app_version)"
+  APP_VERSION="latest"
   if [ -z "$APP_VERSION" ]; then
     echo "❌ Failed to get app version, please check the backend/consts/const.py file"
     exit 1
diff --git a/docker/init.sql b/docker/init.sql
index 046bdecf1..0668def01 100644
--- a/docker/init.sql
+++ b/docker/init.sql
@@ -230,7 +230,6 @@ CREATE TABLE IF NOT EXISTS "knowledge_record_t" (
   "summary_frequency" varchar(10) COLLATE "pg_catalog"."default",
   "last_summary_time" timestamp(0),
   "last_doc_update_time" timestamp(0),
-  "preserve_source_file" boolean NOT NULL DEFAULT true,
   CONSTRAINT "knowledge_record_t_pk" PRIMARY KEY ("knowledge_id")
 );
 ALTER TABLE "knowledge_record_t" OWNER TO "root";
@@ -252,7 +251,6 @@ COMMENT ON COLUMN "knowledge_record_t"."created_by" IS 'User who created the rec
 COMMENT ON COLUMN "knowledge_record_t"."summary_frequency" IS 'Auto-summary frequency: 1h, 3h, 6h, 1d, 1w, or NULL (disabled)';
 COMMENT ON COLUMN "knowledge_record_t"."last_summary_time" IS 'Timestamp of last summary generation';
 COMMENT ON COLUMN "knowledge_record_t"."last_doc_update_time" IS 'Timestamp of last document add/delete operation, used for auto-summary optimization to skip unnecessary summary regeneration';
-COMMENT ON COLUMN "knowledge_record_t"."preserve_source_file" IS 'Whether to preserve uploaded source documents after vectorization';
 COMMENT ON COLUMN "knowledge_record_t"."updated_by" IS 'Last updater ID, audit field';
 COMMENT ON COLUMN "knowledge_record_t"."created_by" IS 'Creator ID, audit field';
 COMMENT ON TABLE "knowledge_record_t" IS 'Records knowledge base description and status information';
@@ -339,12 +337,9 @@ CREATE TABLE IF NOT EXISTS nexent.ag_tenant_agent_t (
     is_new BOOLEAN DEFAULT FALSE,
     provide_run_summary BOOLEAN DEFAULT FALSE,
     enable_context_manager BOOLEAN DEFAULT FALSE,
-    verification_config JSONB,
     version_no INTEGER DEFAULT 0 NOT NULL,
     current_version_no INTEGER NULL,
     ingroup_permission VARCHAR(30),
-    greeting_message TEXT,
-    example_questions JSONB,
     create_time TIMESTAMP WITHOUT TIME ZONE DEFAULT CURRENT_TIMESTAMP,
     update_time TIMESTAMP WITHOUT TIME ZONE DEFAULT CURRENT_TIMESTAMP,
     created_by VARCHAR(100),
@@ -402,9 +397,6 @@ COMMENT ON COLUMN nexent.ag_tenant_agent_t.version_no IS 'Version number. 0 = dr
 COMMENT ON COLUMN nexent.ag_tenant_agent_t.current_version_no IS 'Current published version number. NULL means no version published yet';
 COMMENT ON COLUMN nexent.ag_tenant_agent_t.ingroup_permission IS 'In-group permission: EDIT, READ_ONLY, PRIVATE';
 COMMENT ON COLUMN nexent.ag_tenant_agent_t.enable_context_manager IS 'Whether to enable context management (compression) for this agent';
-COMMENT ON COLUMN nexent.ag_tenant_agent_t.verification_config IS 'Layered ReAct self-verification configuration';
-COMMENT ON COLUMN nexent.ag_tenant_agent_t.greeting_message IS 'Agent greeting message displayed on chat initial screen';
-COMMENT ON COLUMN nexent.ag_tenant_agent_t.example_questions IS 'List of example questions for starting a conversation with this agent';
 
 -- Create index for is_new queries
 CREATE INDEX IF NOT EXISTS idx_ag_tenant_agent_t_is_new
@@ -723,7 +715,6 @@ CREATE TABLE IF NOT EXISTS nexent.ag_agent_relation_t (
     parent_agent_id INTEGER,
     tenant_id VARCHAR(100),
     version_no INTEGER DEFAULT 0 NOT NULL,
-    selected_agent_version_no INTEGER,
     create_time TIMESTAMP WITHOUT TIME ZONE DEFAULT CURRENT_TIMESTAMP,
     update_time TIMESTAMP WITHOUT TIME ZONE DEFAULT CURRENT_TIMESTAMP,
     created_by VARCHAR(100),
@@ -756,7 +747,6 @@ COMMENT ON COLUMN nexent.ag_agent_relation_t.selected_agent_id IS 'Selected agen
 COMMENT ON COLUMN nexent.ag_agent_relation_t.parent_agent_id IS 'Parent agent ID';
 COMMENT ON COLUMN nexent.ag_agent_relation_t.tenant_id IS 'Tenant ID';
 COMMENT ON COLUMN nexent.ag_agent_relation_t.version_no IS 'Version number. 0 = draft/editing state, >=1 = published snapshot';
-COMMENT ON COLUMN nexent.ag_agent_relation_t.selected_agent_version_no IS 'Pinned version of selected_agent_id. NULL = use child current published version at runtime (legacy/draft).';
 COMMENT ON COLUMN nexent.ag_agent_relation_t.create_time IS 'Creation time, audit field';
 COMMENT ON COLUMN nexent.ag_agent_relation_t.update_time IS 'Update time, audit field';
 COMMENT ON COLUMN nexent.ag_agent_relation_t.created_by IS 'Creator ID, audit field';
@@ -1270,6 +1260,7 @@ CREATE TABLE IF NOT EXISTS nexent.ag_skill_info_t (
     config_schemas JSON,
     config_values JSON,
     source VARCHAR(30) DEFAULT 'official',
+    tenant_id VARCHAR(100),
     created_by VARCHAR(100),
     create_time TIMESTAMP WITHOUT TIME ZONE DEFAULT CURRENT_TIMESTAMP,
     updated_by VARCHAR(100),
@@ -1909,31 +1900,3 @@ FOR EACH ROW
 EXECUTE FUNCTION update_mcp_community_record_update_time();
 
 COMMENT ON TRIGGER update_mcp_community_record_update_time_trigger ON nexent.mcp_community_record_t IS 'Trigger to maintain update_time';
-
-CREATE TABLE IF NOT EXISTS nexent.user_cas_session_t (
-    cas_session_id SERIAL PRIMARY KEY,
-    session_id VARCHAR(100) NOT NULL UNIQUE,
-    user_id VARCHAR(100) NOT NULL,
-    cas_user_id VARCHAR(200) NOT NULL,
-    cas_session_index VARCHAR(500),
-    status VARCHAR(30) NOT NULL DEFAULT 'active',
-    expires_at TIMESTAMP NOT NULL,
-    revoked_at TIMESTAMP,
-    create_time TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
-    update_time TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
-    created_by VARCHAR(100),
-    updated_by VARCHAR(100),
-    delete_flag VARCHAR(1) DEFAULT 'N'
-);
-
-CREATE INDEX IF NOT EXISTS ix_user_cas_session_session_id
-    ON nexent.user_cas_session_t (session_id);
-CREATE INDEX IF NOT EXISTS ix_user_cas_session_user_id
-    ON nexent.user_cas_session_t (user_id);
-CREATE INDEX IF NOT EXISTS ix_user_cas_session_cas_user_id
-    ON nexent.user_cas_session_t (cas_user_id);
-
-COMMENT ON TABLE nexent.user_cas_session_t IS 'Server-side session records for CAS SSO login and logout synchronization';
-COMMENT ON COLUMN nexent.user_cas_session_t.session_id IS 'JWT sid claim for revocation checks';
-COMMENT ON COLUMN nexent.user_cas_session_t.cas_user_id IS 'User identifier returned by CAS';
-COMMENT ON COLUMN nexent.user_cas_session_t.cas_session_index IS 'CAS SessionIndex or service ticket';
diff --git a/docker/official-skills-zip/create-docx.zip b/docker/official-skills-zip/create-docx.zip
deleted file mode 100644
index aa53e82b0..000000000
Binary files a/docker/official-skills-zip/create-docx.zip and /dev/null differ
diff --git a/docker/sql/v2.2.0_0526_add_cas_session_t.sql b/docker/sql/v2.2.0_0526_add_cas_session_t.sql
deleted file mode 100644
index 3f1aab4fa..000000000
--- a/docker/sql/v2.2.0_0526_add_cas_session_t.sql
+++ /dev/null
@@ -1,27 +0,0 @@
-CREATE TABLE IF NOT EXISTS nexent.user_cas_session_t (
-    cas_session_id SERIAL PRIMARY KEY,
-    session_id VARCHAR(100) NOT NULL UNIQUE,
-    user_id VARCHAR(100) NOT NULL,
-    cas_user_id VARCHAR(200) NOT NULL,
-    cas_session_index VARCHAR(500),
-    status VARCHAR(30) NOT NULL DEFAULT 'active',
-    expires_at TIMESTAMP NOT NULL,
-    revoked_at TIMESTAMP,
-    create_time TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
-    update_time TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
-    created_by VARCHAR(100),
-    updated_by VARCHAR(100),
-    delete_flag VARCHAR(1) DEFAULT 'N'
-);
-
-CREATE INDEX IF NOT EXISTS ix_user_cas_session_session_id
-    ON nexent.user_cas_session_t (session_id);
-CREATE INDEX IF NOT EXISTS ix_user_cas_session_user_id
-    ON nexent.user_cas_session_t (user_id);
-CREATE INDEX IF NOT EXISTS ix_user_cas_session_cas_user_id
-    ON nexent.user_cas_session_t (cas_user_id);
-
-COMMENT ON TABLE nexent.user_cas_session_t IS 'Server-side session records for CAS SSO login and logout synchronization';
-COMMENT ON COLUMN nexent.user_cas_session_t.session_id IS 'JWT sid claim for revocation checks';
-COMMENT ON COLUMN nexent.user_cas_session_t.cas_user_id IS 'User identifier returned by CAS';
-COMMENT ON COLUMN nexent.user_cas_session_t.cas_session_index IS 'CAS SessionIndex or service ticket';
diff --git a/docker/sql/v2.2.1_0601_add_agent_verification_config.sql b/docker/sql/v2.2.1_0601_add_agent_verification_config.sql
deleted file mode 100644
index d3882e1e2..000000000
--- a/docker/sql/v2.2.1_0601_add_agent_verification_config.sql
+++ /dev/null
@@ -1,7 +0,0 @@
--- Migration: Add layered ReAct self-verification config to agents
--- Description: Stores per-agent verification controls for step-level and final-answer validation.
-
-ALTER TABLE nexent.ag_tenant_agent_t
-ADD COLUMN IF NOT EXISTS verification_config JSONB;
-
-COMMENT ON COLUMN nexent.ag_tenant_agent_t.verification_config IS 'Layered ReAct self-verification configuration';
diff --git a/docker/sql/v2.2.1_0601_add_preserve_source_file_to_knowledge_record_t.sql b/docker/sql/v2.2.1_0601_add_preserve_source_file_to_knowledge_record_t.sql
deleted file mode 100644
index 30b588a51..000000000
--- a/docker/sql/v2.2.1_0601_add_preserve_source_file_to_knowledge_record_t.sql
+++ /dev/null
@@ -1,8 +0,0 @@
--- Migration: Add preserve_source_file to knowledge_record_t table
--- Date: 2026-06-01
--- Description: Whether to preserve uploaded source documents after vectorization (default: true)
-
-ALTER TABLE nexent.knowledge_record_t
-ADD COLUMN IF NOT EXISTS preserve_source_file BOOLEAN NOT NULL DEFAULT true;
-
-COMMENT ON COLUMN nexent.knowledge_record_t.preserve_source_file IS 'Whether to preserve uploaded source documents after vectorization';
diff --git a/docker/sql/v2.2.1_0603_add_greeting_fields_to_ag_tenant_agent_t.sql b/docker/sql/v2.2.1_0603_add_greeting_fields_to_ag_tenant_agent_t.sql
deleted file mode 100644
index 7786bb902..000000000
--- a/docker/sql/v2.2.1_0603_add_greeting_fields_to_ag_tenant_agent_t.sql
+++ /dev/null
@@ -1,15 +0,0 @@
--- Migration: Add greeting_message and example_questions columns to ag_tenant_agent_t table
--- Date: 2026-06-03
--- Description: Add greeting message and example questions fields for agent chat initial screen
-
--- Add greeting_message column to ag_tenant_agent_t table
-ALTER TABLE nexent.ag_tenant_agent_t
-ADD COLUMN IF NOT EXISTS greeting_message TEXT;
-
--- Add example_questions column to ag_tenant_agent_t table
-ALTER TABLE nexent.ag_tenant_agent_t
-ADD COLUMN IF NOT EXISTS example_questions JSONB;
-
--- Add comments to the columns
-COMMENT ON COLUMN nexent.ag_tenant_agent_t.greeting_message IS 'Agent greeting message displayed on chat initial screen';
-COMMENT ON COLUMN nexent.ag_tenant_agent_t.example_questions IS 'List of example questions for starting a conversation with this agent';
\ No newline at end of file
diff --git a/docker/sql/v2.2.1_0605_add_ag_agent_repository_t.sql b/docker/sql/v2.2.1_0605_add_ag_agent_repository_t.sql
deleted file mode 100644
index d719fc5aa..000000000
--- a/docker/sql/v2.2.1_0605_add_ag_agent_repository_t.sql
+++ /dev/null
@@ -1,96 +0,0 @@
--- Migration: Add ag_agent_repository_t table
--- Date: 2026-06-05
--- Description: Agent marketplace repository for frozen shareable agent snapshots.
-
-SET search_path TO nexent;
-
-BEGIN;
-
-CREATE SEQUENCE IF NOT EXISTS nexent.ag_agent_repository_t_agent_repository_id_seq;
-
-CREATE TABLE IF NOT EXISTS nexent.ag_agent_repository_t (
-    agent_repository_id BIGINT NOT NULL DEFAULT nextval('nexent.ag_agent_repository_t_agent_repository_id_seq'),
-    publisher_tenant_id VARCHAR(100) NOT NULL,
-    publisher_user_id VARCHAR(100) NOT NULL,
-    agent_id INTEGER NOT NULL,
-    source_version_no INTEGER NOT NULL,
-    name VARCHAR(100) NOT NULL,
-    display_name VARCHAR(100),
-    description TEXT,
-    author VARCHAR(100),
-    category_id INTEGER,
-    tags TEXT[],
-    tool_count INTEGER,
-    version_label VARCHAR(100),
-    agent_info_json JSONB NOT NULL,
-    status VARCHAR(30) DEFAULT 'NOT_SHARED',
-    create_time TIMESTAMP WITHOUT TIME ZONE DEFAULT CURRENT_TIMESTAMP,
-    update_time TIMESTAMP WITHOUT TIME ZONE DEFAULT CURRENT_TIMESTAMP,
-    created_by VARCHAR(100),
-    updated_by VARCHAR(100),
-    delete_flag VARCHAR(1) DEFAULT 'N',
-    CONSTRAINT ag_agent_repository_t_pkey PRIMARY KEY (agent_repository_id)
-);
-
-ALTER SEQUENCE nexent.ag_agent_repository_t_agent_repository_id_seq
-    OWNED BY nexent.ag_agent_repository_t.agent_repository_id;
-
-ALTER TABLE nexent.ag_agent_repository_t OWNER TO root;
-
-COMMENT ON TABLE nexent.ag_agent_repository_t IS 'Agent marketplace repository for frozen shareable agent snapshots';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.agent_repository_id IS 'Agent repository listing ID, unique primary key';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.publisher_tenant_id IS 'Publisher tenant ID';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.publisher_user_id IS 'Publisher user ID';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.agent_id IS 'Root agent ID from ag_tenant_agent_t; upsert key with publisher_tenant_id';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.source_version_no IS 'Published version number frozen at share time';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.name IS 'Root agent programmatic name for display and search';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.display_name IS 'Root agent display name';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.description IS 'Root agent description';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.author IS 'Agent author';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.category_id IS 'Optional marketplace category ID';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.tags IS 'Marketplace tags';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.tool_count IS 'Total tool count across all agents in the bundle (display only)';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.version_label IS 'Repository entry version label for display (e.g. v1.0)';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.agent_info_json IS 'Frozen ExportAndImportDataFormat snapshot with optional skills';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.status IS 'Listing status: NOT_SHARED (未共享) / PENDING_REVIEW (待审核) / REJECTED (审核驳回) / SHARED (已共享)';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.create_time IS 'Creation time';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.update_time IS 'Update time';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.created_by IS 'Creator ID';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.updated_by IS 'Updater ID';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.delete_flag IS 'Soft delete flag: Y/N';
-
-CREATE UNIQUE INDEX IF NOT EXISTS uq_agent_repository_tenant_agent_active
-    ON nexent.ag_agent_repository_t (publisher_tenant_id, agent_id)
-    WHERE delete_flag = 'N';
-
-CREATE INDEX IF NOT EXISTS idx_agent_repository_publisher_delete
-    ON nexent.ag_agent_repository_t (publisher_tenant_id, delete_flag);
-
-CREATE INDEX IF NOT EXISTS idx_agent_repository_status_delete
-    ON nexent.ag_agent_repository_t (status, delete_flag);
-
-CREATE INDEX IF NOT EXISTS idx_agent_repository_name_delete
-    ON nexent.ag_agent_repository_t (name, delete_flag);
-
-CREATE INDEX IF NOT EXISTS idx_agent_repository_tags_gin
-    ON nexent.ag_agent_repository_t USING GIN (tags);
-
-CREATE OR REPLACE FUNCTION update_ag_agent_repository_update_time()
-RETURNS TRIGGER AS $$
-BEGIN
-    NEW.update_time = CURRENT_TIMESTAMP;
-    RETURN NEW;
-END;
-$$ LANGUAGE plpgsql;
-
-COMMENT ON FUNCTION update_ag_agent_repository_update_time() IS 'Auto-update update_time for ag_agent_repository_t';
-
-DROP TRIGGER IF EXISTS update_ag_agent_repository_update_time_trigger ON nexent.ag_agent_repository_t;
-CREATE TRIGGER update_ag_agent_repository_update_time_trigger
-BEFORE UPDATE ON nexent.ag_agent_repository_t
-FOR EACH ROW
-EXECUTE FUNCTION update_ag_agent_repository_update_time();
-
-COMMENT ON TRIGGER update_ag_agent_repository_update_time_trigger ON nexent.ag_agent_repository_t IS 'Trigger to maintain update_time';
-
-COMMIT;
diff --git a/docker/sql/v2.2.1_0609_add_selected_agent_version_no_to_agent_relation_t.sql b/docker/sql/v2.2.1_0609_add_selected_agent_version_no_to_agent_relation_t.sql
deleted file mode 100644
index 9a67c1ab2..000000000
--- a/docker/sql/v2.2.1_0609_add_selected_agent_version_no_to_agent_relation_t.sql
+++ /dev/null
@@ -1,15 +0,0 @@
--- Migration: Add selected_agent_version_no to ag_agent_relation_t
--- Date: 2026-06-09
--- Description: Pin child agent version on parent-child relations at publish time.
-
-SET search_path TO nexent;
-
-BEGIN;
-
-ALTER TABLE nexent.ag_agent_relation_t
-    ADD COLUMN IF NOT EXISTS selected_agent_version_no INTEGER;
-
-COMMENT ON COLUMN nexent.ag_agent_relation_t.selected_agent_version_no IS
-    'Pinned version of selected_agent_id. NULL = use child current published version at runtime (legacy/draft).';
-
-COMMIT;
diff --git a/frontend/app/[locale]/agents/components/AgentConfigComp.tsx b/frontend/app/[locale]/agents/components/AgentConfigComp.tsx
index 1e750d5eb..13484595f 100644
--- a/frontend/app/[locale]/agents/components/AgentConfigComp.tsx
+++ b/frontend/app/[locale]/agents/components/AgentConfigComp.tsx
@@ -29,8 +29,6 @@ export default function AgentConfigComp({}: AgentConfigCompProps) {
   const currentAgentId = useAgentConfigStore((state) => state.currentAgentId);
   const isCreatingMode = useAgentConfigStore((state) => state.isCreatingMode);
   const isReadOnly = useAgentConfigStore((state) => state.isReadOnly());
-  const selectedTools = useAgentConfigStore((state) => state.editedAgent.tools);
-  const selectedSkills = useAgentConfigStore((state) => state.editedAgent.skills);
 
   const [isMcpModalOpen, setIsMcpModalOpen] = useState(false);
   const [isSkillModalOpen, setIsSkillModalOpen] = useState(false);
@@ -127,12 +125,7 @@ export default function AgentConfigComp({}: AgentConfigCompProps) {
       <Tabs defaultValue="tools" className="w-full flex-1 min-h-0 flex flex-col overflow-hidden">
         <TabsList className="grid w-full grid-cols-2 flex-shrink-0">
           <TabsTrigger value="tools">
-            <span className="inline-flex items-center gap-1">
-              {t("toolPool.title")}
-              {selectedTools.length > 0 && (
-                <Badge count={selectedTools.length} size="small" color="blue" />
-              )}
-            </span>
+            {t("toolPool.title")}
             <Tooltip
               title={<div style={{ whiteSpace: "pre-line" }}>{t("toolPool.tooltip.functionGuide")}</div>}
               color="#ffffff"
@@ -151,14 +144,7 @@ export default function AgentConfigComp({}: AgentConfigCompProps) {
               <Lightbulb className="mx-2 text-yellow-500" size={16} />
             </Tooltip>
           </TabsTrigger>
-          <TabsTrigger value="skills">
-            <span className="inline-flex items-center gap-1">
-              {t("skillPool.title")}
-              {selectedSkills && selectedSkills.length > 0 && (
-                <Badge count={selectedSkills.length} size="small" color="blue" />
-              )}
-            </span>
-          </TabsTrigger>
+          <TabsTrigger value="skills">{t("skillPool.title")}</TabsTrigger>
         </TabsList>
 
         <TabsContent value="tools" className="mt-4 flex-1 min-h-0 flex flex-col overflow-hidden">
diff --git a/frontend/app/[locale]/agents/components/agentConfig/McpConfigModal.tsx b/frontend/app/[locale]/agents/components/agentConfig/McpConfigModal.tsx
index 41c8baa45..277e85d3d 100644
--- a/frontend/app/[locale]/agents/components/agentConfig/McpConfigModal.tsx
+++ b/frontend/app/[locale]/agents/components/agentConfig/McpConfigModal.tsx
@@ -80,7 +80,6 @@ export default function McpConfigModal({
   const [openApiJson, setOpenApiJson] = useState("");
   const [openApiServiceName, setOpenApiServiceName] = useState("");
   const [openApiServerUrl, setOpenApiServerUrl] = useState("");
-  const [openApiHeadersTemplate, setOpenApiHeadersTemplate] = useState("");
   const [importingOpenApi, setImportingOpenApi] = useState(false);
   const [openapiServices, setOpenapiServices] = useState<any[]>([]);
   const [loadingOpenapiServices, setLoadingOpenapiServices] = useState(false);
@@ -507,7 +506,6 @@ export default function McpConfigModal({
           service_name: openApiServiceName.trim(),
           server_url: openApiServerUrl.trim(),
           openapi_json: parsedJson,
-          headers_template: openApiHeadersTemplate.trim() ? JSON.parse(openApiHeadersTemplate.trim()) : null,
         }),
       });
 
@@ -516,7 +514,6 @@ export default function McpConfigModal({
         setOpenApiJson("");
         setOpenApiServiceName("");
         setOpenApiServerUrl("");
-        setOpenApiHeadersTemplate("");
         await loadOpenapiServices();
         await refreshToolsAndAgents();
       } else {
@@ -1223,20 +1220,15 @@ export default function McpConfigModal({
                           style={{ flex: 3 }}
                         />
                       </div>
-                      <Input.TextArea
-                        placeholder={t("mcpConfig.addServer.customHeadersPlaceholder")}
-                        value={openApiHeadersTemplate}
-                        onChange={(e) => setOpenApiHeadersTemplate(e.target.value)}
-                        rows={2}
-                        disabled={actionsLocked || importingOpenApi}
-                      />
-                      <Input.TextArea
-                        placeholder={t("mcpConfig.openApiToMcp.jsonPlaceholder")}
-                        value={openApiJson}
-                        onChange={(e) => setOpenApiJson(e.target.value)}
-                        rows={6}
-                        disabled={actionsLocked || importingOpenApi}
-                      />
+                      <div>
+                        <Input.TextArea
+                          placeholder={t("mcpConfig.openApiToMcp.jsonPlaceholder")}
+                          value={openApiJson}
+                          onChange={(e) => setOpenApiJson(e.target.value)}
+                          rows={6}
+                          disabled={actionsLocked || importingOpenApi}
+                        />
+                      </div>
                       <div
                         style={{
                           display: "flex",
diff --git a/frontend/app/[locale]/agents/components/agentConfig/SkillBuildModal.tsx b/frontend/app/[locale]/agents/components/agentConfig/SkillBuildModal.tsx
index 8f040d4b3..7f969edb9 100644
--- a/frontend/app/[locale]/agents/components/agentConfig/SkillBuildModal.tsx
+++ b/frontend/app/[locale]/agents/components/agentConfig/SkillBuildModal.tsx
@@ -56,7 +56,7 @@ import {
   SkillFilesAccessDeniedError,
   type SkillFileNode,
 } from "@/services/agentConfigService";
-import { MarkdownRenderer } from "@/components/common/markdownRenderer";
+import { MarkdownRenderer } from "@/components/ui/markdownRenderer";
 import log from "@/lib/logger";
 
 const { TextArea } = Input;
diff --git a/frontend/app/[locale]/agents/components/agentConfig/SkillDetailModal.tsx b/frontend/app/[locale]/agents/components/agentConfig/SkillDetailModal.tsx
index 05f11d6a3..4161a3b1a 100644
--- a/frontend/app/[locale]/agents/components/agentConfig/SkillDetailModal.tsx
+++ b/frontend/app/[locale]/agents/components/agentConfig/SkillDetailModal.tsx
@@ -10,7 +10,7 @@ import {
   fetchSkillFileContent,
   SkillFilesAccessDeniedError,
 } from "@/services/agentConfigService";
-import { MarkdownRenderer } from "@/components/common/markdownRenderer";
+import { MarkdownRenderer } from "@/components/ui/markdownRenderer";
 import {
   buildTreeData,
   collectDirKeys,
diff --git a/frontend/app/[locale]/agents/components/agentConfig/SkillManagement.tsx b/frontend/app/[locale]/agents/components/agentConfig/SkillManagement.tsx
index f8a733ae0..dc5e22d87 100644
--- a/frontend/app/[locale]/agents/components/agentConfig/SkillManagement.tsx
+++ b/frontend/app/[locale]/agents/components/agentConfig/SkillManagement.tsx
@@ -3,7 +3,7 @@
 import { useState, useEffect } from "react";
 import { useTranslation } from "react-i18next";
 import { SkillGroup, Skill, SkillParam } from "@/types/agentConfig";
-import { Tabs, message, Tooltip, Badge } from "antd";
+import { Tabs, message, Tooltip } from "antd";
 import { useAgentConfigStore } from "@/stores/agentConfigStore";
 import { useSkillList } from "@/hooks/agent/useSkillList";
 import { Info, Trash2, Settings } from "lucide-react";
@@ -207,27 +207,21 @@ export default function SkillManagement({
   };
 
   const tabItems = skillGroups.map((group) => {
-    const selectedCount = group.skills.filter(s => originalSelectedSkillIdsSet.has(s.skill_id)).length;
-
     return {
       key: group.key,
       label: (
         <Tooltip title={group.label} placement="right">
-          <span className="inline-flex items-center gap-1">
-            <span
-              style={{
-                maxWidth: "100px",
-                overflow: "hidden",
-                textOverflow: "ellipsis",
-                whiteSpace: "nowrap",
-                textAlign: "left",
-              }}
-            >
-              {group.label}
-            </span>
-            {selectedCount > 0 && (
-              <Badge count={selectedCount} size="small" color="blue" />
-            )}
+          <span
+            style={{
+              display: "block",
+              maxWidth: "100px",
+              overflow: "hidden",
+              textOverflow: "ellipsis",
+              whiteSpace: "nowrap",
+              textAlign: "left",
+            }}
+          >
+            {group.label}
           </span>
         </Tooltip>
       ),
diff --git a/frontend/app/[locale]/agents/components/agentConfig/ToolManagement.tsx b/frontend/app/[locale]/agents/components/agentConfig/ToolManagement.tsx
index 62edc3ac8..0cb73de62 100644
--- a/frontend/app/[locale]/agents/components/agentConfig/ToolManagement.tsx
+++ b/frontend/app/[locale]/agents/components/agentConfig/ToolManagement.tsx
@@ -4,7 +4,7 @@ import { useState, useEffect, useCallback } from "react";
 import { useTranslation } from "react-i18next";
 import ToolConfigModal from "./tool/ToolConfigModal";
 import { ToolGroup, Tool, ToolParam } from "@/types/agentConfig";
-import { Tabs, Collapse, message, Tooltip, Badge } from "antd";
+import { Tabs, Collapse, message, Tooltip } from "antd";
 import { useAgentConfigStore } from "@/stores/agentConfigStore";
 import { useToolList } from "@/hooks/agent/useToolList";
 import { usePrefetchKnowledgeBases } from "@/hooks/useKnowledgeBaseSelector";
@@ -307,29 +307,21 @@ export default function ToolManagement({
   // Generate Tabs configuration
   const tabItems = toolGroups.map((group) => {
     const label = t(group.label);
-    const selectedCount = group.subGroups
-      ? group.subGroups.reduce(
-          (sum, sg) => sum + sg.tools.filter(t => originalSelectedToolIdsSet.has(t.id)).length, 0)
-      : group.tools.filter(t => originalSelectedToolIdsSet.has(t.id)).length;
 
     return {
       key: group.key,
       label: (
         <Tooltip title={label} placement="right">
-          <span className="inline-flex items-center gap-1">
-            <span
-              style={{
-                maxWidth: "100px",
-                overflow: "hidden",
-                textOverflow: "ellipsis",
-                whiteSpace: "nowrap",
-              }}
-            >
-              {label}
-            </span>
-            {selectedCount > 0 && (
-              <Badge count={selectedCount} size="small" color="blue" />
-            )}
+          <span
+            style={{
+              display: "block",
+              maxWidth: "100px",
+              overflow: "hidden",
+              textOverflow: "ellipsis",
+              whiteSpace: "nowrap",
+            }}
+          >
+            {label}
           </span>
         </Tooltip>
       ),
@@ -359,25 +351,17 @@ export default function ToolManagement({
                   items={group.subGroups.map((subGroup, index) => ({
                     key: subGroup.key,
                     label: (
-                      <span className="inline-flex items-center gap-1">
-                        <span
-                          className="text-gray-700 font-medium"
-                          style={{
-                            paddingTop: "8px",
-                            paddingBottom: "8px",
-                            minHeight: "36px",
-                            lineHeight: "20px",
-                          }}
-                        >
-                          {subGroup.label}
-                        </span>
-                        {subGroup.tools.filter(t => originalSelectedToolIdsSet.has(t.id)).length > 0 && (
-                          <Badge
-                            count={subGroup.tools.filter(t => originalSelectedToolIdsSet.has(t.id)).length}
-                            size="small"
-                            color="blue"
-                          />
-                        )}
+                      <span
+                        className="text-gray-700 font-medium"
+                        style={{
+                          paddingTop: "8px",
+                          paddingBottom: "8px",
+                          display: "block",
+                          minHeight: "36px",
+                          lineHeight: "20px",
+                        }}
+                      >
+                        {subGroup.label}
                       </span>
                     ),
                     className: `tool-category-panel ${
diff --git a/frontend/app/[locale]/agents/components/agentConfig/skill/SkillConfigModal.tsx b/frontend/app/[locale]/agents/components/agentConfig/skill/SkillConfigModal.tsx
index 9729007e2..6f372e2b4 100644
--- a/frontend/app/[locale]/agents/components/agentConfig/skill/SkillConfigModal.tsx
+++ b/frontend/app/[locale]/agents/components/agentConfig/skill/SkillConfigModal.tsx
@@ -12,13 +12,13 @@ import {
   message,
   Tag,
   Skeleton,
-  Tooltip
 } from "antd";
 import { Settings } from "lucide-react";
 import { CloseOutlined } from "@ant-design/icons";
 
 import { Skill, SkillParam } from "@/types/agentConfig";
 import { KnowledgeBase } from "@/types/knowledgeBase";
+import { Tooltip } from "@/components/ui/tooltip";
 import { saveSkillInstance } from "@/services/agentConfigService";
 import KnowledgeBaseSelectorModal from "@/components/tool-config/KnowledgeBaseSelectorModal";
 import {
diff --git a/frontend/app/[locale]/agents/components/agentInfo/AgentGenerateDetail.tsx b/frontend/app/[locale]/agents/components/agentInfo/AgentGenerateDetail.tsx
index cd46d2aa3..8b6cd82d7 100644
--- a/frontend/app/[locale]/agents/components/agentInfo/AgentGenerateDetail.tsx
+++ b/frontend/app/[locale]/agents/components/agentInfo/AgentGenerateDetail.tsx
@@ -1,6 +1,6 @@
 "use client";
 
-import { useState, useEffect, useMemo, useRef } from "react";
+import { useState, useEffect, useMemo, useRef, useCallback } from "react";
 import { useTranslation } from "react-i18next";
 import {
   Button,
@@ -17,11 +17,9 @@ import {
 } from "antd";
 import { Tabs, TabsList, TabsTrigger, TabsContent } from "@/components/ui/tabs";
 import { Zap, Maximize2, Settings2, Sparkles } from "lucide-react";
-import { Textarea } from "@/components/ui/textarea";
 
 import {
   AgentConfigUpdate,
-  DEFAULT_AGENT_VERIFICATION_CONFIG,
   PromptTemplate,
 } from "@/types/agentConfig";
 import {
@@ -171,7 +169,6 @@ export default function AgentGenerateDetail({}) {
       constraintPrompt: editedAgent.constraint_prompt || "",
       fewShotsPrompt: editedAgent.few_shots_prompt || "",
       provideRunSummary: editedAgent.provide_run_summary || false,
-      verificationEnabled: editedAgent.verification_config?.enabled ?? false,
       businessDescription: editedAgent.business_description || "",
       businessLogicModelName:editedAgent.business_logic_model_name,
       businessLogicModelId: editedAgent.business_logic_model_id,
@@ -236,7 +233,6 @@ export default function AgentGenerateDetail({}) {
     setOptimizeModalOpen(true);
   };
 
-
   const renderExpandButton = (type: "duty" | "constraint" | "few-shots") => {
     return (
       <Button
@@ -395,7 +391,6 @@ export default function AgentGenerateDetail({}) {
     setOptimizeModalType(null);
   };
 
-
   const handleSaveExpandModal = (content: string) => {
     switch (expandModalType) {
       case 'duty':
@@ -451,35 +446,27 @@ export default function AgentGenerateDetail({}) {
     }
   };
 
-  const handleReplaceOptimizedContent = (
-    content: string,
-    sectionType: "duty" | "constraint" | "few_shots"
-  ) => {
-    const value = content.trim();
+  const getStoreFieldKey = (type: 'duty' | 'constraint' | 'few-shots') => {
+    switch (type) {
+      case "duty":
+        return "duty_prompt";
+      case "constraint":
+        return "constraint_prompt";
+      case "few-shots":
+        return "few_shots_prompt";
+    }
+  };
 
-    if (!value) {
-      handleCloseOptimizeModal();
+  const handleReplaceOptimizedContent = (content: string) => {
+    if (!optimizeModalType) {
       return;
     }
 
-    const fieldMap = {
-      duty: {
-        formField: "dutyPrompt" as const,
-        storeField: "duty_prompt" as const,
-      },
-      constraint: {
-        formField: "constraintPrompt" as const,
-        storeField: "constraint_prompt" as const,
-      },
-      few_shots: {
-        formField: "fewShotsPrompt" as const,
-        storeField: "few_shots_prompt" as const,
-      },
-    };
+    const formFieldKey = getPromptFieldKey(optimizeModalType);
+    const storeFieldKey = getStoreFieldKey(optimizeModalType);
 
-    const { formField, storeField } = fieldMap[sectionType];
-    form.setFieldsValue({ [formField]: value });
-    updateAgentConfig({ [storeField]: value } as AgentConfigUpdate);
+    form.setFieldsValue({ [formFieldKey]: content });
+    updateAgentConfig({ [storeFieldKey]: content } as AgentConfigUpdate);
     handleCloseOptimizeModal();
   };
 
@@ -695,12 +682,11 @@ export default function AgentGenerateDetail({}) {
             }}
             className="agent-config-tabs flex flex-col h-full w-full"
           >
-            <TabsList className="grid w-full grid-cols-5 flex-shrink-0">
+            <TabsList className="grid w-full grid-cols-4 flex-shrink-0">
               <TabsTrigger value="agent-info">{t("agent.info.title")}</TabsTrigger>
               <TabsTrigger value="duty">{t("systemPrompt.card.duty.title")}</TabsTrigger>
               <TabsTrigger value="constraint">{t("systemPrompt.card.constraint.title")}</TabsTrigger>
               <TabsTrigger value="few-shots">{t("systemPrompt.card.fewShots.title")}</TabsTrigger>
-              <TabsTrigger value="greeting">{t("agent.greeting.tabTitle")}</TabsTrigger>
             </TabsList>
 
             <TabsContent value="agent-info" className="flex-1 min-h-0 overflow-y-auto">
@@ -875,7 +861,7 @@ export default function AgentGenerateDetail({}) {
                       </Row>
 
                       <Row gutter={16}>
-                        <Col span={8}>
+                        <Col span={12}>
                           <Form.Item
                             name="mainAgentMaxStep"
                             label={t("businessLogic.config.maxSteps")}
@@ -903,7 +889,7 @@ export default function AgentGenerateDetail({}) {
                             />
                           </Form.Item>
                         </Col>
-                        <Col span={8}>
+                        <Col span={12}>
                           <Form.Item
                             name="provideRunSummary"
                             label={t("agent.provideRunSummary")}
@@ -925,33 +911,6 @@ export default function AgentGenerateDetail({}) {
                             />
                           </Form.Item>
                         </Col>
-                        <Col span={8}>
-                          <Form.Item
-                            name="verificationEnabled"
-                            label={t("agent.verification")}
-                            rules={[
-                              {
-                                required: true,
-                                message: t("agent.verification.error"),
-                              },
-                            ]}
-                          >
-                            <Select
-                              options={[
-                                { value: true, label: t("common.yes") },
-                                { value: false, label: t("common.no") },
-                              ]}
-                              onChange={(value) => {
-                                updateAgentConfig({
-                                  verification_config: {
-                                    ...(editedAgent.verification_config || DEFAULT_AGENT_VERIFICATION_CONFIG),
-                                    enabled: value,
-                                  },
-                                });
-                              }}
-                            />
-                          </Form.Item>
-                        </Col>
                       </Row>
 
                       <Form.Item
@@ -1000,70 +959,6 @@ export default function AgentGenerateDetail({}) {
                 (value) => updateAgentConfig({ few_shots_prompt: value })
               )}
             </TabsContent>
-
-            <TabsContent value="greeting" className="flex-1 min-h-0 overflow-y-auto">
-              <div className="overflow-y-auto overflow-x-hidden h-full px-3 pb-3">
-                <div className="mb-4">
-                  <div className="flex items-center mb-2">
-                    <h4 className="text-md font-medium text-gray-700">{t("agent.greeting.messageTitle")}</h4>
-                  </div>
-                  <Textarea
-                    value={editedAgent.greeting_message || ""}
-                    onChange={(e) => updateAgentConfig({ greeting_message: e.target.value })}
-                    disabled={!editable || isGenerating}
-                    placeholder={t("agent.greeting.messagePlaceholder")}
-                    className="w-full min-h-[80px]"
-                  />
-                </div>
-
-                <div className="mb-4">
-                  <div className="flex items-center mb-2">
-                    <h4 className="text-md font-medium text-gray-700">{t("agent.greeting.questionsTitle")}</h4>
-                  </div>
-                  {(editedAgent.example_questions || []).length > 0 && (
-                    <div className="space-y-2">
-                      {(editedAgent.example_questions || []).map((q: string, idx: number) => (
-                        <div key={idx} className="flex items-center gap-2">
-                          <Input
-                            value={q}
-                            onChange={(e) => {
-                              const newQuestions = [...(editedAgent.example_questions || [])];
-                              newQuestions[idx] = e.target.value;
-                              updateAgentConfig({ example_questions: newQuestions });
-                            }}
-                            disabled={!editable || isGenerating}
-                            className="flex-1"
-                          />
-                          <Button
-                            size="small"
-                            disabled={!editable || isGenerating}
-                            onClick={() => {
-                              const newQuestions = (editedAgent.example_questions || []).filter((_: string, i: number) => i !== idx);
-                              updateAgentConfig({ example_questions: newQuestions });
-                            }}
-                          >
-                            {t("agent.greeting.removeQuestion")}
-                          </Button>
-                        </div>
-                      ))}
-                    </div>
-                  )}
-                  {(editedAgent.example_questions || []).length < 6 && editable && !isGenerating && (
-                    <Button
-                      size="small"
-                      type="dashed"
-                      onClick={() => {
-                        const newQuestions = [...(editedAgent.example_questions || []), ""];
-                        updateAgentConfig({ example_questions: newQuestions });
-                      }}
-                      className="mt-2"
-                    >
-                      {t("agent.greeting.addQuestion")}
-                    </Button>
-                  )}
-                </div>
-              </div>
-            </TabsContent>
           </Tabs>
         </Col>
       </Row>
diff --git a/frontend/app/[locale]/agents/components/agentInfo/DebugConfig.tsx b/frontend/app/[locale]/agents/components/agentInfo/DebugConfig.tsx
index 511c74218..4e284f879 100644
--- a/frontend/app/[locale]/agents/components/agentInfo/DebugConfig.tsx
+++ b/frontend/app/[locale]/agents/components/agentInfo/DebugConfig.tsx
@@ -18,7 +18,6 @@ import {
 import { useModelList } from "@/hooks/model/useModelList";
 import { useAgentConfigStore } from "@/stores/agentConfigStore";
 import DebugMessageList from "./DebugMessageList";
-import DebugOptimizeModal from "./DebugOptimizeModal";
 import { useCompareStream } from "./useCompareStream";
 
 // Agent debugging component Props interface
@@ -31,11 +30,6 @@ interface AgentDebuggingProps {
   isStreaming: boolean;
   isCompareStreaming?: boolean;
   messages: ChatMessageType[];
-  onOptimizeReply?: (params: {
-    userQuestion: string;
-    assistantAnswer: string;
-    history: Array<{ role: string; content: string }>;
-  }) => void;
   comparePanel?: React.ReactNode;
   showCompare?: boolean;
   onOpenCompare?: () => void;
@@ -61,7 +55,6 @@ function AgentDebugging({
   isStreaming,
   isCompareStreaming = false,
   messages,
-  onOptimizeReply,
   comparePanel,
   showCompare,
   onOpenCompare,
@@ -81,11 +74,7 @@ function AgentDebugging({
         ) : (
           <div className="flex flex-col gap-4 flex-1 min-h-0 overflow-hidden">
             {/* Message display area */}
-            <DebugMessageList
-              messages={messages}
-              isStreaming={isStreaming}
-              onOptimizeReply={onOptimizeReply}
-            />
+            <DebugMessageList messages={messages} isStreaming={isStreaming} />
           </div>
         )}
 
@@ -163,16 +152,6 @@ export default function DebugConfig({ agentId }: DebugConfigProps) {
   const prevAgentIdRef = useRef<number | null | undefined>(undefined);
   // Maintain an independent step ID counter per Agent
   const stepIdCounter = useRef<{ current: number }>({ current: 0 });
-
-  const [debugOptimizeOpen, setDebugOptimizeOpen] = useState(false);
-  const [debugOptimizeSelected, setDebugOptimizeSelected] = useState<null | {
-    userQuestion: string;
-    assistantAnswer: string;
-    history: Array<{ role: string; content: string }>;
-  }>(null);
-  const [compareOriginalPrompt, setCompareOriginalPrompt] = useState("");
-  const [compareOptimizedPrompt, setCompareOptimizedPrompt] = useState("");
-
   const [isComparePanelOpen, setIsComparePanelOpen] = useState(false);
   const [compareLeftModelId, setCompareLeftModelId] = useState<number | null>(null);
   const [compareRightModelId, setCompareRightModelId] = useState<number | null>(null);
@@ -623,113 +602,8 @@ export default function DebugConfig({ agentId }: DebugConfigProps) {
     }
   };
 
-  const handleOpenOptimize = (params: {
-    userQuestion: string;
-    assistantAnswer: string;
-    history: Array<{ role: string; content: string }>;
-  }) => {
-    if (!parsedAgentId) return;
-    if (!editedAgent?.model_id) return;
-
-    const duty = (editedAgent?.duty_prompt || "").trim();
-    const constraint = (editedAgent?.constraint_prompt || "").trim();
-    const fewShots = (editedAgent?.few_shots_prompt || "").trim();
-
-    const originalFullPrompt = [
-      "# 智能体角色",
-      duty,
-      "",
-      "# 使用要求",
-      constraint,
-      "",
-      "# 示例",
-      fewShots,
-    ]
-      .filter((part) => part !== undefined)
-      .join("\n")
-      .trim();
-
-    setCompareOriginalPrompt(originalFullPrompt);
-    setCompareOptimizedPrompt("");
-
-    setDebugOptimizeSelected(params);
-    setDebugOptimizeOpen(true);
-  };
-
-  const handleOptimized = (params: {
-    originalFullPrompt: string;
-    optimizedFullPrompt: string;
-  }) => {
-    setCompareOriginalPrompt(params.originalFullPrompt || "");
-    setCompareOptimizedPrompt(params.optimizedFullPrompt || "");
-  };
-
-  const handleApplyOptimizedPrompt = (optimizedFullPrompt?: string) => {
-    const optimized = (optimizedFullPrompt || compareOptimizedPrompt || "").trim();
-    if (!optimized) {
-      return;
-    }
-
-    const normalized = optimized
-      .replace(/\r\n/g, "\n")
-      .replace(/^#\s*智能体角色\s*$/gm, "# Duty")
-      .replace(/^#\s*使用要求\s*$/gm, "# Constraint")
-      .replace(/^#\s*示例\s*$/gm, "# FewShots");
-
-    const pickSection = (header: "Duty" | "Constraint" | "FewShots"): string => {
-      const headerRegex = new RegExp(`^#\\s*${header}\\s*$`, "gm");
-      const matches = [...normalized.matchAll(headerRegex)];
-      const current = matches[0];
-      if (!current) return "";
-
-      const start = current.index + current[0].length;
-      const rest = normalized.slice(start);
-      const nextHeaderMatch = rest.match(/^#\s*(Duty|Constraint|FewShots)\s*$/m);
-      const end = nextHeaderMatch?.index ?? rest.length;
-      return rest.slice(0, end).trim();
-    };
-
-    const duty = pickSection("Duty");
-    const constraint = pickSection("Constraint");
-    const fewShots = pickSection("FewShots");
-
-    const updateAgentConfig = useAgentConfigStore.getState().updateAgentConfig;
-
-    updateAgentConfig({
-      ...(duty ? { duty_prompt: duty } : {}),
-      ...(constraint ? { constraint_prompt: constraint } : {}),
-      ...(fewShots ? { few_shots_prompt: fewShots } : {}),
-    });
-    // Close optimize modal after applying.
-    setDebugOptimizeOpen(false);
-    setDebugOptimizeSelected(null);
-    setCompareOriginalPrompt("");
-    setCompareOptimizedPrompt("");
-  };
-
   return (
     <div className="w-full h-full bg-white">
-      <DebugOptimizeModal
-        open={debugOptimizeOpen}
-        agentId={parsedAgentId ?? 0}
-        modelId={editedAgent?.model_id ?? 0}
-        userQuestion={debugOptimizeSelected?.userQuestion || ""}
-        assistantAnswer={debugOptimizeSelected?.assistantAnswer || ""}
-        history={debugOptimizeSelected?.history || []}
-        initialOriginalFullPrompt={compareOriginalPrompt || ""}
-        onCancel={() => {
-          setDebugOptimizeOpen(false);
-          setDebugOptimizeSelected(null);
-          setCompareOriginalPrompt("");
-          setCompareOptimizedPrompt("");
-        }}
-        onOptimized={handleOptimized}
-        onApply={(optimizedFullPrompt) => {
-          setCompareOptimizedPrompt(optimizedFullPrompt || "");
-          handleApplyOptimizedPrompt(optimizedFullPrompt);
-        }}
-      />
-
       <AgentDebugging
         key={agentId} // Re-render when agentId changes to ensure state resets
         onStop={handleStop}
@@ -740,7 +614,6 @@ export default function DebugConfig({ agentId }: DebugConfigProps) {
         isStreaming={isStreaming}
         isCompareStreaming={isCompareStreaming}
         messages={messages}
-        onOptimizeReply={handleOpenOptimize}
         comparePanel={comparePanel}
         showCompare={hasMultipleLlmModels}
         onOpenCompare={toggleComparePanel}
diff --git a/frontend/app/[locale]/agents/components/agentInfo/DebugMessageList.tsx b/frontend/app/[locale]/agents/components/agentInfo/DebugMessageList.tsx
index 4b299d52b..7eb25c220 100644
--- a/frontend/app/[locale]/agents/components/agentInfo/DebugMessageList.tsx
+++ b/frontend/app/[locale]/agents/components/agentInfo/DebugMessageList.tsx
@@ -5,25 +5,17 @@ import { TaskWindow } from "@/app/chat/streaming/taskWindow";
 import { transformMessagesToTaskMessages } from "@/app/chat/streaming/messageTransformer";
 import { MESSAGE_ROLES } from "@/const/chatConfig";
 import { ChatMessageType, TaskMessageType } from "@/types/chat";
-import { Button, Tooltip } from "antd";
-import { Sparkles } from "lucide-react";
 
 interface DebugMessageListProps {
   messages: ChatMessageType[];
   isStreaming: boolean;
   emptyPlaceholder?: string;
-  onOptimizeReply?: (params: {
-    userQuestion: string;
-    assistantAnswer: string;
-    history: Array<{ role: string; content: string }>;
-  }) => void;
 }
 
 export default function DebugMessageList({
   messages,
   isStreaming,
   emptyPlaceholder,
-  onOptimizeReply,
 }: DebugMessageListProps) {
   const processMessageSteps = (message: ChatMessageType): TaskMessageType[] => {
     if (!message.steps || message.steps.length === 0) return [];
@@ -43,40 +35,6 @@ export default function DebugMessageList({
     );
   }
 
-  const buildHistory = () =>
-    messages
-      .filter((msg) => msg.isComplete !== false && msg.content?.trim())
-      .map((msg) => ({
-        role: msg.role,
-        content:
-          msg.role === MESSAGE_ROLES.ASSISTANT
-            ? msg.finalAnswer?.trim() || msg.content || ""
-            : msg.content || "",
-      }));
-
-  const onOptimizeClick = (assistantIndex: number) => {
-    if (!onOptimizeReply) return;
-
-    const assistantMsg = messages[assistantIndex];
-    if (!assistantMsg) return;
-
-    const assistantAnswer = assistantMsg.finalAnswer?.trim() || assistantMsg.content || "";
-    if (!assistantAnswer.trim()) return;
-
-    const userMsg = [...messages]
-      .slice(0, assistantIndex)
-      .reverse()
-      .find((m) => m.role === MESSAGE_ROLES.USER);
-
-    const userQuestion = userMsg?.content || "";
-
-    onOptimizeReply({
-      userQuestion,
-      assistantAnswer,
-      history: buildHistory(),
-    });
-  };
-
   return (
     <div className="flex flex-col gap-3 h-full overflow-y-auto custom-scrollbar">
       {messages.map((message, index) => {
@@ -85,18 +43,6 @@ export default function DebugMessageList({
             ? processMessageSteps(message)
             : [];
 
-        const isLastStreamingAssistant =
-          isStreaming &&
-          index === messages.length - 1 &&
-          message.role === MESSAGE_ROLES.ASSISTANT;
-
-        const canOptimize =
-          Boolean(onOptimizeReply) &&
-          message.role === MESSAGE_ROLES.ASSISTANT &&
-          message.isComplete !== false &&
-          !isLastStreamingAssistant &&
-          Boolean((message.finalAnswer || message.content || "").trim());
-
         return (
           <div key={message.id || index} className="flex flex-col gap-2">
             {message.role === MESSAGE_ROLES.USER && (
@@ -123,39 +69,16 @@ export default function DebugMessageList({
               )}
 
             {message.role === MESSAGE_ROLES.ASSISTANT && (
-              <div className="relative">
-                <ChatStreamFinalMessage
-                  message={message}
-                  onSelectMessage={() => {}}
-                  isSelected={false}
-                  searchResultsCount={message.searchResults?.length || 0}
-                  imagesCount={message.images?.length || 0}
-                  onImageClick={() => {}}
-                  onOpinionChange={() => {}}
-                  hideButtons={true}
-                />
-
-                {canOptimize && (
-                  <div className="mt-1 flex justify-start">
-                    <Tooltip title="优化" placement="top">
-                      <Button
-                        type="text"
-                        size="small"
-                        onClick={() => onOptimizeClick(index)}
-                        icon={<Sparkles size={14} />}
-                        className="prompt-toolbar-button"
-                        style={{
-                          color: "#475569",
-                          width: 24,
-                          minWidth: 24,
-                          height: 24,
-                          borderRadius: 9999,
-                        }}
-                      />
-                    </Tooltip>
-                  </div>
-                )}
-              </div>
+              <ChatStreamFinalMessage
+                message={message}
+                onSelectMessage={() => {}}
+                isSelected={false}
+                searchResultsCount={message.searchResults?.length || 0}
+                imagesCount={message.images?.length || 0}
+                onImageClick={() => {}}
+                onOpinionChange={() => {}}
+                hideButtons={true}
+              />
             )}
           </div>
         );
diff --git a/frontend/app/[locale]/agents/components/agentInfo/DebugOptimizeModal.tsx b/frontend/app/[locale]/agents/components/agentInfo/DebugOptimizeModal.tsx
deleted file mode 100644
index f9b1f4eca..000000000
--- a/frontend/app/[locale]/agents/components/agentInfo/DebugOptimizeModal.tsx
+++ /dev/null
@@ -1,230 +0,0 @@
-"use client";
-
-import { useEffect, useState } from "react";
-import { useTranslation } from "react-i18next";
-import { App, Button, Input, Modal, Space, Spin, Typography } from "antd";
-
-const { TextArea } = Input;
-const { Paragraph, Text } = Typography;
-
-export interface DebugOptimizeModalProps {
-  open: boolean;
-  agentId: number;
-  modelId: number;
-  userQuestion: string;
-  assistantAnswer: string;
-  history: Array<{ role: string; content: string }>;
-  initialOriginalFullPrompt?: string;
-  onCancel: () => void;
-  onOptimized: (params: { originalFullPrompt: string; optimizedFullPrompt: string }) => void;
-  onApply: (optimizedFullPrompt: string) => void;
-  applying?: boolean;
-}
-
-export default function DebugOptimizeModal({
-  open,
-  agentId,
-  modelId,
-  userQuestion,
-  assistantAnswer,
-  history,
-  initialOriginalFullPrompt,
-  onCancel,
-  onOptimized,
-  onApply,
-  applying,
-}: DebugOptimizeModalProps) {
-  const { t } = useTranslation("common");
-  const { message } = App.useApp();
-
-  const [feedback, setFeedback] = useState("");
-  const [isOptimizing, setIsOptimizing] = useState(false);
-
-  const [originalFullPrompt, setOriginalFullPrompt] = useState("");
-  const [optimizedFullPrompt, setOptimizedFullPrompt] = useState("");
-  const [displayedContent, setDisplayedContent] = useState("");
-
-  // Section header mapping: English -> Chinese
-  const headerMap: Record<string, string> = {
-    "# Duty": "#智能体角色",
-    "# Constraint": "#使用要求",
-    "# FewShots": "#示例",
-  };
-
-  const mapHeadersToChinese = (text: string) => {
-    let result = text;
-    for (const [en, zh] of Object.entries(headerMap)) {
-      result = result.split(en).join(zh);
-    }
-    return result;
-  };
-
-  useEffect(() => {
-    if (!open) {
-      setFeedback("");
-      setIsOptimizing(false);
-      setOriginalFullPrompt("");
-      setOptimizedFullPrompt("");
-      setDisplayedContent("");
-      return;
-    }
-
-    setFeedback("");
-    setIsOptimizing(false);
-    setDisplayedContent("");
-    // Show original prompt immediately when opening the modal.
-    setOriginalFullPrompt((prev) => prev || initialOriginalFullPrompt || "");
-    // Keep original prompt visible while waiting for new optimized result.
-    setOptimizedFullPrompt("");
-  }, [open, agentId, modelId]);
-
-  const handleOk = async () => {
-    if (!feedback.trim()) {
-      message.error(t("systemPrompt.optimize.feedbackRequired"));
-      return;
-    }
-
-    setIsOptimizing(true);
-    try {
-      const resp = await fetch("/api/prompt/optimize/from_debug", {
-        method: "POST",
-        headers: { "Content-Type": "application/json" },
-        body: JSON.stringify({
-          agent_id: agentId,
-          model_id: modelId,
-          feedback: feedback.trim(),
-          selected: {
-            user_question: userQuestion,
-            assistant_answer: assistantAnswer,
-          },
-          history,
-        }),
-      });
-
-      const result = await resp.json();
-      if (!resp.ok) {
-        throw new Error(result?.message || t("systemPrompt.optimize.error"));
-      }
-
-      const data = result?.data;
-      const original = data?.original_full_prompt || "";
-      const fullText = mapHeadersToChinese(data?.optimized_full_prompt || "");
-
-      setOriginalFullPrompt(original);
-      setOptimizedFullPrompt(fullText);
-      setDisplayedContent(fullText);
-
-      // Ensure modal stays open and does not reset prompts.
-      setIsOptimizing(false);
-
-      onOptimized({
-        originalFullPrompt: original,
-        optimizedFullPrompt: fullText,
-      });
-    } catch (e: any) {
-      message.error(e?.message || t("systemPrompt.optimize.error"));
-    } finally {
-      setIsOptimizing(false);
-    }
-  };
-
-  return (
-    <Modal
-      title={t("agent.debug.optimizeTitle", "Optimize prompt")}
-      open={open}
-      onCancel={onCancel}
-      width={1200}
-      footer={
-        <Space>
-          <Button onClick={onCancel}>{t("common.cancel")}</Button>
-          <Button
-            type="primary"
-            onClick={() => onApply(optimizedFullPrompt)}
-            disabled={!optimizedFullPrompt.trim()}
-            loading={applying}
-          >
-            {t("agent.debug.promptCompare.apply", "Apply")}
-          </Button>
-          <Button type="primary" onClick={handleOk}>
-            {t("systemPrompt.optimize.submit")}
-          </Button>
-        </Space>
-      }
-      destroyOnHidden
-    >
-      <div className="flex flex-col gap-3">
-        <Text type="secondary">
-          {t(
-            "agent.debug.optimizeHint",
-            "Select a reply, provide feedback, and we will optimize the full system prompt."
-          )}
-        </Text>
-
-        <div>
-          <Text strong>{t("systemPrompt.optimize.feedbackLabel")}</Text>
-          <TextArea
-            value={feedback}
-            onChange={(e) => setFeedback(e.target.value)}
-            placeholder={t("systemPrompt.optimize.feedbackPlaceholder")}
-            rows={4}
-            className="mt-2"
-            disabled={isOptimizing}
-          />
-        </div>
-
-        <div className="grid grid-cols-1 gap-3 md:grid-cols-2">
-          <div>
-            <Text strong>{t("agent.debug.selectedQuestion", "Selected question")}</Text>
-            <div className="mt-2 border border-gray-200 rounded-md p-3 bg-gray-50">
-              <Paragraph style={{ whiteSpace: "pre-wrap", marginBottom: 0 }} className="text-sm">
-                {userQuestion || t("common.none")}
-              </Paragraph>
-            </div>
-          </div>
-          <div>
-            <Text strong>{t("agent.debug.selectedAnswer", "Selected answer")}</Text>
-            <div className="mt-2 border border-gray-200 rounded-md p-3 bg-gray-50">
-              <Paragraph style={{ whiteSpace: "pre-wrap", marginBottom: 0 }} className="text-sm">
-                {assistantAnswer || t("common.none")}
-              </Paragraph>
-            </div>
-          </div>
-        </div>
-
-        <div className="grid grid-cols-1 gap-4 lg:grid-cols-2">
-          <div>
-            <Text strong>{t("agent.debug.promptCompare.original", "Original")}</Text>
-            <div className="mt-2 border border-gray-200 rounded-md p-3 bg-gray-50">
-              <Paragraph
-                style={{ whiteSpace: "pre-wrap", minHeight: 520, marginBottom: 0 }}
-                className="font-mono text-sm"
-              >
-                {mapHeadersToChinese(originalFullPrompt) || "-"}
-              </Paragraph>
-            </div>
-          </div>
-          <div>
-            <Text strong>{t("agent.debug.promptCompare.optimized", "Optimized")}</Text>
-            <div className="mt-2 border border-gray-200 rounded-md p-3">
-              {isOptimizing ? (
-                <div className="flex flex-col items-center justify-center gap-3" style={{ minHeight: 520 }}>
-                  <Spin size="medium" />
-                  <span className="text-gray-500 text-sm">
-                    {t("systemPrompt.optimize.generating")}
-                  </span>
-                </div>
-              ) : (
-                <Paragraph
-                  style={{ whiteSpace: "pre-wrap", minHeight: 520, marginBottom: 0 }}
-                  className="font-mono text-sm"
-                >
-                  {displayedContent || t("systemPrompt.optimize.empty")}
-                </Paragraph>
-              )}
-            </div>
-          </div>
-        </div>
-      </div>
-    </Modal>
-  );
-}
diff --git a/frontend/app/[locale]/agents/components/agentInfo/DebugPromptCompareModal.tsx b/frontend/app/[locale]/agents/components/agentInfo/DebugPromptCompareModal.tsx
deleted file mode 100644
index eec0ed132..000000000
--- a/frontend/app/[locale]/agents/components/agentInfo/DebugPromptCompareModal.tsx
+++ /dev/null
@@ -1,76 +0,0 @@
-"use client";
-
-import { useTranslation } from "react-i18next";
-import { Button, Modal, Space, Typography } from "antd";
-
-const { Paragraph, Text } = Typography;
-
-export interface DebugPromptCompareModalProps {
-  open: boolean;
-  originalFullPrompt: string;
-  optimizedFullPrompt: string;
-  onClose: () => void;
-  onApply: () => void;
-  applying?: boolean;
-}
-
-export default function DebugPromptCompareModal({
-  open,
-  originalFullPrompt,
-  optimizedFullPrompt,
-  onClose,
-  onApply,
-  applying,
-}: DebugPromptCompareModalProps) {
-  const { t } = useTranslation("common");
-
-  return (
-    <Modal
-      title={t("agent.debug.promptCompare.title", "Prompt compare")}
-      open={open}
-      onCancel={onClose}
-      width={1200}
-      footer={
-        <Space>
-          <Button onClick={onClose}>
-            {t("agent.debug.promptCompare.close", "Close")}
-          </Button>
-          <Button
-            type="primary"
-            onClick={onApply}
-            disabled={!optimizedFullPrompt.trim()}
-            loading={applying}
-          >
-            {t("agent.debug.promptCompare.apply", "Apply")}
-          </Button>
-        </Space>
-      }
-      destroyOnHidden
-    >
-      <div className="grid grid-cols-1 gap-4 lg:grid-cols-2">
-        <div className="border border-gray-200 rounded-md p-3 bg-gray-50">
-          <Text type="secondary" className="text-xs">
-            {t("agent.debug.promptCompare.original", "Original")}
-          </Text>
-          <Paragraph
-            style={{ whiteSpace: "pre-wrap", minHeight: 520, marginBottom: 0 }}
-            className="font-mono text-sm"
-          >
-            {originalFullPrompt || "-"}
-          </Paragraph>
-        </div>
-        <div className="border border-gray-200 rounded-md p-3">
-          <Text type="secondary" className="text-xs">
-            {t("agent.debug.promptCompare.optimized", "Optimized")}
-          </Text>
-          <Paragraph
-            style={{ whiteSpace: "pre-wrap", minHeight: 520, marginBottom: 0 }}
-            className="font-mono text-sm"
-          >
-            {optimizedFullPrompt || "-"}
-          </Paragraph>
-        </div>
-      </div>
-    </Modal>
-  );
-}
diff --git a/frontend/app/[locale]/agents/components/agentInfo/PromptOptimizeModal.tsx b/frontend/app/[locale]/agents/components/agentInfo/PromptOptimizeModal.tsx
index 897c523c3..1d7629951 100644
--- a/frontend/app/[locale]/agents/components/agentInfo/PromptOptimizeModal.tsx
+++ b/frontend/app/[locale]/agents/components/agentInfo/PromptOptimizeModal.tsx
@@ -1,22 +1,6 @@
-"use client";
-
-import { useEffect, useState, useRef, useCallback } from "react";
+import { useEffect, useState } from "react";
 import { useTranslation } from "react-i18next";
-import {
-  App,
-  Button,
-  Card,
-  Input,
-  Modal,
-  Radio,
-  Space,
-  Spin,
-  Typography,
-  Divider,
-  Tooltip,
-  Alert,
-} from "antd";
-import { MousePointer2 } from "lucide-react";
+import { App, Button, Card, Input, Modal, Space, Typography } from "antd";
 
 import log from "@/lib/logger";
 import { optimizePromptSection } from "@/services/promptService";
@@ -25,8 +9,6 @@ import type { OptimizePromptSectionResponse } from "@/types/agentConfig";
 const { TextArea } = Input;
 const { Paragraph, Text } = Typography;
 
-export type OptimizeMode = "general" | "insert" | "select";
-
 export interface PromptOptimizeModalProps {
   open: boolean;
   title: string;
@@ -39,7 +21,7 @@ export interface PromptOptimizeModalProps {
   subAgentIds: number[];
   knowledgeBaseDisplayNames?: string[];
   onClose: () => void;
-  onReplace: (content: string, sectionType: "duty" | "constraint" | "few_shots") => void;
+  onReplace: (content: string) => void;
 }
 
 export default function PromptOptimizeModal({
@@ -58,115 +40,43 @@ export default function PromptOptimizeModal({
 }: PromptOptimizeModalProps) {
   const { t } = useTranslation("common");
   const { message } = App.useApp();
-  const [mode, setMode] = useState<OptimizeMode>("general");
   const [feedback, setFeedback] = useState("");
-  const [startPos, setStartPos] = useState<string>("");
-  const [endPos, setEndPos] = useState<string>("");
   const [optimizedContent, setOptimizedContent] = useState("");
   const [isOptimizing, setIsOptimizing] = useState(false);
-  const [isContentSelected, setIsContentSelected] = useState(false);
-  const contentTextAreaRef = useRef<any>(null);
-
-  // Section header mapping: English -> Chinese
-  const headerMap: Record<string, string> = {
-    "# Duty": "#智能体角色",
-    "# Constraint": "#使用要求",
-    "# FewShots": "#示例",
-  };
-
-  const mapHeadersToChinese = (text: string) => {
-    let result = text;
-    for (const [en, zh] of Object.entries(headerMap)) {
-      result = result.split(en).join(zh);
-    }
-    return result;
-  };
 
   useEffect(() => {
     if (!open) {
       setFeedback("");
       setOptimizedContent("");
       setIsOptimizing(false);
-      setMode("general");
-      setStartPos("");
-      setEndPos("");
-      setIsContentSelected(false);
       return;
     }
+
     setFeedback("");
     setOptimizedContent("");
-    setIsOptimizing(false);
-    setMode("general");
-    setStartPos("");
-    setEndPos("");
-    setIsContentSelected(false);
   }, [open, sectionType, currentContent]);
 
-  const handleContentSelect = useCallback(() => {
-    if (!contentTextAreaRef.current) return;
-    const textarea = contentTextAreaRef.current.resizableTextArea?.textArea;
-    if (!textarea) return;
-
-    const { selectionStart, selectionEnd } = textarea;
-
-    // Insert mode: allow caret position even when no range is selected
-    if (selectionStart === selectionEnd) {
-      setStartPos(String(selectionStart));
-      setEndPos("");
-      setIsContentSelected(false);
-      setMode("insert");
-      return;
-    }
-
-    // Select mode: range selected
-    setStartPos(String(selectionStart));
-    setEndPos(String(selectionEnd));
-    setIsContentSelected(true);
-    setMode("select");
-  }, []);
-
   const handleOptimize = async () => {
     if (!feedback.trim()) {
       message.error(t("systemPrompt.optimize.feedbackRequired"));
       return;
     }
 
-    if (mode === "insert") {
-      const pos = parseInt(startPos, 10);
-      if (isNaN(pos) || pos < 0) {
-        message.error(t("systemPrompt.finetune.positionError"));
-        return;
-      }
-    }
-
-    if (mode === "select") {
-      const start = parseInt(startPos, 10);
-      const end = parseInt(endPos, 10);
-      if (isNaN(start) || isNaN(end) || start < 0 || end < 0 || start >= end) {
-        message.error(t("systemPrompt.finetune.positionError"));
-        return;
-      }
-    }
-
     setIsOptimizing(true);
     try {
       const result: OptimizePromptSectionResponse = await optimizePromptSection({
         agent_id: agentId,
         task_description: taskDescription,
-        model_id: modelId,
+        model_id: String(modelId),
         section_type: sectionType,
         section_title: title,
         current_content: currentContent,
         feedback,
-        mode,
-        start_pos: mode !== "general" ? parseInt(startPos, 10) : undefined,
-        end_pos: mode === "select" ? parseInt(endPos, 10) : undefined,
         tool_ids: toolIds,
         sub_agent_ids: subAgentIds,
         knowledge_base_display_names: knowledgeBaseDisplayNames,
       });
-      const fullText = mapHeadersToChinese(result.optimized_content || "");
-      setOptimizedContent(fullText);
+      setOptimizedContent(result.optimized_content || "");
     } catch (error: any) {
       log.error("Optimize prompt section failed:", error);
       message.error(error?.message || t("systemPrompt.optimize.error"));
@@ -176,28 +86,12 @@ export default function PromptOptimizeModal({
   };
 
   const handleReplace = () => {
-    if (!optimizedContent.trim() || isOptimizing) return;
-    onReplace(optimizedContent.trim(), sectionType);
+    if (!optimizedContent.trim()) {
+      return;
+    }
+    onReplace(optimizedContent);
   };
 
-  const modeOptions: Array<{ value: OptimizeMode; label: string; desc: string }> = [
-    {
-      value: "general",
-      label: t("systemPrompt.finetune.modeGeneral"),
-      desc: t("systemPrompt.finetune.modeGeneralDesc"),
-    },
-    {
-      value: "insert",
-      label: t("systemPrompt.finetune.modeInsert"),
-      desc: t("systemPrompt.finetune.modeInsertDesc"),
-    },
-    {
-      value: "select",
-      label: t("systemPrompt.finetune.modeSelect"),
-      desc: t("systemPrompt.finetune.modeSelectDesc"),
-    },
-  ];
-
   return (
     <Modal
       title={title}
@@ -206,7 +100,9 @@ export default function PromptOptimizeModal({
       width={1200}
       footer={
         <Space>
-          <Button onClick={onClose}>{t("common.cancel")}</Button>
+          <Button onClick={onClose}>
+            {t("common.cancel")}
+          </Button>
           <Button
             type="primary"
             onClick={handleReplace}
@@ -219,97 +115,11 @@ export default function PromptOptimizeModal({
       destroyOnHidden
     >
       <div className="flex flex-col gap-4">
-        {/* Mode Selection */}
-        <div>
-          <Text strong className="mb-2 block">
-            {t("systemPrompt.finetune.modeLabel")}
-          </Text>
-          <Radio.Group
-            value={mode}
-            onChange={(e) => setMode(e.target.value)}
-            className="flex flex-col gap-2"
-          >
-            {modeOptions.map((opt) => (
-              <Radio key={opt.value} value={opt.value} className="!ml-0">
-                <span className="font-medium">{opt.label}</span>
-                <span className="text-gray-500 text-sm ml-2">{opt.desc}</span>
-              </Radio>
-            ))}
-          </Radio.Group>
-        </div>
-
-        {/* Position inputs for insert/select modes */}
-        {mode !== "general" && (
-          <div className="bg-gray-50 rounded-md p-4">
-            {mode === "insert" && (
-              <div className="flex items-center gap-4">
-                <div className="flex-1">
-                  <Text type="secondary" className="text-xs">
-                    {t("systemPrompt.finetune.insertPositionLabel")}
-                  </Text>
-                  <Input
-                    type="number"
-                    min={0}
-                    value={startPos}
-                    onChange={(e) => setStartPos(e.target.value)}
-                    placeholder={t("systemPrompt.finetune.insertPositionPlaceholder")}
-                  />
-                </div>
-              </div>
-            )}
-            {mode === "select" && (
-              <div className="flex items-center gap-4 flex-wrap">
-                <div>
-                  <Text type="secondary" className="text-xs">
-                    {t("systemPrompt.finetune.selectStartLabel")}
-                  </Text>
-                  <Input
-                    type="number"
-                    min={0}
-                    value={startPos}
-                    onChange={(e) => setStartPos(e.target.value)}
-                    placeholder={t("systemPrompt.finetune.selectStartPlaceholder")}
-                    style={{ width: 140 }}
-                  />
-                </div>
-                <div>
-                  <Text type="secondary" className="text-xs">
-                    {t("systemPrompt.finetune.selectEndLabel")}
-                  </Text>
-                  <Input
-                    type="number"
-                    min={0}
-                    value={endPos}
-                    onChange={(e) => setEndPos(e.target.value)}
-                    placeholder={t("systemPrompt.finetune.selectEndPlaceholder")}
-                    style={{ width: 140 }}
-                  />
-                </div>
-              </div>
-            )}
-            {isContentSelected && (
-              <Alert
-                title={
-                  <span className="text-xs">
-                    {t("systemPrompt.finetune.selectTip")}: {startPos} - {endPos}
-                  </span>
-                }
-                type="success"
-                showIcon
-                className="mt-2"
-              />
-            )}
-          </div>
-        )}
-
-        <Divider className="my-2" />
-
-        {/* Feedback Input */}
         <div>
           <Text strong>{t("systemPrompt.optimize.feedbackLabel")}</Text>
           <TextArea
             value={feedback}
-            onChange={(e) => setFeedback(e.target.value)}
+            onChange={(event) => setFeedback(event.target.value)}
             placeholder={t("systemPrompt.optimize.feedbackPlaceholder")}
             rows={4}
             className="mt-2"
@@ -317,64 +127,30 @@ export default function PromptOptimizeModal({
           />
         </div>
 
-        {/* Submit Button */}
         <div className="flex justify-end">
-          <Button type="primary" onClick={handleOptimize}>
+          <Button
+            type="primary"
+            onClick={handleOptimize}
+            loading={isOptimizing}
+          >
             {t("systemPrompt.optimize.submit")}
           </Button>
         </div>
 
-        {/* Before/After Comparison */}
         <div className="grid grid-cols-1 gap-4 lg:grid-cols-2">
-          <Card
-            title={
-              <div className="flex items-center justify-between">
-                <span>{t("systemPrompt.optimize.original")}</span>
-                <Tooltip title={t("systemPrompt.finetune.selectTip")}>
-                  <Button
-                    size="small"
-                    type="text"
-                    icon={<MousePointer2 size={12} />}
-                    onClick={handleContentSelect}
-                    disabled={isOptimizing}
-                  />
-                </Tooltip>
-              </div>
-            }
-            styles={{ body: { padding: 0 } }}
-          >
-            <TextArea
-              ref={contentTextAreaRef}
-              value={mapHeadersToChinese(currentContent)}
-              readOnly
-              rows={10}
-              className="border-0 rounded-none font-mono text-sm"
-              style={{
-                resize: "none",
-                background: "#fafafa",
-                minHeight: 200,
-              }}
-              onSelect={handleContentSelect}
-              onClick={handleContentSelect}
-              onKeyUp={handleContentSelect}
-            />
+          <Card title={t("systemPrompt.optimize.original")}>
+            <Paragraph
+              style={{ whiteSpace: "pre-wrap", minHeight: 320, marginBottom: 0 }}
+            >
+              {currentContent || t("common.none")}
+            </Paragraph>
           </Card>
           <Card title={t("systemPrompt.optimize.optimized")}>
-            {isOptimizing ? (
-              <div className="flex flex-col items-center justify-center py-8 gap-3 min-h-[200px]">
-                <Spin size="medium" />
-                <span className="text-gray-500 text-sm">
-                  {t("systemPrompt.optimize.generating")}
-                </span>
-              </div>
-            ) : (
-              <Paragraph
-                style={{ whiteSpace: "pre-wrap", minHeight: 200, marginBottom: 0 }}
-                className="font-mono text-sm"
-              >
-                {optimizedContent || t("systemPrompt.optimize.empty")}
-              </Paragraph>
-            )}
+            <Paragraph
+              style={{ whiteSpace: "pre-wrap", minHeight: 320, marginBottom: 0 }}
+            >
+              {optimizedContent || t("systemPrompt.optimize.empty")}
+            </Paragraph>
           </Card>
         </div>
       </div>
diff --git a/frontend/app/[locale]/agents/components/agentInfo/PromptTemplateManagerModal.tsx b/frontend/app/[locale]/agents/components/agentInfo/PromptTemplateManagerModal.tsx
index a3c6ebded..24434c0aa 100644
--- a/frontend/app/[locale]/agents/components/agentInfo/PromptTemplateManagerModal.tsx
+++ b/frontend/app/[locale]/agents/components/agentInfo/PromptTemplateManagerModal.tsx
@@ -119,20 +119,16 @@ export default function PromptTemplateManagerModal({
   };
 
   const openTemplateEditor = (template: PromptTemplate, readOnly = false) => {
+    editorForm.setFieldsValue({
+      template_name: template.template_name,
+      description: template.description || "",
+      template_content_zh: template.template_content_zh || createEmptyPromptTemplateContent(),
+      template_content_en: template.template_content_en || createEmptyPromptTemplateContent(),
+    });
     setEditingTemplate(template);
     setEditorSeedTemplate(template);
     setEditorReadOnly(readOnly);
     setEditorOpen(true);
-
-    // Defer form operations until Form is mounted inside the editor modal.
-    queueMicrotask(() => {
-      editorForm.setFieldsValue({
-        template_name: template.template_name,
-        description: template.description || "",
-        template_content_zh: template.template_content_zh || createEmptyPromptTemplateContent(),
-        template_content_en: template.template_content_en || createEmptyPromptTemplateContent(),
-      });
-    });
   };
 
   const closeEditor = () => {
@@ -140,6 +136,7 @@ export default function PromptTemplateManagerModal({
     setEditingTemplate(null);
     setEditorSeedTemplate(null);
     setEditorReadOnly(false);
+    editorForm.resetFields();
   };
 
   const buildPayload = (values: PromptTemplateFormValues): PromptTemplatePayload => {
@@ -449,7 +446,7 @@ export default function PromptTemplateManagerModal({
           : t("businessLogic.config.template.createTitle")}
         width={980}
         centered
-        destroyOnHidden
+        destroyOnClose
         okText={editorReadOnly ? t("common.close") : t("common.save")}
         cancelText={t("common.cancel")}
         cancelButtonProps={editorReadOnly ? { style: { display: "none" } } : undefined}
diff --git a/frontend/app/[locale]/agents/page.tsx b/frontend/app/[locale]/agents/page.tsx
index 2ef7692d4..52d66fe8a 100644
--- a/frontend/app/[locale]/agents/page.tsx
+++ b/frontend/app/[locale]/agents/page.tsx
@@ -12,8 +12,6 @@ import AgentInfoComp from "./components/AgentInfoComp";
 import { useAgentConfigStore } from "@/stores/agentConfigStore";
 import AgentVersionManage from "./AgentVersionManage";
 import AgentSelectorHeader from "./components/AgentSelectorHeader";
-import { searchAgentInfo } from "@/services/agentConfigService";
-import log from "@/lib/logger";
 
 const { Header, Content } = Layout;
 
@@ -23,8 +21,6 @@ export default function AgentSetupOrchestrator() {
   const enterCreateMode = useAgentConfigStore((state) => state.enterCreateMode);
   const reset = useAgentConfigStore((state) => state.reset);
   const setDefaultLlmConfig = useAgentConfigStore((state) => state.setDefaultLlmConfig);
-  const currentAgentId = useAgentConfigStore((state) => state.currentAgentId);
-  const setCurrentAgent = useAgentConfigStore((state) => state.setCurrentAgent);
   const { config } = useConfig();
 
   // Sync default LLM config from load_config
@@ -51,26 +47,6 @@ export default function AgentSetupOrchestrator() {
     }
   }, [searchParams, enterCreateMode]);
 
-  // Handle auto-select agent from URL params (agent_id)
-  useEffect(() => {
-    const agentId = searchParams.get('agent_id');
-    if (agentId && (!currentAgentId || String(currentAgentId) !== agentId)) {
-      const loadAgent = async () => {
-        try {
-          const result = await searchAgentInfo(parseInt(agentId));
-          if (result.success && result.data) {
-            setCurrentAgent(result.data);
-          } else {
-            log.warn("Failed to load agent from URL agent_id:", result.message);
-          }
-        } catch (error) {
-          log.error("Failed to load agent from URL agent_id:", error);
-        }
-      };
-      loadAgent();
-    }
-  }, [searchParams, currentAgentId, setCurrentAgent]);
-
   // Reset agent selection state when leaving the page
   useEffect(() => {
     return () => {
diff --git a/frontend/app/[locale]/chat/components/chatAgentSelector.tsx b/frontend/app/[locale]/chat/components/chatAgentSelector.tsx
index 47449fd08..f7a540172 100644
--- a/frontend/app/[locale]/chat/components/chatAgentSelector.tsx
+++ b/frontend/app/[locale]/chat/components/chatAgentSelector.tsx
@@ -209,8 +209,7 @@ export function ChatAgentSelector({
       }
     }
 
-    const agent = agentId !== null ? agents.find((a: Agent) => a.id === agentId) : null;
-    onAgentSelect(agentId, agent?.greeting_message, agent?.example_questions);
+    onAgentSelect(agentId);
     setIsOpen(false);
 
     // If it's an iframe embedded page, send postMessage to the parent page
diff --git a/frontend/app/[locale]/chat/components/chatAttachment.tsx b/frontend/app/[locale]/chat/components/chatAttachment.tsx
index 69dfbc71a..d12e939cd 100644
--- a/frontend/app/[locale]/chat/components/chatAttachment.tsx
+++ b/frontend/app/[locale]/chat/components/chatAttachment.tsx
@@ -19,7 +19,7 @@ import {
 } from "@/services/storageService";
 import { cn } from "@/lib/utils";
 import { AttachmentItem, ChatAttachmentProps } from "@/types/chat";
-import { FilePreviewDrawer } from "@/components/common/filePreviewDrawer";
+import { FilePreviewDrawer } from "@/components/ui/filePreviewDrawer";
 import { App } from "antd";
 
 // Selected file state for preview drawer
diff --git a/frontend/app/[locale]/chat/components/chatInput.tsx b/frontend/app/[locale]/chat/components/chatInput.tsx
index 512f940e9..bcfc86f6b 100644
--- a/frontend/app/[locale]/chat/components/chatInput.tsx
+++ b/frontend/app/[locale]/chat/components/chatInput.tsx
@@ -15,9 +15,10 @@ import {
 } from "@ant-design/icons";
 
 import { Input } from "@/components/ui/input";
-import { Button, Tooltip } from "antd";
+import { Button } from "antd";
+import { Tooltip } from "@/components/ui/tooltip";
 import { Textarea } from "@/components/ui/textarea";
-import { FilePreviewDrawer } from "@/components/common/filePreviewDrawer";
+import { FilePreviewDrawer } from "@/components/ui/filePreviewDrawer";
 import { conversationService } from "@/services/conversationService";
 import { useConfig } from "@/hooks/useConfig";
 import { extractColorsFromUri } from "@/lib/avatar";
@@ -26,7 +27,7 @@ import { chatConfig } from "@/const/chatConfig";
 import { FilePreview } from "@/types/chat";
 
 import { ChatAgentSelector } from "./chatAgentSelector";
-import { TokenUsageIndicator } from "@/components/common/tokenUsageIndicator";
+import { TokenUsageIndicator } from "@/components/ui/tokenUsageIndicator";
 import { TokenMetrics } from "@/types/chat";
 
 // Get file extension
@@ -134,10 +135,8 @@ interface ChatInputProps {
   attachments?: FilePreview[];
   onAttachmentsChange?: (attachments: FilePreview[]) => void;
   selectedAgentId?: string | null;
-  onAgentSelect?: (agentId: string | null, greetingMessage?: string, exampleQuestions?: string[]) => void;
+  onAgentSelect?: (agentId: string | null) => void;
   latestMetrics?: TokenMetrics | null;
-  agentGreeting?: string | null;
-  agentExampleQuestions?: string[];
 }
 
 export function ChatInput({
@@ -157,8 +156,6 @@ export function ChatInput({
   selectedAgentId = null,
   onAgentSelect,
   latestMetrics = null,
-  agentGreeting = null,
-  agentExampleQuestions = [],
 }: ChatInputProps) {
   const [isRecording, setIsRecording] = useState(false);
   const [recordingStatus, setRecordingStatus] = useState<
@@ -1068,23 +1065,17 @@ export function ChatInput({
       {/* Chat input part */}
       {isInitialMode ? (
         <div className="flex flex-col items-center justify-center h-full w-full max-w-5xl mx-auto mt-[-80px]">
-          <div className="flex flex-col items-center mb-6">
-            <div className="h-16 w-16 rounded-full overflow-hidden mb-4 ring-2 ring-offset-2 ring-slate-100">
-              <img
-                src={avatarUrl}
-                alt={appConfig.appName}
-                className="h-full w-full object-cover"
-              />
-            </div>
-            {agentGreeting ? (
-              <div className="bg-gradient-to-br from-slate-50 to-white rounded-2xl px-6 py-5 max-w-2xl shadow-sm border border-slate-100 mb-4">
-                <p className="text-lg text-gray-800 leading-relaxed text-center">
-                  {agentGreeting}
-                </p>
+          <div className="flex flex-col items-center mb-4">
+            <div className="flex items-center mb-6">
+              <div className="h-16 w-16 rounded-full overflow-hidden mr-4">
+                <img
+                  src={avatarUrl}
+                  alt={appConfig.appName}
+                  className="h-full w-full object-cover"
+                />
               </div>
-            ) : (
               <h1
-                className="text-4xl font-bold bg-clip-text text-transparent mb-2"
+                className="text-4xl font-bold bg-clip-text text-transparent"
                 style={{
                   backgroundImage: (() => {
                     const colors = extractColorsFromUri(
@@ -1098,27 +1089,11 @@ export function ChatInput({
               >
                 {t("chatInput.helloIm", { appName: appConfig.appName })}
               </h1>
-            )}
-            {!agentGreeting && (
-              <p className="text-left text-muted-foreground max-w-2xl mx-auto leading-relaxed">
-                {appConfig.appDescription || t("chatInput.introMessage")}
-              </p>
-            )}
-          </div>
-          {agentExampleQuestions.length > 0 && (
-            <div className="flex flex-col gap-2 max-w-3xl mb-4 w-full">
-              {agentExampleQuestions.map((question, idx) => (
-                <button
-                  key={idx}
-                  onClick={() => onInputChange(question)}
-                  className="w-full px-4 py-3 rounded-xl border border-slate-200 bg-white hover:bg-slate-50 hover:border-slate-300 text-sm text-gray-700 shadow-sm transition-all text-left flex items-center gap-2"
-                >
-                  <span className="text-muted-foreground font-medium">{idx + 1}.</span>
-                  <span>{question}</span>
-                </button>
-              ))}
             </div>
-          )}
+            <p className="text-left text-muted-foreground max-w-2xl mx-auto leading-relaxed">
+              {appConfig.appDescription || t("chatInput.introMessage")}
+            </p>
+          </div>
           <div
             ref={dropAreaRef}
             className="relative w-full max-w-4xl rounded-3xl shadow-sm border border-slate-200 bg-slate-100 overflow-hidden"
diff --git a/frontend/app/[locale]/chat/internal/chatInterface.tsx b/frontend/app/[locale]/chat/internal/chatInterface.tsx
index 9dd9bb847..0f3c99715 100644
--- a/frontend/app/[locale]/chat/internal/chatInterface.tsx
+++ b/frontend/app/[locale]/chat/internal/chatInterface.tsx
@@ -113,14 +113,6 @@ export function ChatInterface() {
 
   // Add agent selection state
   const [selectedAgentId, setSelectedAgentId] = useState<string | null>(null);
-  const [agentGreeting, setAgentGreeting] = useState<string | null>(null);
-  const [agentExampleQuestions, setAgentExampleQuestions] = useState<string[]>([]);
-
-  const handleAgentSelectWithGreeting = (agentId: string | null, greeting?: string, exampleQuestions?: string[]) => {
-    setSelectedAgentId(agentId);
-    setAgentGreeting(greeting || null);
-    setAgentExampleQuestions(exampleQuestions || []);
-  };
 
   useEffect(() => {
     const agentId = sessionStorage.getItem("selectedAgentId");
@@ -1305,11 +1297,9 @@ export function ChatInterface() {
                 currentConversationId={conversationManagement.selectedConversationId ?? undefined}
                 shouldScrollToBottom={shouldScrollToBottom}
                 selectedAgentId={selectedAgentId}
-                onAgentSelect={handleAgentSelectWithGreeting}
+                onAgentSelect={setSelectedAgentId}
                 onCitationHover={clearCompletedIndicator}
                 onScroll={clearCompletedIndicator}
-                agentGreeting={agentGreeting}
-                agentExampleQuestions={agentExampleQuestions}
               />
             </div>
 
diff --git a/frontend/app/[locale]/chat/streaming/chatStreamFinalMessage.tsx b/frontend/app/[locale]/chat/streaming/chatStreamFinalMessage.tsx
index 285225f23..e5809c435 100644
--- a/frontend/app/[locale]/chat/streaming/chatStreamFinalMessage.tsx
+++ b/frontend/app/[locale]/chat/streaming/chatStreamFinalMessage.tsx
@@ -10,7 +10,7 @@ import {
   ThumbsUp,
 } from "lucide-react";
 
-import { MarkdownRenderer } from "@/components/common/markdownRenderer";
+import { MarkdownRenderer } from "@/components/ui/markdownRenderer";
 
 /**
  * Convert custom code tags to standard markdown code fences
@@ -30,7 +30,8 @@ const convertToMarkdownCodeFences = (content: string): string => {
   });
   return content;
 };
-import { Button, Tooltip } from "antd";
+import { Button } from "antd";
+import { Tooltip, TooltipProvider } from "@/components/ui/tooltip";
 import { ChatMessageType, MaxStepsInfo } from "@/types/chat";
 import { chatConfig, Opinion } from "@/const/chatConfig";
 import { conversationService } from "@/services/conversationService";
@@ -353,16 +354,6 @@ function ChatStreamFinalMessageInner({
                 resolveS3Media={Boolean(message.finalAnswer || message.content)}
               />
 
-              {/* Skill-generated file attachments - render below the main content */}
-              {message.attachments && message.attachments.length > 0 && (
-                <div className="mt-3">
-                  <ChatAttachment
-                    attachments={message.attachments as AttachmentItem[]}
-                    onImageClick={onImageClick}
-                  />
-                </div>
-              )}
-
               {/* Button group - only show when hideButtons is false and message is complete */}
               {!hideButtons && message.isComplete && (
                 <div className="flex items-center justify-between mt-3">
@@ -402,7 +393,7 @@ function ChatStreamFinalMessageInner({
 
                   {/* Tool button */}
                   <div className="flex items-center space-x-2 mt-1 justify-end">
-                    <div>
+                    <TooltipProvider>
                       {/* Copy button */}
                       <Tooltip
                         title={
@@ -486,7 +477,7 @@ function ChatStreamFinalMessageInner({
                           {ttsButtonContent.icon}
                         </Button>
                       </Tooltip>
-                    </div>
+                    </TooltipProvider>
                   </div>
                 </div>
               )}
diff --git a/frontend/app/[locale]/chat/streaming/chatStreamHandler.tsx b/frontend/app/[locale]/chat/streaming/chatStreamHandler.tsx
index 8d19cd69f..366d0f035 100644
--- a/frontend/app/[locale]/chat/streaming/chatStreamHandler.tsx
+++ b/frontend/app/[locale]/chat/streaming/chatStreamHandler.tsx
@@ -148,7 +148,6 @@ export const handleStreamResponse = async (
     | typeof chatConfig.contentTypes.SEARCH_CONTENT
     | typeof chatConfig.contentTypes.CARD
     | typeof chatConfig.contentTypes.MEMORY_SEARCH
-    | typeof chatConfig.contentTypes.VERIFICATION
     | typeof chatConfig.contentTypes.PREPROCESS
     | null = null;
   let lastModelOutputIndex = -1; // Track the index of the last model output in currentStep.contents
@@ -796,36 +795,6 @@ export const handleStreamResponse = async (
                   });
                   break;
 
-                case chatConfig.messageTypes.VERIFICATION:
-                  if (!currentStep) {
-                    currentStep = {
-                      id: `step-verification-${Date.now()}-${Math.random()
-                        .toString(36)
-                        .substring(2, 9)}`,
-                      title: "Verification",
-                      content: "",
-                      expanded: true,
-                      contents: [],
-                      metrics: null,
-                      thinking: { content: "", expanded: true },
-                      code: { content: "", expanded: true },
-                      output: { content: "", expanded: true },
-                    };
-                  }
-
-                  currentStep.contents.push({
-                    id: `verification-${Date.now()}-${Math.random()
-                      .toString(36)
-                      .substring(2, 7)}`,
-                    type: chatConfig.messageTypes.VERIFICATION,
-                    subType: "verification",
-                    content: messageContent,
-                    expanded: true,
-                    timestamp: Date.now(),
-                  });
-                  lastContentType = chatConfig.contentTypes.VERIFICATION;
-                  break;
-
                 case chatConfig.messageTypes.MEMORY_SEARCH:
                   // If there's no currentStep, create one
                   if (!currentStep) {
@@ -974,43 +943,6 @@ export const handleStreamResponse = async (
                   }
                   break;
 
-                case chatConfig.messageTypes.SKILL_FILES:
-                  // Process skill-generated file uploads (e.g., documents created by skills)
-                  try {
-                    const skillFilesData = JSON.parse(messageContent);
-                    const skillUploads = skillFilesData.skill_file_uploads || [];
-
-                    // Convert uploads to AttachmentItem format
-                    const newAttachments = skillUploads
-                      .filter((upload: any) => upload.status === "success")
-                      .map((upload: any) => ({
-                        type: "file",
-                        name: upload.file_name || "document",
-                        size: upload.file_size || 0,
-                        object_name: upload.object_name,
-                        url: upload.preview_url || upload.presigned_url || upload.object_name,
-                        contentType: upload.mime_type,
-                      }));
-
-                    if (newAttachments.length > 0) {
-                      setMessages((prev) => {
-                        const newMessages = [...prev];
-                        const lastMsg = newMessages[newMessages.length - 1];
-                        if (lastMsg && lastMsg.role === MESSAGE_ROLES.ASSISTANT) {
-                          const existingAttachments = lastMsg.attachments || [];
-                          newMessages[newMessages.length - 1] = {
-                            ...lastMsg,
-                            attachments: [...existingAttachments, ...newAttachments],
-                          };
-                        }
-                        return newMessages;
-                      });
-                    }
-                  } catch (e) {
-                    log.error(t("chatStreamHandler.streamResponseError"), e);
-                  }
-                  break;
-
                 default:
                   // Process other types of messages
                   break;
diff --git a/frontend/app/[locale]/chat/streaming/chatStreamMain.tsx b/frontend/app/[locale]/chat/streaming/chatStreamMain.tsx
index 27f2649d7..4d0dd8d88 100644
--- a/frontend/app/[locale]/chat/streaming/chatStreamMain.tsx
+++ b/frontend/app/[locale]/chat/streaming/chatStreamMain.tsx
@@ -39,8 +39,6 @@ export function ChatStreamMain({
   onAgentSelect,
   onCitationHover,
   onScroll,
-  agentGreeting,
-  agentExampleQuestions,
 }: ChatStreamMainProps) {
   const { t } = useTranslation();
   // Animation variants for ChatInput
@@ -359,8 +357,6 @@ export function ChatStreamMain({
                         selectedAgentId={selectedAgentId}
                         onAgentSelect={onAgentSelect}
                         latestMetrics={latestMetrics}
-                        agentGreeting={agentGreeting}
-                        agentExampleQuestions={agentExampleQuestions}
                       />
                     </motion.div>
                   </AnimatePresence>
@@ -459,8 +455,6 @@ export function ChatStreamMain({
               selectedAgentId={selectedAgentId}
               onAgentSelect={onAgentSelect}
               latestMetrics={latestMetrics}
-              agentGreeting={agentGreeting}
-              agentExampleQuestions={agentExampleQuestions}
             />
           </motion.div>
         </AnimatePresence>
diff --git a/frontend/app/[locale]/chat/streaming/taskWindow.tsx b/frontend/app/[locale]/chat/streaming/taskWindow.tsx
index 5211c6ab8..665ed8467 100644
--- a/frontend/app/[locale]/chat/streaming/taskWindow.tsx
+++ b/frontend/app/[locale]/chat/streaming/taskWindow.tsx
@@ -9,15 +9,11 @@ import {
   FileText,
   ChevronRight,
   Wrench,
-  CheckCircle2,
-  AlertTriangle,
-  RotateCcw,
-  ShieldCheck,
 } from "lucide-react";
 
 import { ScrollArea } from "@/components/ui/scrollArea";
 import { Button, message as antdMessage } from "antd";
-import { MarkdownRenderer, CodeBlock } from "@/components/common/markdownRenderer";
+import { MarkdownRenderer, CodeBlock } from "@/components/ui/markdownRenderer";
 import { chatConfig } from "@/const/chatConfig";
 import {
   ChatMessageType,
@@ -1154,114 +1150,6 @@ const messageHandlers: MessageHandler[] = [
     render: (_message, _t) => null, // Return null, do not render this type of message
   },
 
-  // verification type processor - layered ReAct self-check status
-  {
-    canHandle: (message) =>
-      message.type === chatConfig.messageTypes.VERIFICATION,
-    render: (message, t) => {
-      let data: any = {};
-      try {
-        data =
-          typeof message.content === "string"
-            ? JSON.parse(message.content)
-            : message.content || {};
-      } catch (_) {
-        data = { message: message.content };
-      }
-
-      const phase = data.phase || "start";
-      const severity = data.severity || "info";
-      const labelMap: Record<string, string> = {
-        start: t("taskWindow.verification.start"),
-        pass: t("taskWindow.verification.pass"),
-        warning: t("taskWindow.verification.warning"),
-        blocked: t("taskWindow.verification.blocked"),
-        repair: t("taskWindow.verification.repair"),
-        final_pass: t("taskWindow.verification.finalPass"),
-        final_fail: t("taskWindow.verification.finalFail"),
-      };
-      const label =
-        labelMap[phase] || data.message || t("taskWindow.verification.start");
-      const rawMessage =
-        typeof data.message === "string" ? data.message.trim() : "";
-      const genericPassMessages = new Set([
-        "自检通过",
-        "最终自检通过",
-        "Self-check passed",
-        "Final self-check passed",
-      ]);
-      const fallbackReason = (() => {
-        if (data.event === "tool_precheck") {
-          return "动作非空、参数和语法已检查";
-        }
-        if (data.event === "retrieval") {
-          return "检索结果和错误信号已检查";
-        }
-        if (data.event === "handoff") {
-          return "子任务返回内容已检查";
-        }
-        if (data.event === "tool_result" || data.event === "code_execution") {
-          return "执行结果非空，未发现未处理错误";
-        }
-        if (data.event === "final_answer") {
-          return phase === "final_pass"
-            ? "答案完整、格式正常，未发现未处理错误"
-            : "答案非空、无内部标记、无占位符";
-        }
-        return "未发现阻断问题";
-      })();
-      const displayMessage =
-        (phase === "pass" || phase === "final_pass") &&
-        (!rawMessage || genericPassMessages.has(rawMessage))
-          ? `${rawMessage || label}：${fallbackReason}`
-          : rawMessage || label;
-      const tone =
-        phase === "final_pass" || phase === "pass"
-          ? "#047857"
-          : phase === "blocked" ||
-              phase === "final_fail" ||
-              severity === "blocking"
-            ? "#dc2626"
-            : phase === "repair" || phase === "warning"
-              ? "#d97706"
-              : "#2563eb";
-      const Icon =
-        phase === "final_pass" || phase === "pass"
-          ? CheckCircle2
-          : phase === "repair"
-            ? RotateCcw
-            : phase === "blocked" || phase === "final_fail"
-              ? AlertTriangle
-              : ShieldCheck;
-
-      return (
-        <div
-          style={{
-            display: "flex",
-            alignItems: "center",
-            gap: "0.5rem",
-            fontFamily:
-              "-apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, Helvetica, Arial, sans-serif",
-            fontSize: "0.875rem",
-            lineHeight: 1.5,
-            color: tone,
-            fontWeight: 500,
-            borderRadius: "0.25rem",
-            paddingTop: "0.5rem",
-          }}
-        >
-          <Icon size={16} />
-          <span>{displayMessage}</span>
-          {typeof data.score === "number" && (
-            <span style={{ opacity: 0.72 }}>
-              {Math.round(data.score * 100)}%
-            </span>
-          )}
-        </div>
-      );
-    },
-  },
-
   // error type processor - error information
   {
     canHandle: (message) => message.type === "error",
diff --git a/frontend/app/[locale]/knowledges/KnowledgeBaseConfiguration.tsx b/frontend/app/[locale]/knowledges/KnowledgeBaseConfiguration.tsx
index 26cd438a5..09fe5c962 100644
--- a/frontend/app/[locale]/knowledges/KnowledgeBaseConfiguration.tsx
+++ b/frontend/app/[locale]/knowledges/KnowledgeBaseConfiguration.tsx
@@ -157,14 +157,7 @@ function DataConfig({ isActive }: DataConfigProps) {
   const { t } = useTranslation();
   const { message } = App.useApp();
   const { confirm } = useConfirmModal();
-  const {
-    modelConfig,
-    data: configData,
-    invalidateConfig,
-    config,
-    updateConfig,
-    saveConfig,
-  } = useConfig();
+  const { modelConfig, data: configData, invalidateConfig, config, updateConfig, saveConfig } = useConfig();
   const { token } = theme.useToken();
 
   // Get available embedding models for knowledge base creation
@@ -184,10 +177,7 @@ function DataConfig({ isActive }: DataConfigProps) {
       setDataMateUrl("");
     }
 
-    if (
-      configData?.app &&
-      typeof configData.app.modelEngineEnabled === "boolean"
-    ) {
+    if (configData?.app && typeof configData.app.modelEngineEnabled === "boolean") {
       setModelEngineEnabled(configData.app.modelEngineEnabled);
     }
 
@@ -224,11 +214,8 @@ function DataConfig({ isActive }: DataConfigProps) {
   // Create mode state
   const [isCreatingMode, setIsCreatingMode] = useState(false);
   const [newKbName, setNewKbName] = useState("");
-  const [newKbIngroupPermission, setNewKbIngroupPermission] =
-    useState<string>("READ_ONLY");
+  const [newKbIngroupPermission, setNewKbIngroupPermission] = useState<string>("READ_ONLY");
   const [newKbGroupIds, setNewKbGroupIds] = useState<number[]>([]);
-  const [newKbPreserveSourceFile, setNewKbPreserveSourceFile] =
-    useState<boolean>(true);
   const [newKbEmbeddingModel, setNewKbEmbeddingModel] = useState<string>(""); // Selected embedding model for new KB
   const [uploadFiles, setUploadFiles] = useState<File[]>([]);
   const [hasClickedUpload, setHasClickedUpload] = useState(false);
@@ -282,8 +269,7 @@ function DataConfig({ isActive }: DataConfigProps) {
       const modelType = isMultimodal ? "multi_embedding" : "embedding";
       return availableEmbeddingModels.find(
         (model) =>
-          model.displayName === normalizedDisplayName &&
-          model.type === modelType
+          model.displayName === normalizedDisplayName && model.type === modelType
       )?.id;
     },
     [availableEmbeddingModels]
@@ -294,13 +280,8 @@ function DataConfig({ isActive }: DataConfigProps) {
     const singleEmbeddingModelName = modelConfig?.embedding?.modelName?.trim();
     const multiEmbeddingModelName =
       modelConfig?.multiEmbedding?.modelName?.trim();
-    setShowEmbeddingWarning(
-      !singleEmbeddingModelName && !multiEmbeddingModelName
-    );
-  }, [
-    modelConfig?.embedding?.modelName,
-    modelConfig?.multiEmbedding?.modelName,
-  ]);
+    setShowEmbeddingWarning(!singleEmbeddingModelName && !multiEmbeddingModelName);
+  }, [modelConfig?.embedding?.modelName, modelConfig?.multiEmbedding?.modelName]);
 
   // Add event listener for selecting new knowledge base
   useEffect(() => {
@@ -717,11 +698,9 @@ function DataConfig({ isActive }: DataConfigProps) {
     setNewKbName(defaultName);
     setNewKbIngroupPermission("READ_ONLY");
     setNewKbGroupIds([]);
-    setNewKbPreserveSourceFile(true);
     // Set default embedding model:
     // 1) configured embedding model, 2) configured multimodal model, 3) first available option.
-    const configEmbeddingModel =
-      modelConfig?.embedding?.modelName?.trim() || "";
+    const configEmbeddingModel = modelConfig?.embedding?.modelName?.trim() || "";
     const configMultiEmbeddingModel =
       modelConfig?.multiEmbedding?.modelName?.trim() || "";
     const preferredModel = [
@@ -736,10 +715,7 @@ function DataConfig({ isActive }: DataConfigProps) {
     );
     const defaultModel =
       (preferredModel &&
-        toEmbeddingModelOptionValue(
-          preferredModel.modelName,
-          preferredModel.type
-        )) ||
+        toEmbeddingModelOptionValue(preferredModel.modelName, preferredModel.type)) ||
       (availableEmbeddingModels[0]
         ? toEmbeddingModelOptionValue(
             availableEmbeddingModels[0].displayName,
@@ -819,8 +795,7 @@ function DataConfig({ isActive }: DataConfigProps) {
           newKbIngroupPermission,
           newKbGroupIds,
           parsedSelectedModel.displayName,
-          isMultimodal,
-          newKbPreserveSourceFile
+          isMultimodal
         );
 
         if (!newKB) {
@@ -1040,10 +1015,7 @@ function DataConfig({ isActive }: DataConfigProps) {
               onKnowledgeBaseUpdate={(updatedKnowledgeBase) => {
                 // Update knowledge base in list and active knowledge base
                 updateKnowledgeBase(updatedKnowledgeBase);
-                if (
-                  kbState.activeKnowledgeBase &&
-                  kbState.activeKnowledgeBase.id === updatedKnowledgeBase.id
-                ) {
+                if (kbState.activeKnowledgeBase && kbState.activeKnowledgeBase.id === updatedKnowledgeBase.id) {
                   setActiveKnowledgeBase(updatedKnowledgeBase);
                 }
               }}
@@ -1090,8 +1062,6 @@ function DataConfig({ isActive }: DataConfigProps) {
                 onIngroupPermissionChange={setNewKbIngroupPermission}
                 selectedGroupIds={newKbGroupIds}
                 onSelectedGroupIdsChange={setNewKbGroupIds}
-                preserveSourceFile={newKbPreserveSourceFile}
-                onPreserveSourceFileChange={setNewKbPreserveSourceFile}
                 // Embedding model for create mode
                 availableEmbeddingModels={availableEmbeddingModels}
                 selectedEmbeddingModel={newKbEmbeddingModel}
@@ -1132,30 +1102,25 @@ function DataConfig({ isActive }: DataConfigProps) {
                 isNewlyCreatedAndWaiting={isNewlyCreatedAndWaiting}
                 onChunkCountChange={() => {
                   // Trigger knowledge base list update to refresh chunk count
-                  knowledgeBasePollingService.triggerKnowledgeBaseListUpdate(
-                    true
-                  );
+                  knowledgeBasePollingService.triggerKnowledgeBaseListUpdate(true);
                 }}
-                permission={kbState.activeKnowledgeBase?.permission}
+                  permission={kbState.activeKnowledgeBase?.permission}
                 summaryFrequency={kbState.activeKnowledgeBase?.summaryFrequency}
                 onSummaryFrequencyChange={(frequency) => {
                   if (kbState.activeKnowledgeBase) {
-                    knowledgeBaseService
-                      .updateSummaryFrequency(
-                        kbState.activeKnowledgeBase.id,
-                        frequency
-                      )
-                      .then(() => {
-                        const updatedKB: KnowledgeBase = {
-                          ...kbState.activeKnowledgeBase!,
-                          summaryFrequency: frequency,
-                        };
-                        updateKnowledgeBase(updatedKB);
-                        setActiveKnowledgeBase(updatedKB);
-                      })
-                      .catch((error) => {
-                        log.error("Failed to update summary frequency:", error);
-                      });
+                    knowledgeBaseService.updateSummaryFrequency(
+                      kbState.activeKnowledgeBase.id,
+                      frequency
+                    ).then(() => {
+                      const updatedKB: KnowledgeBase = {
+                        ...kbState.activeKnowledgeBase!,
+                        summaryFrequency: frequency
+                      };
+                      updateKnowledgeBase(updatedKB);
+                      setActiveKnowledgeBase(updatedKB);
+                    }).catch((error) => {
+                      log.error("Failed to update summary frequency:", error);
+                    });
                   }
                 }}
                 // Upload related props
diff --git a/frontend/app/[locale]/knowledges/components/document/DocumentList.tsx b/frontend/app/[locale]/knowledges/components/document/DocumentList.tsx
index 4f75fd66e..3590db86b 100644
--- a/frontend/app/[locale]/knowledges/components/document/DocumentList.tsx
+++ b/frontend/app/[locale]/knowledges/components/document/DocumentList.tsx
@@ -10,16 +10,9 @@ import { useTranslation } from "react-i18next";
 import { Input, Button, App, Select } from "antd";
 const { TextArea } = Input;
 import { InfoCircleFilled } from "@ant-design/icons";
-import {
-  BookText,
-  Pilcrow,
-  PencilRuler,
-  Eye,
-  Glasses,
-  CircleOff,
-} from "lucide-react";
-import { MarkdownRenderer } from "@/components/common/markdownRenderer";
-import { FilePreviewDrawer } from "@/components/common/filePreviewDrawer";
+import { BookText, Pilcrow, PencilRuler, Eye, Glasses, CircleOff } from "lucide-react";
+import { MarkdownRenderer } from "@/components/ui/markdownRenderer";
+import { FilePreviewDrawer } from "@/components/ui/filePreviewDrawer";
 
 import {
   UI_CONFIG,
@@ -28,10 +21,7 @@ import {
   LAYOUT,
   DOCUMENT_STATUS,
 } from "@/const/knowledgeBase";
-import {
-  SUMMARY_FREQUENCY_OPTIONS_API,
-  FrequencyOption,
-} from "@/const/scheduler";
+import { SUMMARY_FREQUENCY_OPTIONS_API, FrequencyOption } from "@/const/scheduler";
 import knowledgeBaseService from "@/services/knowledgeBaseService";
 import { modelService } from "@/services/modelService";
 import { getTenantDefaultGroupId } from "@/services/groupService";
@@ -93,9 +83,7 @@ interface DocumentListProps {
   isMultimodal?: boolean;
   onMultimodalChange?: (value: boolean) => void;
   permission?: string; // User's permission for this knowledge base (READ_ONLY, EDIT, etc.)
-  preserveSourceFile?: boolean;
-  onPreserveSourceFileChange?: (value: boolean) => void;
-
+  
   // Auto-summary frequency
   summaryFrequency?: string | null;
   onSummaryFrequencyChange?: (frequency: string | null) => void;
@@ -144,9 +132,7 @@ const DocumentListContainer = forwardRef<DocumentListRef, DocumentListProps>(
       isMultimodal = false,
       onMultimodalChange,
       permission,
-      preserveSourceFile = true,
-      onPreserveSourceFileChange,
-
+      
       // Auto-summary frequency
       summaryFrequency,
       onSummaryFrequencyChange,
@@ -254,16 +240,14 @@ const DocumentListContainer = forwardRef<DocumentListRef, DocumentListProps>(
     const [showDetail, setShowDetail] = React.useState(false);
     const [showChunk, setShowChunk] = React.useState(false);
     const [summary, setSummary] = useState("");
-    const [isSummarizing, setIsSummarizing] = useState(false);
-    const [isEditing, setIsEditing] = useState(false);
-    const [isSaving, setIsSaving] = useState(false);
-    const [selectedModel, setSelectedModel] = useState<number>(0);
-    const [availableModels, setAvailableModels] = useState<ModelOption[]>([]);
-    const [isLoadingModels, setIsLoadingModels] = useState(false);
-    const [frequencyOptions, setFrequencyOptions] = useState<FrequencyOption[]>(
-      []
-    );
-    const { t } = useTranslation();
+const [isSummarizing, setIsSummarizing] = useState(false);
+  const [isEditing, setIsEditing] = useState(false);
+  const [isSaving, setIsSaving] = useState(false);
+  const [selectedModel, setSelectedModel] = useState<number>(0);
+  const [availableModels, setAvailableModels] = useState<ModelOption[]>([]);
+  const [isLoadingModels, setIsLoadingModels] = useState(false);
+  const [frequencyOptions, setFrequencyOptions] = useState<FrequencyOption[]>([]);
+  const { t } = useTranslation();
     const isDataMate = (knowledgeBaseSource || "").toLowerCase() === "datamate";
 
     // Determine if user has read-only permission
@@ -287,9 +271,7 @@ const DocumentListContainer = forwardRef<DocumentListRef, DocumentListProps>(
         label: (
           <span className="flex items-center gap-2">
             {getPermissionIcon("READ_ONLY")}
-            <span>
-              {t("tenantResources.knowledgeBase.permission.READ_ONLY")}
-            </span>
+            <span>{t("tenantResources.knowledgeBase.permission.READ_ONLY")}</span>
           </span>
         ),
       },
@@ -359,38 +341,33 @@ const DocumentListContainer = forwardRef<DocumentListRef, DocumentListProps>(
     };
 
     // Load frequency options from backend API
-    useEffect(() => {
-      const loadFrequencyOptions = async () => {
-        if (showDetail && frequencyOptions.length === 0) {
-          try {
-            const response = await fetch(SUMMARY_FREQUENCY_OPTIONS_API);
-            const data = await response.json();
-            setFrequencyOptions(data.options || []);
-          } catch (error) {
-            log.error("Failed to load frequency options:", error);
-            // Fallback to default options if API fails
-            setFrequencyOptions([
-              {
-                value: "disabled",
-                label: t("knowledgeBase.tag.autoSummary.off"),
-              },
-            ]);
-          }
+  useEffect(() => {
+    const loadFrequencyOptions = async () => {
+      if (showDetail && frequencyOptions.length === 0) {
+        try {
+          const response = await fetch(SUMMARY_FREQUENCY_OPTIONS_API);
+          const data = await response.json();
+          setFrequencyOptions(data.options || []);
+        } catch (error) {
+          log.error("Failed to load frequency options:", error);
+          // Fallback to default options if API fails
+          setFrequencyOptions([
+            { value: "disabled", label: t("knowledgeBase.tag.autoSummary.off") },
+          ]);
         }
-      };
-      loadFrequencyOptions();
-    }, [showDetail, frequencyOptions.length, t]);
+      }
+    };
+    loadFrequencyOptions();
+  }, [showDetail, frequencyOptions.length, t]);
 
-    // Load available models when showing detail
-    useEffect(() => {
-      const loadModels = async () => {
-        if (showDetail && availableModels.length === 0) {
+  // Load available models when showing detail
+  useEffect(() => {
+    const loadModels = async () => {
+      if (showDetail && availableModels.length === 0) {
           setIsLoadingModels(true);
           try {
             const models = await modelService.getLLMModels();
-            setAvailableModels(
-              models.filter((m) => m.connect_status === "available")
-            );
+            setAvailableModels(models.filter(m => m.connect_status === "available"));
 
             // Determine initial selection order:
             // 1) Knowledge base's own configured model (server-side config)
@@ -555,16 +532,10 @@ const DocumentListContainer = forwardRef<DocumentListRef, DocumentListProps>(
         <div
           className={`${LAYOUT.KB_HEADER_PADDING} border-b border-gray-200 flex-shrink-0 flex items-center ${titleBarHeightClass}`}
         >
-          <div
-            className="flex items-center justify-between w-full"
-            style={{ width: "100%" }}
-          >
-            <div className="flex items-center" style={{ width: "100%" }}>
+          <div className="flex items-center justify-between w-full" style={{ width: "100%" }}>
+            <div className="flex items-center" style={{width: "100%"}}>
               {isCreatingMode ? (
-                <div
-                  className="flex items-center flex-1"
-                  style={{ width: "100%" }}
-                >
+                <div className="flex items-center flex-1" style={{ width: "100%" }}>
                   <Input
                     value={knowledgeBaseName}
                     onChange={(e) =>
@@ -580,29 +551,14 @@ const DocumentListContainer = forwardRef<DocumentListRef, DocumentListProps>(
                     }
                   />
                   {/* Right-aligned container for dropdowns */}
-                  <div
-                    className="flex items-center ml-auto justify-end"
-                    style={{
-                      gap: "12px",
-                      justifyContent: "flex-end",
-                      alignItems: "flex-end",
-                      width: "100%",
-                    }}
-                  >
+                  <div className="flex items-center ml-auto justify-end" style={{ gap: "12px", justifyContent: "flex-end", alignItems: "flex-end", width: "100%" }}>
                     {/* Embedding model selection - first position in create mode */}
                     {isCreatingMode && onEmbeddingModelChange && (
                       <Select
                         value={selectedEmbeddingModel}
                         onChange={onEmbeddingModelChange}
-                        style={{
-                          minWidth: 200,
-                          justifyContent: "center",
-                          alignItems: "flex-end",
-                        }}
-                        placeholder={
-                          t("knowledgeBase.create.embeddingModelPlaceholder") ||
-                          "Select embedding model"
-                        }
+                        style={{ minWidth: 200, justifyContent: "center", alignItems: "flex-end" }}
+                        placeholder={t("knowledgeBase.create.embeddingModelPlaceholder") || "Select embedding model"}
                         allowClear={false}
                         options={[
                           {
@@ -618,9 +574,7 @@ const DocumentListContainer = forwardRef<DocumentListRef, DocumentListProps>(
                           {
                             label: t("modelConfig.option.multiEmbeddingModel"),
                             options: embeddingModelsForOptions
-                              .filter(
-                                (model) => model.type === "multi_embedding"
-                              )
+                              .filter((model) => model.type === "multi_embedding")
                               .map((model) => ({
                                 value: `${model.displayName}::${model.type}`,
                                 label: model.displayName,
@@ -636,14 +590,8 @@ const DocumentListContainer = forwardRef<DocumentListRef, DocumentListProps>(
                         mode="multiple"
                         value={isGroupSelectDisabled ? [] : selectedGroupIds}
                         onChange={onSelectedGroupIdsChange}
-                        style={{
-                          minWidth: 200,
-                          justifyContent: "center",
-                          alignItems: "flex-end",
-                        }}
-                        placeholder={t(
-                          "knowledgeBase.create.permission.groupPlaceholder"
-                        )}
+                        style={{ minWidth: 200, justifyContent: "center", alignItems: "flex-end" }}
+                        placeholder={t("knowledgeBase.create.permission.groupPlaceholder")}
                         options={groupOptions}
                         maxTagCount={2}
                         allowClear
@@ -655,39 +603,11 @@ const DocumentListContainer = forwardRef<DocumentListRef, DocumentListProps>(
                       <Select
                         value={ingroupPermission}
                         onChange={onIngroupPermissionChange}
-                        style={{
-                          width: 160,
-                          justifyContent: "center",
-                          alignItems: "flex-end",
-                        }}
-                        placeholder={t(
-                          "knowledgeBase.ingroup.permission.DEFAULT"
-                        )}
+                        style={{ width: 160, justifyContent: "center", alignItems: "flex-end" }}
+                        placeholder={t("knowledgeBase.ingroup.permission.DEFAULT")}
                         options={permissionOptions}
                       />
                     </Can>
-                    {onPreserveSourceFileChange && (
-                      <Select
-                        value={preserveSourceFile}
-                        onChange={onPreserveSourceFileChange}
-                        style={{
-                          width: 200,
-                          justifyContent: "center",
-                          alignItems: "flex-end",
-                        }}
-                        allowClear={false}
-                        options={[
-                          {
-                            value: true,
-                            label: t("knowledgeBase.create.preserveSourceFile"),
-                          },
-                          {
-                            value: false,
-                            label: t("knowledgeBase.tag.noPreserveSourceFile"),
-                          },
-                        ]}
-                      />
-                    )}
                   </div>
                 </div>
               ) : (
@@ -779,7 +699,7 @@ const DocumentListContainer = forwardRef<DocumentListRef, DocumentListProps>(
               />
             </div>
           ) : showDetail ? (
-            <div className="px-8 py-4 h-full flex flex-col">
+<div className="px-8 py-4 h-full flex flex-col">
               <div className="flex items-center justify-between mb-5">
                 <span className="font-bold text-lg">
                   {t("document.summary.title")}
@@ -817,14 +737,13 @@ const DocumentListContainer = forwardRef<DocumentListRef, DocumentListProps>(
                       }}
                       disabled={isReadOnlyMode}
                       style={{ width: 85 }}
-                      placeholder={t("knowledgeBase.tag.autoSummary.off")}
-                      options={frequencyOptions.map((opt) => ({
-                        value: opt.value,
-                        label:
-                          opt.value === "disabled"
-                            ? t("knowledgeBase.tag.autoSummary.off")
+placeholder={t("knowledgeBase.tag.autoSummary.off")}
+                      options={frequencyOptions.map(opt => ({
+                          value: opt.value,
+                          label: opt.value === "disabled" 
+                            ? t("knowledgeBase.tag.autoSummary.off") 
                             : opt.label,
-                      }))}
+                        }))}
                     />
                   </div>
                   <Button
@@ -832,10 +751,7 @@ const DocumentListContainer = forwardRef<DocumentListRef, DocumentListProps>(
                     onClick={handleAutoSummary}
                     loading={isSummarizing}
                     disabled={
-                      !knowledgeBaseName ||
-                      isSummarizing ||
-                      !selectedModel ||
-                      isReadOnlyMode
+                      !knowledgeBaseName || isSummarizing || !selectedModel || isReadOnlyMode
                     }
                   >
                     {t("document.button.autoSummary")}
@@ -843,59 +759,59 @@ const DocumentListContainer = forwardRef<DocumentListRef, DocumentListProps>(
                 </div>
               </div>
               <div className="flex-1 min-h-0 mb-5 border border-gray-300 rounded-md overflow-auto">
-                {isReadOnlyMode ? (
-                  <div className="p-5 text-lg leading-[1.7] whitespace-pre-wrap">
-                    <MarkdownRenderer content={summary} />
-                  </div>
-                ) : isSummarizing ? (
-                  <div className="p-5 text-lg leading-[1.7] whitespace-pre-wrap">
-                    <MarkdownRenderer content={summary} />
-                  </div>
-                ) : (
-                  <div
-                    className="w-full h-full cursor-text hover:bg-gray-50"
-                    onClick={() => {
-                      if (!isSummarizing) {
-                        setIsEditing(true);
-                      }
-                    }}
-                  >
-                    {isEditing ? (
-                      <TextArea
-                        value={summary}
-                        onChange={(e) => setSummary(e.target.value)}
-                        onBlur={() => setIsEditing(false)}
-                        className="w-full h-full border-0 resize-none focus:shadow-none"
-                        style={{
-                          height: "100%",
-                          padding: "20px",
-                          fontSize: "18px",
-                          lineHeight: "1.7",
-                          whiteSpace: "pre-wrap",
-                        }}
-                        autoFocus
-                        placeholder={t("document.summary.placeholder")}
-                      />
-                    ) : (
-                      <div className="p-5 text-lg leading-[1.7] whitespace-pre-wrap">
-                        <MarkdownRenderer content={summary} />
-                      </div>
-                    )}
-                  </div>
-                )}
+                  {isReadOnlyMode ? (
+                    <div className="p-5 text-lg leading-[1.7] whitespace-pre-wrap">
+                      <MarkdownRenderer content={summary} />
+                    </div>
+                  ) : isSummarizing ? (
+                    <div className="p-5 text-lg leading-[1.7] whitespace-pre-wrap">
+                      <MarkdownRenderer content={summary} />
+                    </div>
+                  ) : (
+                    <div
+                          className="w-full h-full cursor-text hover:bg-gray-50"
+                      onClick={() => {
+                        if (!isSummarizing) {
+                          setIsEditing(true);
+                        }
+                      }}
+                    >
+                      {isEditing ? (
+                        <TextArea
+                          value={summary}
+                          onChange={(e) => setSummary(e.target.value)}
+                          onBlur={() => setIsEditing(false)}
+                              className="w-full h-full border-0 resize-none focus:shadow-none"
+                          style={{
+                            height: '100%',
+                            padding: '20px',
+                            fontSize: '18px',
+                            lineHeight: '1.7',
+                            whiteSpace: 'pre-wrap',
+                          }}
+                          autoFocus
+                          placeholder={t("document.summary.placeholder")}
+                        />
+                      ) : (
+                              <div className="p-5 text-lg leading-[1.7] whitespace-pre-wrap">
+                                <MarkdownRenderer content={summary} />
+                              </div>
+                      )}
+                    </div>
+                  )}
               </div>
               <div className="flex gap-3 justify-end">
-                {!isReadOnlyMode && (
-                  <Button
-                    type="primary"
-                    size="large"
-                    onClick={handleSaveSummary}
-                    loading={isSaving}
-                    disabled={!summary || isSaving}
-                  >
-                    {t("common.save")}
-                  </Button>
-                )}
+                  {!isReadOnlyMode && (
+                    <Button
+                      type="primary"
+                      size="large"
+                      onClick={handleSaveSummary}
+                      loading={isSaving}
+                      disabled={!summary || isSaving}
+                    >
+                      {t("common.save")}
+                    </Button>
+                  )}
                 <Button
                   size="large"
                   onClick={() => {
@@ -1028,12 +944,9 @@ const DocumentListContainer = forwardRef<DocumentListRef, DocumentListProps>(
                           <div className="flex gap-2">
                             <button
                               onClick={() => {
-                                const objectName =
-                                  extractObjectNameFromUrl(doc.id) || undefined;
+                                const objectName =  extractObjectNameFromUrl(doc.id) || undefined;
                                 if (!objectName) {
-                                  message.warning(
-                                    t("filePreview.previewFailed")
-                                  );
+                                  message.warning(t("filePreview.previewFailed"));
                                   return;
                                 }
 
@@ -1118,7 +1031,6 @@ const DocumentListContainer = forwardRef<DocumentListRef, DocumentListProps>(
             fileName={selectedFile.fileName}
             fileType={selectedFile.fileType}
             fileSize={selectedFile.fileSize}
-            previewContext="knowledgeBase"
             onClose={() => setSelectedFile(null)}
           />
         )}
diff --git a/frontend/app/[locale]/knowledges/components/knowledge/KnowledgeBaseList.tsx b/frontend/app/[locale]/knowledges/components/knowledge/KnowledgeBaseList.tsx
index 53758147b..186b8e36c 100644
--- a/frontend/app/[locale]/knowledges/components/knowledge/KnowledgeBaseList.tsx
+++ b/frontend/app/[locale]/knowledges/components/knowledge/KnowledgeBaseList.tsx
@@ -3,7 +3,7 @@ import { useTranslation } from "react-i18next";
 
 import log from "@/lib/logger";
 
-import { Button, Input, Select, Tooltip } from "antd";
+import { Button, Input, Select } from "antd";
 import {
   SyncOutlined,
   PlusOutlined,
@@ -19,6 +19,7 @@ import {
   SquarePen,
   CircleOff,
 } from "lucide-react";
+import { Tooltip } from "@/components/ui/tooltip";
 import { Can } from "@/components/permission/Can";
 import { useAuthorizationContext } from "@/components/providers/AuthorizationProvider";
 import { useGroupList } from "@/hooks/group/useGroupList";
@@ -638,13 +639,6 @@ const KnowledgeBaseList: React.FC<KnowledgeBaseListProps> = ({
                                   </span>
                                 ))}
                             </Can>
-                            {kb.preserve_source_file === false && (
-                              <span
-                                className={`inline-flex items-center ${KB_LAYOUT.TAG_PADDING} ${KB_LAYOUT.TAG_ROUNDED} ${KB_LAYOUT.TAG_TEXT} ${KB_LAYOUT.SECOND_ROW_TAG_MARGIN} bg-blue-100 text-blue-800 border border-blue-200 mr-1`}
-                              >
-                                {t("knowledgeBase.tag.noPreserveSourceFile")}
-                              </span>
-                            )}
                           </>
                         )}
                       </div>
diff --git a/frontend/app/[locale]/knowledges/contexts/DocumentContext.tsx b/frontend/app/[locale]/knowledges/contexts/DocumentContext.tsx
index 668436765..63d9ad1c2 100644
--- a/frontend/app/[locale]/knowledges/contexts/DocumentContext.tsx
+++ b/frontend/app/[locale]/knowledges/contexts/DocumentContext.tsx
@@ -1,14 +1,7 @@
-"use client";
+"use client"
 
-import {
-  createContext,
-  useReducer,
-  useContext,
-  ReactNode,
-  useCallback,
-  useEffect,
-} from "react";
-import { useTranslation } from "react-i18next";
+import { createContext, useReducer, useContext, ReactNode, useCallback, useEffect } from "react";
+import { useTranslation } from 'react-i18next';
 
 import { DOCUMENT_ACTION_TYPES } from "@/const/knowledgeBase";
 import knowledgeBaseService from "@/services/knowledgeBaseService";
@@ -16,20 +9,17 @@ import { DocumentState, DocumentAction } from "@/types/knowledgeBase";
 import log from "@/lib/logger";
 
 // Reducer function
-const documentReducer = (
-  state: DocumentState,
-  action: DocumentAction
-): DocumentState => {
+const documentReducer = (state: DocumentState, action: DocumentAction): DocumentState => {
   switch (action.type) {
     case DOCUMENT_ACTION_TYPES.FETCH_SUCCESS:
       return {
         ...state,
         documentsMap: {
           ...state.documentsMap,
-          [action.payload.kbId]: action.payload.documents,
+          [action.payload.kbId]: action.payload.documents
         },
         isLoadingDocuments: false,
-        error: null,
+        error: null
       };
     case DOCUMENT_ACTION_TYPES.SELECT_DOCUMENT:
       // Toggle document selection
@@ -38,48 +28,41 @@ const documentReducer = (
       return {
         ...state,
         selectedIds: isSelected
-          ? state.selectedIds.filter((id) => id !== docId)
-          : [...state.selectedIds, docId],
+          ? state.selectedIds.filter(id => id !== docId)
+          : [...state.selectedIds, docId]
       };
     case DOCUMENT_ACTION_TYPES.SELECT_DOCUMENTS:
       return {
         ...state,
-        selectedIds: action.payload,
+        selectedIds: action.payload
       };
     case DOCUMENT_ACTION_TYPES.SELECT_ALL:
       const { kbId, selected } = action.payload;
       const documents = state.documentsMap[kbId] || [];
-
+      
       // If selected is true, add all document IDs, else remove all
       const newSelectedIds = selected
-        ? [
-            ...new Set([
-              ...state.selectedIds,
-              ...documents.map((doc) => doc.id),
-            ]),
-          ]
-        : state.selectedIds.filter(
-            (id) => !documents.some((doc) => doc.id === id)
-          );
-
+        ? [...new Set([...state.selectedIds, ...documents.map(doc => doc.id)])]
+        : state.selectedIds.filter(id => !documents.some(doc => doc.id === id));
+      
       return {
         ...state,
-        selectedIds: newSelectedIds,
+        selectedIds: newSelectedIds
       };
     case DOCUMENT_ACTION_TYPES.SET_UPLOAD_FILES:
       return {
         ...state,
-        uploadFiles: action.payload,
+        uploadFiles: action.payload
       };
     case DOCUMENT_ACTION_TYPES.SET_UPLOADING:
       return {
         ...state,
-        isUploading: action.payload,
+        isUploading: action.payload
       };
     case DOCUMENT_ACTION_TYPES.SET_LOADING_DOCUMENTS:
       return {
         ...state,
-        isLoadingDocuments: action.payload,
+        isLoadingDocuments: action.payload
       };
     case DOCUMENT_ACTION_TYPES.DELETE_DOCUMENT:
       const { kbId: deleteKbId, docId: deleteDocId } = action.payload;
@@ -88,39 +71,36 @@ const documentReducer = (
         ...state,
         documentsMap: {
           ...state.documentsMap,
-          [deleteKbId]:
-            state.documentsMap[deleteKbId]?.filter(
-              (doc) => doc.id !== deleteDocId
-            ) || [],
+          [deleteKbId]: state.documentsMap[deleteKbId]?.filter(doc => doc.id !== deleteDocId) || []
         },
-        selectedIds: state.selectedIds.filter((id) => id !== deleteDocId),
+        selectedIds: state.selectedIds.filter(id => id !== deleteDocId)
       };
     case DOCUMENT_ACTION_TYPES.SET_LOADING_KB_ID:
       const { kbId: loadingKbId, isLoading } = action.payload;
       const newLoadingKbIds = new Set(state.loadingKbIds);
-
+      
       if (isLoading) {
         newLoadingKbIds.add(loadingKbId);
       } else {
         newLoadingKbIds.delete(loadingKbId);
       }
-
+      
       return {
         ...state,
-        loadingKbIds: newLoadingKbIds,
+        loadingKbIds: newLoadingKbIds
       };
     case DOCUMENT_ACTION_TYPES.CLEAR_DOCUMENTS:
       return {
         ...state,
         documentsMap: {},
         selectedIds: [],
-        error: null,
+        error: null
       };
     case DOCUMENT_ACTION_TYPES.ERROR:
       return {
         ...state,
         error: action.payload,
-        isLoadingDocuments: false,
+        isLoadingDocuments: false
       };
     default:
       return state;
@@ -131,16 +111,8 @@ const documentReducer = (
 export const DocumentContext = createContext<{
   state: DocumentState;
   dispatch: React.Dispatch<DocumentAction>;
-  fetchDocuments: (
-    kbId: string,
-    forceRefresh?: boolean,
-    kbSource?: string
-  ) => Promise<void>;
-  uploadDocuments: (
-    kbId: string,
-    files: File[],
-    modelId?: number
-  ) => Promise<void>;
+  fetchDocuments: (kbId: string, forceRefresh?: boolean, kbSource?: string) => Promise<void>;
+  uploadDocuments: (kbId: string, files: File[], modelId?: number) => Promise<void>;
   deleteDocument: (kbId: string, docId: string) => Promise<void>;
 }>({
   state: {
@@ -150,12 +122,12 @@ export const DocumentContext = createContext<{
     isUploading: false,
     loadingKbIds: new Set<string>(),
     isLoadingDocuments: false,
-    error: null,
+    error: null
   },
   dispatch: () => {},
   fetchDocuments: async () => {},
   uploadDocuments: async () => {},
-  deleteDocument: async () => {},
+  deleteDocument: async () => {}
 });
 
 // Custom hook for using the context
@@ -166,9 +138,7 @@ interface DocumentProviderProps {
   children: ReactNode;
 }
 
-export const DocumentProvider: React.FC<DocumentProviderProps> = ({
-  children,
-}) => {
+export const DocumentProvider: React.FC<DocumentProviderProps> = ({ children }) => {
   const { t } = useTranslation();
   const [state, dispatch] = useReducer(documentReducer, {
     documentsMap: {},
@@ -177,169 +147,115 @@ export const DocumentProvider: React.FC<DocumentProviderProps> = ({
     isUploading: false,
     loadingKbIds: new Set<string>(),
     isLoadingDocuments: false,
-    error: null,
+    error: null
   });
 
   // Listen for document update events
   useEffect(() => {
     const handleDocumentsUpdated = (event: Event) => {
       const customEvent = event as CustomEvent;
-      if (
-        customEvent.detail &&
-        customEvent.detail.kbId &&
-        customEvent.detail.documents
-      ) {
+      if (customEvent.detail && customEvent.detail.kbId && customEvent.detail.documents) {
         const { kbId, documents } = customEvent.detail;
-
+        
         // Update document information directly
-        dispatch({
-          type: DOCUMENT_ACTION_TYPES.FETCH_SUCCESS,
-          payload: { kbId, documents },
+        dispatch({ 
+          type: DOCUMENT_ACTION_TYPES.FETCH_SUCCESS, 
+          payload: { kbId, documents } 
         });
       }
     };
-
+    
     // Add event listener
-    window.addEventListener(
-      "documentsUpdated",
-      handleDocumentsUpdated as EventListener
-    );
-
+    window.addEventListener('documentsUpdated', handleDocumentsUpdated as EventListener);
+    
     // Cleanup function
     return () => {
-      window.removeEventListener(
-        "documentsUpdated",
-        handleDocumentsUpdated as EventListener
-      );
+      window.removeEventListener('documentsUpdated', handleDocumentsUpdated as EventListener);
     };
   }, []);
 
   // Fetch documents for a knowledge base
-  const fetchDocuments = useCallback(
-    async (kbId: string, forceRefresh?: boolean, kbSource?: string) => {
-      // Skip if already loading this kb
-      if (state.loadingKbIds.has(kbId)) return;
+  const fetchDocuments = useCallback(async (kbId: string, forceRefresh?: boolean, kbSource?: string) => {
+    // Skip if already loading this kb
+    if (state.loadingKbIds.has(kbId)) return;
 
-      // If forceRefresh is false and we have cached data, return directly
-      if (
-        !forceRefresh &&
-        state.documentsMap[kbId] &&
-        state.documentsMap[kbId].length > 0
-      ) {
-        return; // If we have cached data and don't need force refresh, return directly without server request
-      }
+    // If forceRefresh is false and we have cached data, return directly
+    if (!forceRefresh && state.documentsMap[kbId] && state.documentsMap[kbId].length > 0) {
+      return; // If we have cached data and don't need force refresh, return directly without server request
+    }
 
+    dispatch({ type: DOCUMENT_ACTION_TYPES.SET_LOADING_KB_ID, payload: { kbId, isLoading: true } });
+
+    try {
+      // Use getAllFiles() to get documents including those not yet in ES
+      const documents = await knowledgeBaseService.getAllFiles(kbId, kbSource);
       dispatch({
-        type: DOCUMENT_ACTION_TYPES.SET_LOADING_KB_ID,
-        payload: { kbId, isLoading: true },
+        type: DOCUMENT_ACTION_TYPES.FETCH_SUCCESS,
+        payload: { kbId, documents }
       });
-
-      try {
-        // Use getAllFiles() to get documents including those not yet in ES
-        const documents = await knowledgeBaseService.getAllFiles(
-          kbId,
-          kbSource
-        );
-        dispatch({
-          type: DOCUMENT_ACTION_TYPES.FETCH_SUCCESS,
-          payload: { kbId, documents },
-        });
-      } catch (error) {
-        log.error(t("document.error.fetch"), error);
-        dispatch({
-          type: DOCUMENT_ACTION_TYPES.ERROR,
-          payload: t("document.error.load"),
-        });
-      } finally {
-        dispatch({
-          type: DOCUMENT_ACTION_TYPES.SET_LOADING_KB_ID,
-          payload: { kbId, isLoading: false },
-        });
-      }
-    },
-    [state.loadingKbIds, state.documentsMap, t]
-  );
+    } catch (error) {
+      log.error(t('document.error.fetch'), error);
+      dispatch({ type: DOCUMENT_ACTION_TYPES.ERROR, payload: t('document.error.load') });
+    } finally {
+      dispatch({ type: DOCUMENT_ACTION_TYPES.SET_LOADING_KB_ID, payload: { kbId, isLoading: false } });
+    }
+  }, [state.loadingKbIds, state.documentsMap, t]);
 
   // Upload documents to a knowledge base
-  const uploadDocuments = useCallback(
-    async (kbId: string, files: File[], modelId?: number) => {
-      dispatch({ type: DOCUMENT_ACTION_TYPES.SET_UPLOADING, payload: true });
-
-      try {
-        await knowledgeBaseService.uploadDocuments(
+  const uploadDocuments = useCallback(async (kbId: string, files: File[], modelId?: number) => {
+    dispatch({ type: DOCUMENT_ACTION_TYPES.SET_UPLOADING, payload: true });
+    
+    try {
+      await knowledgeBaseService.uploadDocuments(kbId, files, undefined, modelId);
+      
+      // Set loading state before fetching latest documents
+      dispatch({ type: DOCUMENT_ACTION_TYPES.SET_LOADING_DOCUMENTS, payload: true });
+      
+      // Get latest status immediately after upload
+      const latestDocuments = await knowledgeBaseService.getAllFiles(kbId);
+      // Update document status
+      dispatch({ 
+        type: DOCUMENT_ACTION_TYPES.FETCH_SUCCESS, 
+        payload: { kbId, documents: latestDocuments } 
+      });
+      
+      // Trigger document status update event to notify other components
+      window.dispatchEvent(new CustomEvent('documentsUpdated', {
+        detail: { 
           kbId,
-          files,
-          undefined,
-          modelId
-        );
-
-        // Set loading state before fetching latest documents
-        dispatch({
-          type: DOCUMENT_ACTION_TYPES.SET_LOADING_DOCUMENTS,
-          payload: true,
-        });
-
-        // Get latest status immediately after upload
-        const latestDocuments = await knowledgeBaseService.getAllFiles(kbId);
-        // Update document status
-        dispatch({
-          type: DOCUMENT_ACTION_TYPES.FETCH_SUCCESS,
-          payload: { kbId, documents: latestDocuments },
-        });
-
-        // Trigger document status update event to notify other components
-        window.dispatchEvent(
-          new CustomEvent("documentsUpdated", {
-            detail: {
-              kbId,
-              documents: latestDocuments,
-            },
-          })
-        );
-
-        // Clear upload files
-        dispatch({ type: DOCUMENT_ACTION_TYPES.SET_UPLOAD_FILES, payload: [] });
-      } catch (error) {
-        log.error(t("document.error.upload"), error);
-        dispatch({
-          type: DOCUMENT_ACTION_TYPES.ERROR,
-          payload: `${t("document.error.upload")}. ${t("document.error.retry")}`,
-        });
-      } finally {
-        dispatch({ type: DOCUMENT_ACTION_TYPES.SET_UPLOADING, payload: false });
-        dispatch({
-          type: DOCUMENT_ACTION_TYPES.SET_LOADING_DOCUMENTS,
-          payload: false,
-        });
-      }
-    },
-    [t]
-  );
+          documents: latestDocuments 
+        }
+      }));
+      
+      // Clear upload files
+      dispatch({ type: DOCUMENT_ACTION_TYPES.SET_UPLOAD_FILES, payload: [] });
+    } catch (error) {
+      log.error(t('document.error.upload'), error);
+      dispatch({ type: DOCUMENT_ACTION_TYPES.ERROR, payload: `${t('document.error.upload')}. ${t('document.error.retry')}` });
+    } finally {
+      dispatch({ type: DOCUMENT_ACTION_TYPES.SET_UPLOADING, payload: false });
+      dispatch({ type: DOCUMENT_ACTION_TYPES.SET_LOADING_DOCUMENTS, payload: false });
+    }
+  }, [t]);
 
   // Delete a document
-  const deleteDocument = useCallback(
-    async (kbId: string, docId: string) => {
-      try {
-        await knowledgeBaseService.deleteDocument(docId, kbId);
-        dispatch({
-          type: DOCUMENT_ACTION_TYPES.DELETE_DOCUMENT,
-          payload: { kbId, docId },
-        });
-      } catch (error) {
-        log.error(t("document.error.delete"), error);
-        dispatch({
-          type: DOCUMENT_ACTION_TYPES.ERROR,
-          payload: `${t("document.error.delete")}. ${t("document.error.retry")}`,
-        });
-      }
-    },
-    [t]
-  );
+  const deleteDocument = useCallback(async (kbId: string, docId: string) => {
+    try {
+      await knowledgeBaseService.deleteDocument(docId, kbId);
+      dispatch({ 
+        type: DOCUMENT_ACTION_TYPES.DELETE_DOCUMENT, 
+        payload: { kbId, docId } 
+      });
+    } catch (error) {
+      log.error(t('document.error.delete'), error);
+      dispatch({ type: DOCUMENT_ACTION_TYPES.ERROR, payload: `${t('document.error.delete')}. ${t('document.error.retry')}` });
+    }
+  }, [t]);
 
   return (
-    <DocumentContext.Provider
-      value={{
-        state,
+    <DocumentContext.Provider 
+      value={{ 
+        state, 
         dispatch,
         fetchDocuments,
         uploadDocuments,
@@ -349,4 +265,4 @@ export const DocumentProvider: React.FC<DocumentProviderProps> = ({
       {children}
     </DocumentContext.Provider>
   );
-};
+}; 
diff --git a/frontend/app/[locale]/knowledges/contexts/KnowledgeBaseContext.tsx b/frontend/app/[locale]/knowledges/contexts/KnowledgeBaseContext.tsx
index eb3a05fa0..9733d44c4 100644
--- a/frontend/app/[locale]/knowledges/contexts/KnowledgeBaseContext.tsx
+++ b/frontend/app/[locale]/knowledges/contexts/KnowledgeBaseContext.tsx
@@ -118,8 +118,7 @@ export const KnowledgeBaseContext = createContext<{
     ingroup_permission?: string,
     group_ids?: number[],
     embeddingModel?: string,
-    is_multimodal?: boolean,
-    preserve_source_file?: boolean
+    is_multimodal?: boolean
   ) => Promise<KnowledgeBase | null>;
   deleteKnowledgeBase: (id: string) => Promise<boolean>;
   selectKnowledgeBase: (id: string) => void;
@@ -349,8 +348,7 @@ export const KnowledgeBaseProvider: React.FC<KnowledgeBaseProviderProps> = ({
       ingroup_permission?: string,
       group_ids?: number[],
       embeddingModel?: string,
-      is_multimodal?: boolean,
-      preserve_source_file?: boolean
+      is_multimodal?: boolean
     ) => {
       try {
         const selectedEmbeddingModel = embeddingModel?.trim() || "";
@@ -374,7 +372,6 @@ export const KnowledgeBaseProvider: React.FC<KnowledgeBaseProviderProps> = ({
           ingroup_permission,
           group_ids,
           is_multimodal: resolvedIsMultimodal,
-          preserve_source_file,
         });
         return newKB;
       } catch (error) {
diff --git a/frontend/app/[locale]/space/components/AgentCard.tsx b/frontend/app/[locale]/space/components/AgentCard.tsx
index cd4ecb57a..0e005d9be 100644
--- a/frontend/app/[locale]/space/components/AgentCard.tsx
+++ b/frontend/app/[locale]/space/components/AgentCard.tsx
@@ -139,9 +139,9 @@ export default function AgentCard({ agent, onRefresh }: AgentCardProps) {
     }
   };
 
-  // Handle edit - navigate to agents view with agent id
+  // Handle edit - navigate to agents view
   const handleEdit = () => {
-    router.push(`/agents?agent_id=${agent.id}`);
+    router.push("/agents");
   };
 
   const queryClient = useQueryClient();
@@ -166,10 +166,7 @@ export default function AgentCard({ agent, onRefresh }: AgentCardProps) {
     setShowDetail(true);
     setIsLoadingDetails(true);
     try {
-      // Use current_version_no if available (the currently published version)
-      // Falls back to 0 only if not set (for unpublished/draft agents)
-      const versionNo = agent.current_version_no ?? 0;
-      const result = await searchAgentInfo(parseInt(agent.id), undefined, versionNo);
+      const result = await searchAgentInfo(parseInt(agent.id));
       if (result.success) {
         setAgentDetails(result.data);
       } else {
diff --git a/frontend/app/[locale]/tenant-resources/components/AssetOwnerResourcesComp.tsx b/frontend/app/[locale]/tenant-resources/components/AssetOwnerResourcesComp.tsx
index 6cf23c0a9..38fb3ceb1 100644
--- a/frontend/app/[locale]/tenant-resources/components/AssetOwnerResourcesComp.tsx
+++ b/frontend/app/[locale]/tenant-resources/components/AssetOwnerResourcesComp.tsx
@@ -54,7 +54,7 @@ export default function AssetOwnerResourcesComp() {
 
           <Tabs
             defaultActiveKey="users"
-            className="h-full flex flex-col overflow-hidden [&_.ant-tabs-contentHolder]:flex-1 [&_.ant-tabs-contentHolder]:overflow-hidden asset-owner-tabs"
+            className="h-full flex flex-col"
             items={[
               {
                 key: "users",
@@ -108,17 +108,3 @@ export default function AssetOwnerResourcesComp() {
     </div>
   );
 }
-
-<style jsx global>{`
-  .asset-owner-tabs .ant-tabs-content {
-    width: 100%;
-    height: 100%;
-  }
-  .asset-owner-tabs .ant-tabs-tabpane {
-    height: 100%;
-    overflow: hidden;
-  }
-  .asset-owner-tabs .ant-tabs-nav {
-    flex-shrink: 0;
-  }
-`}</style>
diff --git a/frontend/app/[locale]/tenant-resources/components/UserManageComp.tsx b/frontend/app/[locale]/tenant-resources/components/UserManageComp.tsx
index cfff26fe9..f4d20ae0b 100644
--- a/frontend/app/[locale]/tenant-resources/components/UserManageComp.tsx
+++ b/frontend/app/[locale]/tenant-resources/components/UserManageComp.tsx
@@ -18,8 +18,6 @@ import {
   Pagination,
   Alert,
   Space,
-  Divider,
-  Tooltip
 } from "antd";
 import {
   Users,
@@ -64,6 +62,7 @@ import { useDeployment } from "@/components/providers/deploymentProvider";
 import { useAuthorizationContext } from "@/components/providers/AuthorizationProvider";
 import { USER_ROLES } from "@/const/auth";
 import { Can } from "@/components/permission/Can";
+import { Tooltip } from "@/components/ui/tooltip";
 import {
   getPasswordChecks,
   getStrengthLevel,
@@ -1180,182 +1179,167 @@ export default function UserManageComp() {
   };
 
   return (
-    <div className="flex flex-col w-full h-full">
+    <div className="w-full h-full">
       {/* Page header: grouped header without dividing line */}
-      <div className="flex w-full px-6 pt-12">
-        <div className="flex items-center gap-3">
-          <div className="w-12 h-12 rounded-full bg-gradient-to-br from-purple-500 to-indigo-500 flex items-center justify-center shadow-sm">
-            <Building2 className="h-6 w-6 text-white" />
-          </div>
-          <div>
-            <h1 className="text-2xl font-bold text-purple-600 dark:text-purple-500">
-              {t("tenantResources.title") || "Tenant Resource Management"}
-            </h1>
-            <p className="text-slate-600 dark:text-slate-300 mt-1">
-              {t("tenantResources.subtitle") ||
-                "Manage tenants, users, groups and resources"}
-            </p>
+      <div className="w-full px-10 pt-10">
+        <motion.div
+          initial={{ opacity: 0, y: -8 }}
+          animate={{ opacity: 1, y: 0 }}
+          transition={{ duration: 0.35 }}
+        >
+          <div className="flex items-center gap-3">
+            <div className="w-12 h-12 rounded-full bg-gradient-to-br from-purple-500 to-indigo-500 flex items-center justify-center shadow-sm">
+              <Building2 className="h-6 w-6 text-white" />
+            </div>
+            <div>
+              <h1 className="text-2xl font-bold text-purple-600 dark:text-purple-500">
+                {t("tenantResources.title") || "Tenant Resource Management"}
+              </h1>
+              <p className="text-slate-600 dark:text-slate-300 mt-1">
+                {t("tenantResources.subtitle") ||
+                  "Manage tenants, users, groups and resources"}
+              </p>
+            </div>
           </div>
-        </div>
+        </motion.div>
       </div>
-      <div className="flex-1 min-h-0 h-full">
-        <div className="flex h-full">
-          <Can permission="tenant.list:read">
-            <Col className="flex flex-col h-full" style={{ width: 300 }}>
-              <div className="h-full pr-6">
-                <div className="sticky top-6">
-                  <div className="bg-white dark:bg-gray-800 rounded-md shadow-sm p-3">
-                    <TenantList
-                      selected={tenantId}
-                      onSelect={(id) => setTenantId(id)}
-                      tenants={tenantData?.data || []}
-                      total={tenantData?.total}
-                      page={tenantData?.page}
-                      pageSize={tenantData?.page_size}
-                      totalPages={tenantData?.total_pages}
-                      onPageChange={handlePageChange}
-                      onTenantsRefetch={async () => {
-                        setCurrentPage(1);
-                        return refetchTenants();
-                      }}
-                      loading={tenantsLoading}
-                      t={t}
-                      onUserListRefresh={() =>
-                        setUserListRefreshKey((prev) => prev + 1)
-                      }
-                      onInvitationListRefresh={() =>
-                        setInvitationListRefreshKey((prev) => prev + 1)
-                      }
-                      locale={locale}
-                    />
-                  </div>
-                </div>
-              </div>
-            </Col>
-          </Can>
-          <Col className="flex-1 flex flex-col p-6 overflow-hidden">
-            <div className="bg-white dark:bg-gray-800 rounded-md shadow-sm p-4 h-full flex flex-col overflow-hidden">
-              {/* Tenant name header */}
-              <div className="flex">
-                {isEditingTenantName ? (
-                  <Input
-                    ref={tenantNameInputRef}
-                    value={editingTenantName}
-                    onChange={(e) => setEditingTenantName(e.target.value)}
-                    onBlur={saveTenantName}
-                    onKeyDown={handleTenantNameKeyDown}
-                    className="text-lg font-semibold text-gray-900 dark:text-gray-100"
-                    placeholder={t("tenantResources.tenants.name")}
+      <Row className="flex-1 min-h-0 h-full" align="stretch">
+        <Can permission="tenant.list:read">
+          <Col className="flex flex-col h-full" style={{ width: 300 }}>
+            <div className="h-full pr-6">
+              <div className="sticky top-6">
+                <div className="bg-white dark:bg-gray-800 rounded-md shadow-sm p-3">
+                  <TenantList
+                    selected={tenantId}
+                    onSelect={(id) => setTenantId(id)}
+                    tenants={tenantData?.data || []}
+                    total={tenantData?.total}
+                    page={tenantData?.page}
+                    pageSize={tenantData?.page_size}
+                    totalPages={tenantData?.total_pages}
+                    onPageChange={handlePageChange}
+                    onTenantsRefetch={async () => {
+                      setCurrentPage(1);
+                      return refetchTenants();
+                    }}
+                    loading={tenantsLoading}
+                    t={t}
+                    onUserListRefresh={() =>
+                      setUserListRefreshKey((prev) => prev + 1)
+                    }
+                    onInvitationListRefresh={() =>
+                      setInvitationListRefreshKey((prev) => prev + 1)
+                    }
+                    locale={locale}
                   />
-                ) : (
-                  <div
-                    className="flex items-center gap-2 group cursor-pointer"
-                    onClick={startEditingTenantName}
-                  >
-                    <h2 className="text-lg font-semibold text-gray-900 dark:text-gray-100">
-                      {currentTenantName}
-                    </h2>
-                    <Edit2 className="h-4 w-4 text-gray-400 opacity-0 group-hover:opacity-100 transition-opacity" />
-                  </div>
-                )}
-                
-              </div>
-              
-              <div className="flex-1 min-h-0 h-full">
-                <Divider size="small"/>
-                <div className="flex h-full w-full">
-                  {tenantId ? (
-                    <Tabs
-                      defaultActiveKey="users"
-                      className="h-full flex flex-col tenant-resource-tabs w-full overflow-hidden"
-                      items={[
-                        {
-                          key: "users",
-                          label: t("tenantResources.tabs.users") || "Users",
-                          children: (
-                            <UserList
-                              tenantId={tenantId}
-                              refreshKey={userListRefreshKey}
-                            />
-                          ),
-                        },
-                        {
-                          key: "groups",
-                          label: t("tenantResources.tabs.groups") || "Groups",
-                          children: <GroupList tenantId={tenantId} />,
-                        },
-                        {
-                          key: "models",
-                          label: t("tenantResources.tabs.models") || "Models",
-                          children: <ModelList tenantId={tenantId} />,
-                        },
-                        {
-                          key: "knowledge",
-                          label:
-                            t("tenantResources.tabs.knowledge") || "Knowledge Base",
-                          children: <KnowledgeList tenantId={tenantId} />,
-                        },
-                        {
-                          key: "agents",
-                          label: t("tenantResources.tabs.agents") || "Agents",
-                          children: <AgentList tenantId={tenantId} />,
-                        },
-                        {
-                          key: "mcp",
-                          label: t("tenantResources.tabs.mcp") || "MCP",
-                          children: <McpList tenantId={tenantId} />,
-                        },
-                        {
-                          key: "skills",
-                          label: "Skills",
-                          children: <SkillList tenantId={tenantId} />,
-                        },
-                        {
-                          key: "invitations",
-                          label: t("tenantResources.invitation.tab") || "Invitations",
-                          children: (
-                            <InvitationList
-                              tenantId={tenantId}
-                              refreshKey={invitationListRefreshKey}
-                            />
-                          ),
-                        },
-                      ]}
-                    />
-                  ) : (
-                    <div className="flex flex-col items-center justify-center py-12 text-center">
-                      <div className="w-16 h-16 bg-gray-100 dark:bg-gray-700 rounded-full flex items-center justify-center mb-4">
-                        <Users className="h-8 w-8 text-gray-400" />
-                      </div>
-                      <h3 className="text-lg font-medium text-gray-900 dark:text-gray-100">
-                        {t("tenantResources.selectTenantFirst") ||
-                          "Please select a tenant"}
-                      </h3>
-                      <p className="text-gray-500 dark:text-gray-400 max-w-sm">
-                        {t("tenantResources.selectTenantDescription") ||
-                          "Choose a tenant from the list to manage its users, groups, models, and knowledge base."}
-                      </p>
-                    </div>
-                  )}
                 </div>
-
               </div>
             </div>
           </Col>
-        </div>
-      </div>
+        </Can>
+        <Col className="flex-1 flex flex-col p-6 overflow-hidden">
+          <div className="bg-white dark:bg-gray-800 rounded-md shadow-sm p-4 h-full flex flex-col overflow-hidden">
+            {/* Tenant name header */}
+            <div className="mb-4 pb-2 border-b border-gray-200 dark:border-gray-700 flex-shrink-0">
+              {isEditingTenantName ? (
+                <Input
+                  ref={tenantNameInputRef}
+                  value={editingTenantName}
+                  onChange={(e) => setEditingTenantName(e.target.value)}
+                  onBlur={saveTenantName}
+                  onKeyDown={handleTenantNameKeyDown}
+                  className="text-lg font-semibold text-gray-900 dark:text-gray-100"
+                  placeholder={t("tenantResources.tenants.name")}
+                />
+              ) : (
+                <div
+                  className="flex items-center gap-2 group cursor-pointer"
+                  onClick={startEditingTenantName}
+                >
+                  <h2 className="text-lg font-semibold text-gray-900 dark:text-gray-100">
+                    {currentTenantName}
+                  </h2>
+                  <Edit2 className="h-4 w-4 text-gray-400 opacity-0 group-hover:opacity-100 transition-opacity" />
+                </div>
+              )}
+            </div>
+
+            {tenantId ? (
+              <Tabs
+                defaultActiveKey="users"
+                className="h-full flex flex-col"
+                items={[
+                  {
+                    key: "users",
+                    label: t("tenantResources.tabs.users") || "Users",
+                    children: (
+                      <UserList
+                        tenantId={tenantId}
+                        refreshKey={userListRefreshKey}
+                      />
+                    ),
+                  },
+                  {
+                    key: "groups",
+                    label: t("tenantResources.tabs.groups") || "Groups",
+                    children: <GroupList tenantId={tenantId} />,
+                  },
+                  {
+                    key: "models",
+                    label: t("tenantResources.tabs.models") || "Models",
+                    children: <ModelList tenantId={tenantId} />,
+                  },
+                  {
+                    key: "knowledge",
+                    label:
+                      t("tenantResources.tabs.knowledge") || "Knowledge Base",
+                    children: <KnowledgeList tenantId={tenantId} />,
+                  },
+                  {
+                    key: "agents",
+                    label: t("tenantResources.tabs.agents") || "Agents",
+                    children: <AgentList tenantId={tenantId} />,
+                  },
+                  {
+                    key: "mcp",
+                    label: t("tenantResources.tabs.mcp") || "MCP",
+                    children: <McpList tenantId={tenantId} />,
+                  },
+                  {
+                    key: "skills",
+                    label: "Skills",
+                    children: <SkillList tenantId={tenantId} />,
+                  },
+                  {
+                    key: "invitations",
+                    label: t("tenantResources.invitation.tab") || "Invitations",
+                    children: (
+                      <InvitationList
+                        tenantId={tenantId}
+                        refreshKey={invitationListRefreshKey}
+                      />
+                    ),
+                  },
+                ]}
+              />
+            ) : (
+              <div className="flex flex-col items-center justify-center py-12 text-center">
+                <div className="w-16 h-16 bg-gray-100 dark:bg-gray-700 rounded-full flex items-center justify-center mb-4">
+                  <Users className="h-8 w-8 text-gray-400" />
+                </div>
+                <h3 className="text-lg font-medium text-gray-900 dark:text-gray-100">
+                  {t("tenantResources.selectTenantFirst") ||
+                    "Please select a tenant"}
+                </h3>
+                <p className="text-gray-500 dark:text-gray-400 max-w-sm">
+                  {t("tenantResources.selectTenantDescription") ||
+                    "Choose a tenant from the list to manage its users, groups, models, and knowledge base."}
+                </p>
+              </div>
+            )}
+          </div>
+        </Col>
+      </Row>
     </div>
   );
 }
-
-<style jsx global>{`
-  .tenant-resource-tabs .ant-tabs-content {
-    width: 100%;
-    max-width: 100%;
-    overflow: hidden;
-  }
-  .tenant-resource-tabs .ant-tabs-tabpane {
-    max-width: 100%;
-    overflow: hidden;
-  }
-`}</style>
diff --git a/frontend/app/[locale]/tenant-resources/components/resources/AgentList.tsx b/frontend/app/[locale]/tenant-resources/components/resources/AgentList.tsx
index 2e2383ad5..41fbf4c93 100644
--- a/frontend/app/[locale]/tenant-resources/components/resources/AgentList.tsx
+++ b/frontend/app/[locale]/tenant-resources/components/resources/AgentList.tsx
@@ -411,19 +411,20 @@ export default function AgentList({ tenantId }: { tenantId: string | null }) {
   ];
 
   return (
-    <div className="flex flex-col h-full overflow-hidden">
-      <div className="flex-1 overflow-hidden">
-        <Table
-          columns={columns}
-          dataSource={agents as AgentListRow[]}
-          rowKey="id"
-          loading={isLoading}
-          size="small"
-          pagination={{ pageSize: 10 }}
-          locale={{ emptyText: t("space.noAgents") }}
-          scroll={{ y: "calc(100vh - 480px)" }}
-          className="[&_.ant-table]:h-full"
-        />
+    <div className="h-full flex flex-col overflow-hidden">
+      <div className="space-y-6 flex-1 overflow-auto">
+        <div className="min-w-0">
+          <Table
+            columns={columns}
+            dataSource={agents as AgentListRow[]}
+            rowKey="id"
+            loading={isLoading}
+            size="small"
+            pagination={{ pageSize: 10 }}
+            locale={{ emptyText: t("space.noAgents") }}
+            scroll={{ x: true }}
+          />
+        </div>
       </div>
 
       {/* View Modal */}
diff --git a/frontend/app/[locale]/tenant-resources/components/resources/GroupList.tsx b/frontend/app/[locale]/tenant-resources/components/resources/GroupList.tsx
index 32af131db..ec3397219 100644
--- a/frontend/app/[locale]/tenant-resources/components/resources/GroupList.tsx
+++ b/frontend/app/[locale]/tenant-resources/components/resources/GroupList.tsx
@@ -12,9 +12,9 @@ import {
   Popconfirm,
   message,
   Select,
-  Tooltip
 } from "antd";
 import { Edit, Trash2 } from "lucide-react";
+import { Tooltip } from "@/components/ui/tooltip";
 import { ColumnsType } from "antd/es/table";
 import { useGroupList } from "@/hooks/group/useGroupList";
 import { useUserList } from "@/hooks/user/useUserList";
@@ -278,7 +278,7 @@ export default function GroupList({ tenantId }: { tenantId: string | null }) {
   };
 
   return (
-    <div className="h-full w-full flex flex-col overflow-auto">
+    <div className="h-full flex flex-col overflow-hidden">
       <div className="flex items-center justify-between mb-4 flex-shrink-0">
         <div />
         <div>
diff --git a/frontend/app/[locale]/tenant-resources/components/resources/InvitationList.tsx b/frontend/app/[locale]/tenant-resources/components/resources/InvitationList.tsx
index 6365ab68a..688fda8b1 100644
--- a/frontend/app/[locale]/tenant-resources/components/resources/InvitationList.tsx
+++ b/frontend/app/[locale]/tenant-resources/components/resources/InvitationList.tsx
@@ -17,7 +17,6 @@ import {
   Collapse,
   DatePicker,
   Progress,
-  Tooltip 
 } from "antd";
 import { ColumnsType } from "antd/es/table";
 import { useInvitationList } from "@/hooks/invitation/useInvitationList";
@@ -42,6 +41,7 @@ import {
   Copy,
   CircleSlash,
 } from "lucide-react";
+import { Tooltip } from "@/components/ui/tooltip";
 import { formatDate } from "@/lib/date";
 import { useAuthorizationContext } from "@/components/providers/AuthorizationProvider";
 import {
@@ -443,7 +443,7 @@ export default function InvitationList({
   }, [invitations, tenantId]);
 
   return (
-    <div className="flex flex-col h-full overflow-hidden">
+    <div className="h-full flex flex-col overflow-hidden">
       <div className="mb-4 flex justify-between items-center flex-shrink-0">
         <div />
         <div>
@@ -465,8 +465,8 @@ export default function InvitationList({
           loading={isLoading}
           rowKey="invitation_id"
           pagination={{ pageSize: 10 }}
-          scroll={{ y: "calc(100vh - 560px)" }}
-          className="flex-1 [&_.ant-table]:h-full"
+          scroll={{ x: 1000 }}
+          className="flex-1"
         />
       ) : (
         // Multi-tenant view with collapse
diff --git a/frontend/app/[locale]/tenant-resources/components/resources/KnowledgeList.tsx b/frontend/app/[locale]/tenant-resources/components/resources/KnowledgeList.tsx
index 7b1a703b1..18d70ad51 100644
--- a/frontend/app/[locale]/tenant-resources/components/resources/KnowledgeList.tsx
+++ b/frontend/app/[locale]/tenant-resources/components/resources/KnowledgeList.tsx
@@ -2,10 +2,11 @@
 
 import React, { useMemo, useState } from "react";
 import { useTranslation } from "react-i18next";
-import { Table, Popconfirm, message, Button, Modal, Tag, Tooltip } from "antd";
+import { Table, Popconfirm, message, Button, Modal, Tag } from "antd";
 import { ColumnsType } from "antd/es/table";
 import { Edit, Trash2, BookOpen } from "lucide-react";
-import { MarkdownRenderer } from "@/components/common/markdownRenderer";
+import { Tooltip } from "@/components/ui/tooltip";
+import { MarkdownRenderer } from "@/components/ui/markdownRenderer";
 import { useKnowledgeList } from "@/hooks/knowledge/useKnowledgeList";
 import { useGroupList } from "@/hooks/group/useGroupList";
 import knowledgeBaseService from "@/services/knowledgeBaseService";
@@ -254,15 +255,15 @@ export default function KnowledgeList({
   ];
 
   return (
-    <div className="flex flex-col h-full overflow-hidden">
+    <div className="h-full flex flex-col overflow-hidden">
       <Table
         columns={columns}
         dataSource={knowledgeBases}
         loading={isLoading}
         rowKey="id"
         pagination={{ pageSize: 10 }}
-        className="flex-1 [&_.ant-table]:h-full"
-        scroll={{ y: "calc(100vh - 510px)" }}
+        scroll={{ x: 1400 }}
+        className="flex-1"
       />
 
       {/* Edit Knowledge Base Modal */}
diff --git a/frontend/app/[locale]/tenant-resources/components/resources/McpList.tsx b/frontend/app/[locale]/tenant-resources/components/resources/McpList.tsx
index 412ff402f..ba2d20c0d 100644
--- a/frontend/app/[locale]/tenant-resources/components/resources/McpList.tsx
+++ b/frontend/app/[locale]/tenant-resources/components/resources/McpList.tsx
@@ -114,7 +114,6 @@ export default function McpList({ tenantId }: { tenantId: string | null }) {
   const [openApiJson, setOpenApiJson] = useState("");
   const [openApiServiceName, setOpenApiServiceName] = useState("");
   const [openApiServerUrl, setOpenApiServerUrl] = useState("");
-  const [openApiHeadersTemplate, setOpenApiHeadersTemplate] = useState("");
   const [importingOpenApi, setImportingOpenApi] = useState(false);
   const [openapiServices, setOpenapiServices] = useState<any[]>([]);
   const [loadingOpenapiServices, setLoadingOpenapiServices] = useState(false);
@@ -446,7 +445,6 @@ export default function McpList({ tenantId }: { tenantId: string | null }) {
           service_name: openApiServiceName.trim(),
           server_url: openApiServerUrl.trim(),
           openapi_json: parsedJson,
-          headers_template: openApiHeadersTemplate.trim() ? JSON.parse(openApiHeadersTemplate.trim()) : null,
         }),
       });
 
@@ -455,7 +453,6 @@ export default function McpList({ tenantId }: { tenantId: string | null }) {
         setOpenApiJson("");
         setOpenApiServiceName("");
         setOpenApiServerUrl("");
-        setOpenApiHeadersTemplate("");
         await loadOpenapiServices();
       } else {
         const errorData = await response.json();
@@ -760,7 +757,7 @@ export default function McpList({ tenantId }: { tenantId: string | null }) {
   ];
 
   return (
-    <div className="flex flex-col h-full overflow-hidden">
+    <div className="h-full flex flex-col overflow-hidden">
       <div className="flex justify-between items-center mb-4 flex-shrink-0">
         <div />
         <Button type="primary" icon={<Plus size={16} />} onClick={() => setAddModalVisible(true)}>
@@ -768,45 +765,47 @@ export default function McpList({ tenantId }: { tenantId: string | null }) {
         </Button>
       </div>
 
-      <div className="flex-1 overflow-hidden">
-        <Title level={5} style={{ marginBottom: 12 }}>{t("mcpConfig.serverList.title")}</Title>
-        <Table
-          columns={serverColumns}
-          dataSource={serverList}
-          rowKey={(record) => `${record.service_name}-${record.mcp_url}`}
-          loading={loading}
-          size="small"
-          pagination={{ pageSize: 7 }}
-          locale={{ emptyText: t("mcpConfig.serverList.empty") }}
-          scroll={{ y: "calc(100vh - 560px)" }}
-          className="flex-1 [&_.ant-table]:h-full"
-        />
+      <div className="space-y-6 flex-1 overflow-auto">
+        <div className="min-w-0">
+          <Title level={5} style={{ marginBottom: 12 }}>{t("mcpConfig.serverList.title")}</Title>
+          <Table
+            columns={serverColumns}
+            dataSource={serverList}
+            rowKey={(record) => `${record.service_name}-${record.mcp_url}`}
+            loading={loading}
+            size="small"
+            pagination={{ pageSize: 7 }}
+            locale={{ emptyText: t("mcpConfig.serverList.empty") }}
+          />
+        </div>
 
-        <Title level={5} style={{ marginTop: 24, marginBottom: 12 }}>{t("mcpConfig.containerList.title")}</Title>
-        <Table
-          columns={containerColumns}
-          dataSource={containerList}
-          rowKey="container_id"
-          loading={loading}
-          size="small"
-          pagination={{ pageSize: 3 }}
-          locale={{ emptyText: t("mcpConfig.containerList.empty") }}
-          scroll={{ y: 200 }}
-          className="[&_.ant-table]:h-full"
-        />
+        <div className="min-w-0">
+          <Title level={5} style={{ marginBottom: 12 }}>{t("mcpConfig.containerList.title")}</Title>
+          <Table
+            columns={containerColumns}
+            dataSource={containerList}
+            rowKey="container_id"
+            loading={loading}
+            size="small"
+            pagination={{ pageSize: 3 }}
+            locale={{ emptyText: t("mcpConfig.containerList.empty") }}
+            scroll={{ x: true }}
+          />
+        </div>
 
-        <Title level={5} style={{ marginTop: 24, marginBottom: 12 }}>{t("mcpConfig.openapiService.list.title")}</Title>
-        <Table
-          columns={openapiServicesColumns}
-          dataSource={openapiServices}
-          rowKey="id"
-          loading={loadingOpenapiServices}
-          size="small"
-          pagination={{ pageSize: 5 }}
-          locale={{ emptyText: t("mcpConfig.openapiService.list.empty") }}
-          scroll={{ y: 250 }}
-          className="[&_.ant-table]:h-full"
-        />
+        <div className="min-w-0">
+          <Title level={5} style={{ marginBottom: 12 }}>{t("mcpConfig.openapiService.list.title")}</Title>
+          <Table
+            columns={openapiServicesColumns}
+            dataSource={openapiServices}
+            rowKey="id"
+            loading={loadingOpenapiServices}
+            size="small"
+            pagination={{ pageSize: 5 }}
+            locale={{ emptyText: t("mcpConfig.openapiService.list.empty") }}
+            scroll={{ x: true }}
+          />
+        </div>
       </div>
 
       {/* Add Modal */}
@@ -1036,22 +1035,13 @@ export default function McpList({ tenantId }: { tenantId: string | null }) {
                         style={{ flex: 3 }}
                       />
                     </div>
-                    <div className="space-y-2">
-                      <Input.TextArea
-                        placeholder={t("mcpConfig.addServer.customHeadersPlaceholder")}
-                        value={openApiHeadersTemplate}
-                        onChange={(e) => setOpenApiHeadersTemplate(e.target.value)}
-                        rows={2}
-                        disabled={actionsLocked || importingOpenApi}
-                      />
-                      <Input.TextArea
-                        placeholder={t("mcpConfig.openApiToMcp.jsonPlaceholder")}
-                        value={openApiJson}
-                        onChange={(e) => setOpenApiJson(e.target.value)}
-                        rows={6}
-                        disabled={actionsLocked || importingOpenApi}
-                      />
-                    </div>
+                    <Input.TextArea
+                      placeholder={t("mcpConfig.openApiToMcp.jsonPlaceholder")}
+                      value={openApiJson}
+                      onChange={(e) => setOpenApiJson(e.target.value)}
+                      rows={6}
+                      disabled={actionsLocked || importingOpenApi}
+                    />
                     <div className="flex justify-end">
                       <Button
                         type="primary"
diff --git a/frontend/app/[locale]/tenant-resources/components/resources/ModelList.tsx b/frontend/app/[locale]/tenant-resources/components/resources/ModelList.tsx
index 6715852f7..560df8cb8 100644
--- a/frontend/app/[locale]/tenant-resources/components/resources/ModelList.tsx
+++ b/frontend/app/[locale]/tenant-resources/components/resources/ModelList.tsx
@@ -2,8 +2,9 @@
 
 import React, { useState, useMemo } from "react";
 import { useTranslation } from "react-i18next";
-import { Table, Button, Popconfirm, message, Tag, Segmented, Tooltip } from "antd";
+import { Table, Button, Popconfirm, message, Tag, Segmented } from "antd";
 import { Edit, Trash2, RefreshCw } from "lucide-react";
+import { Tooltip } from "@/components/ui/tooltip";
 import { ColumnsType } from "antd/es/table";
 import type { TablePaginationConfig } from "antd";
 import { FilterValue, SorterResult } from "antd/es/table/interface";
@@ -360,7 +361,7 @@ export default function ModelList({ tenantId }: { tenantId: string | null }) {
   ];
 
   return (
-    <div className="flex flex-col h-full overflow-hidden">
+    <div className="h-full flex flex-col overflow-auto">
       <div className="flex items-center justify-between mb-4 flex-shrink-0">
         <div className="flex items-center gap-3">
           <Segmented
@@ -397,8 +398,8 @@ export default function ModelList({ tenantId }: { tenantId: string | null }) {
           total: total,
         }}
         onChange={handlePageChange}
-        scroll={{ y: "calc(100vh - 580px)" }}
-        className="flex-1 [&_.ant-table]:h-full"
+        scroll={{ x: true }}
+        className="flex-1"
       />
 
       <ModelAddDialog
diff --git a/frontend/app/[locale]/tenant-resources/components/resources/SkillList.tsx b/frontend/app/[locale]/tenant-resources/components/resources/SkillList.tsx
index c25f89b57..04d45720d 100644
--- a/frontend/app/[locale]/tenant-resources/components/resources/SkillList.tsx
+++ b/frontend/app/[locale]/tenant-resources/components/resources/SkillList.tsx
@@ -13,10 +13,10 @@ import {
   Form,
   Switch,
   InputNumber,
-  Tooltip
 } from "antd";
 import { ColumnsType } from "antd/es/table";
 import { Download } from "lucide-react";
+import { Tooltip } from "@/components/ui/tooltip";
 
 import {
   fetchSkillsList,
@@ -547,6 +547,7 @@ export default function SkillList({ tenantId }: { tenantId: string | null }) {
   const { t } = useTranslation("common");
   const { message } = App.useApp();
   const [form] = Form.useForm();
+
   const [paramsModalOpen, setParamsModalOpen] = useState(false);
   const [editingSkill, setEditingSkill] = useState<SkillListItem | null>(null);
   const [savingParams, setSavingParams] = useState(false);
@@ -729,8 +730,8 @@ export default function SkillList({ tenantId }: { tenantId: string | null }) {
     : "closed";
 
   return (
-    <div className="flex flex-col h-full overflow-hidden">
-      <div className="flex justify-end mb-2 flex-shrink-0">
+    <div className="h-full flex flex-col overflow-hidden">
+      <div className="flex justify-end mb-2">
         <Button
           type="primary"
           icon={<Download className="h-4 w-4" />}
@@ -747,8 +748,7 @@ export default function SkillList({ tenantId }: { tenantId: string | null }) {
         size="small"
         pagination={{ pageSize: 10 }}
         locale={{ emptyText: t("tenantResources.skills.empty") }}
-        scroll={{ y: "calc(100vh - 500px)" }}
-        className="flex-1 [&_.ant-table]:h-full"
+        scroll={{ x: true }}
       />
 
       <Modal
diff --git a/frontend/app/[locale]/tenant-resources/components/resources/UserList.tsx b/frontend/app/[locale]/tenant-resources/components/resources/UserList.tsx
index 13d54ee5c..64f4e6760 100644
--- a/frontend/app/[locale]/tenant-resources/components/resources/UserList.tsx
+++ b/frontend/app/[locale]/tenant-resources/components/resources/UserList.tsx
@@ -12,9 +12,9 @@ import {
   Popconfirm,
   message,
   Tag,
-  Tooltip 
 } from "antd";
 import { Edit, Trash2 } from "lucide-react";
+import { Tooltip } from "@/components/ui/tooltip";
 import { ColumnsType } from "antd/es/table";
 import { useUserList } from "@/hooks/user/useUserList";
 import { useGroupList } from "@/hooks/group/useGroupList";
@@ -141,7 +141,6 @@ export default function UserList({ tenantId, refreshKey }: { tenantId: string |
         title: t("common.email"),
         dataIndex: "username",
         key: "username",
-        width: "50%"
       },
       {
         title: t("common.type"),
@@ -165,7 +164,6 @@ export default function UserList({ tenantId, refreshKey }: { tenantId: string |
               {roleLabels[role] || role}
             </Tag>;
         },
-        width: "20%"
       },
       {
         title: t("common.actions"),
@@ -199,7 +197,6 @@ export default function UserList({ tenantId, refreshKey }: { tenantId: string |
             </Popconfirm>
           </div>
         ),
-        width: "20%"
       },
     ],
     []
@@ -210,7 +207,7 @@ export default function UserList({ tenantId, refreshKey }: { tenantId: string |
   };
 
   return (
-    <div className="flex flex-col h-full overflow-hidden">
+    <div className="h-full flex flex-col overflow-hidden">
       <Table
         dataSource={users}
         columns={columns}
@@ -222,9 +219,10 @@ export default function UserList({ tenantId, refreshKey }: { tenantId: string |
           total: total,
           onChange: handlePageChange,
         }}
-        className="flex-1 [&_.ant-table]:h-full"
-        scroll={{ y: "calc(100vh - 480px)" }}
+        scroll={{ x: true }}
+        className="flex-1"
       />
+
       <Modal
         title={t("tenantResources.users.editUser")}
         open={modalVisible}
diff --git a/frontend/app/[locale]/users/components/UserProfileComp.tsx b/frontend/app/[locale]/users/components/UserProfileComp.tsx
index 41cfeb0a0..67b34d250 100644
--- a/frontend/app/[locale]/users/components/UserProfileComp.tsx
+++ b/frontend/app/[locale]/users/components/UserProfileComp.tsx
@@ -39,7 +39,6 @@ import { OAuthAccountsSection } from "@/components/settings/OAuthAccountsSection
 import log from "@/lib/logger";
 import { authService } from "@/services/authService";
 import { getPasswordChecks, getStrengthLevel } from "@/lib/utils";
-import { useConfirmModal } from "@/hooks/useConfirmModal";
 import {
   getUserTokens,
   deleteUserToken,
@@ -62,7 +61,6 @@ export default function UserProfileComp() {
   const { message: antdMessage } = App.useApp();
   const { logout, revoke, isLoading } = useAuthenticationContext();
   const { user, groupIds } = useAuthorizationContext();
-  const { confirm } = useConfirmModal();
 
   // Fetch groups for group name mapping
   const { data: groupData } = useGroupList(user?.tenantId || null);
@@ -109,7 +107,6 @@ export default function UserProfileComp() {
   // Check if user is admin or super admin (cannot delete account)
   const isAdminOrSuperAdmin =
     user?.role === USER_ROLES.ADMIN || user?.role === USER_ROLES.SU;
-  const isCasUser = user?.authProvider === "cas";
   const getRoleDisplayName = (role: string) => {
     switch (role) {
       case USER_ROLES.SPEED:
@@ -128,20 +125,17 @@ export default function UserProfileComp() {
   };
 
   // Handle logout
-  const handleLogout = () => {
-    confirm({
-      title: t("auth.confirmLogout"),
-      content: t("auth.confirmLogoutPrompt"),
-      onOk: () => {
-        logout();
-      },
-    });
+  const handleLogout = async () => {
+    try {
+      await logout();
+      window.location.href = "/";
+    } catch (error) {
+      antdMessage.error(t("auth.logoutFailed"));
+    }
   };
 
   // Handle delete account
   const handleDeleteAccount = async () => {
-    if (isAdminOrSuperAdmin || isCasUser) return;
-
     try {
       await revoke();
       antdMessage.success(t("auth.revokeSuccess"));
@@ -475,16 +469,8 @@ export default function UserProfileComp() {
                 </div>
 
                 <button
-                  disabled={isCasUser}
-                  onClick={() => {
-                    if (isCasUser) return;
-                    setIsDeleteModalOpen(true);
-                  }}
-                  className={`w-full px-6 py-3 flex items-center justify-between transition-colors text-left ${
-                    isCasUser
-                      ? "cursor-not-allowed opacity-50"
-                      : "hover:bg-red-50 dark:hover:bg-red-900/20"
-                  }`}
+                  onClick={() => setIsDeleteModalOpen(true)}
+                  className="w-full px-6 py-3 flex items-center justify-between hover:bg-red-50 dark:hover:bg-red-900/20 transition-colors text-left"
                 >
                   <div className="flex items-center gap-3">
                     <div className="w-8 h-8 rounded-lg bg-red-50 dark:bg-red-900/20 flex items-center justify-center">
@@ -709,7 +695,7 @@ export default function UserProfileComp() {
         onOk={handleDeleteAccount}
         onCancel={() => setIsDeleteModalOpen(false)}
         loading={isLoading}
-        disabled={isAdminOrSuperAdmin || isCasUser}
+        disabled={isAdminOrSuperAdmin}
       />
 
       {/* OAuth Linked Accounts */}
diff --git a/frontend/components/agent/AgentImportWizard.tsx b/frontend/components/agent/AgentImportWizard.tsx
index 504237c1c..5ccf79033 100644
--- a/frontend/components/agent/AgentImportWizard.tsx
+++ b/frontend/components/agent/AgentImportWizard.tsx
@@ -393,6 +393,7 @@ export default function AgentImportWizard({
         items: agentsWithConflicts.map(([agentKey, conflict]) => {
           const agentInfo = initialData.agent_info[agentKey] as any;
           return {
+            agent_id: agentInfo?.agent_id,
             name: conflict.renamedName || agentInfo?.name || "",
             display_name: conflict.renamedDisplayName || agentInfo?.display_name || "",
             task_description: agentInfo?.business_description || agentInfo?.description || "",
diff --git a/frontend/components/auth/avatarDropdown.tsx b/frontend/components/auth/avatarDropdown.tsx
index f52f59119..e77f5f1e2 100644
--- a/frontend/components/auth/avatarDropdown.tsx
+++ b/frontend/components/auth/avatarDropdown.tsx
@@ -3,14 +3,7 @@
 import React, { useState } from "react";
 import { useTranslation } from "react-i18next";
 import { Dropdown, Avatar, Spin, Button, Tag, ConfigProvider } from "antd";
-import {
-  UserRound,
-  LogOut,
-  LogIn,
-  UserRoundPlus,
-  UserCircle,
-  Power,
-} from "lucide-react";
+import { UserRound, LogOut, LogIn, UserRoundPlus, UserCircle, Power } from "lucide-react";
 import type { ItemType } from "antd/es/menu/interface";
 import Link from "next/link";
 
@@ -113,8 +106,6 @@ export function AvatarDropdown() {
     );
   }
 
-  const isCasUser = user.authProvider === "cas";
-
   // User has logged in, show user menu
   const menuItems: ItemType[] = [
     {
@@ -168,12 +159,8 @@ export function AvatarDropdown() {
       icon: <Power size={16} />,
       label: t("auth.revoke"),
       // danger: true,
-      disabled: isCasUser,
-      className: isCasUser
-        ? "cursor-not-allowed opacity-50"
-        : "hover:!bg-red-100 focus:!bg-red-400 focus:!text-white",
+      className: "hover:!bg-red-100 focus:!bg-red-400 focus:!text-white",
       onClick: () => {
-        if (isCasUser) return;
         setIsDeleteModalOpen(true);
       },
     },
@@ -208,11 +195,7 @@ export function AvatarDropdown() {
         }}
         onCancel={() => setIsDeleteModalOpen(false)}
         loading={isLoading}
-        disabled={
-          isCasUser ||
-          user.role === USER_ROLES.ADMIN ||
-          user.role === USER_ROLES.SU
-        }
+        disabled={user.role === USER_ROLES.ADMIN || user.role === USER_ROLES.SU}
       />
     </ConfigProvider>
   );
diff --git a/frontend/components/auth/loginModal.tsx b/frontend/components/auth/loginModal.tsx
index 7425c3ff8..3a4b94a90 100644
--- a/frontend/components/auth/loginModal.tsx
+++ b/frontend/components/auth/loginModal.tsx
@@ -3,14 +3,13 @@
 import { useCallback, useState, useEffect } from "react";
 import { useTranslation } from "react-i18next";
 import { Modal, Form, Input, Button, Typography, Space, Divider, Alert } from "antd";
-import { UserRound, LockKeyhole, Github, Link2, KeyRound } from "lucide-react";
+import { UserRound, LockKeyhole, Github, Link2 } from "lucide-react";
 import { usePathname, useRouter, useSearchParams } from "next/navigation";
 
 import { useAuthenticationContext } from "@/components/providers/AuthenticationProvider";
 import { useDeployment } from "@/components/providers/deploymentProvider";
 import { getEffectiveRoutePath } from "@/lib/auth";
 import { oauthService } from "@/services/oauthService";
-import { casService, CasConfig } from "@/services/casService";
 import log from "@/lib/logger";
 
 const { Text } = Typography;
@@ -49,30 +48,6 @@ function OAuthLoginButtons() {
   );
 }
 
-function CasLoginButton() {
-  const { t } = useTranslation("common");
-  const [config, setConfig] = useState<CasConfig | null>(null);
-
-  useEffect(() => {
-    casService.getConfig().then(setConfig);
-  }, []);
-
-  if (!config?.enabled || config.login_mode !== "button") return null;
-
-  return (
-    <div className="mt-2 mb-2">
-      <Button
-        block
-        size="large"
-        icon={<KeyRound size={18} />}
-        onClick={() => casService.startLogin()}
-      >
-        {t("auth.casLogin", { provider: config.display_name }) || `${config.display_name} Login`}
-      </Button>
-    </div>
-  );
-}
-
 /**
  * LoginModal Component
  * Handles user authentication through a modal interface
@@ -120,15 +95,6 @@ export function LoginModal() {
     }
   }, [searchParams, router, getOAuthLoginErrorMessage]);
 
-  useEffect(() => {
-    if (!isLoginModalOpen || isAuthenticated || isSpeedMode) return;
-    casService.getConfig().then((config) => {
-      if (config.enabled && config.login_mode === "force") {
-        casService.startLogin();
-      }
-    });
-  }, [isLoginModalOpen, isAuthenticated, isSpeedMode]);
-
   const resetForm = () => {
     setEmailError("");
     setPasswordError(false);
@@ -342,8 +308,6 @@ export function LoginModal() {
             </Button>
           </Form.Item>
 
-          <CasLoginButton />
-
           {/* OAuth login section */}
           <OAuthLoginButtons />
 
diff --git a/frontend/components/navigation/SideNavigation.tsx b/frontend/components/navigation/SideNavigation.tsx
index dbef5ace0..77b74fee1 100644
--- a/frontend/components/navigation/SideNavigation.tsx
+++ b/frontend/components/navigation/SideNavigation.tsx
@@ -27,8 +27,6 @@ import { SIDER_CONFIG } from "@/const/layoutConstants";
 import { AUTH_EVENTS } from "@/const/auth";
 import { getEffectiveRoutePath } from "@/lib/auth";
 import { authEvents } from "@/lib/authEvents";
-import { authFlowState } from "@/lib/authFlow";
-import { casService } from "@/services/casService";
 
 interface SideNavigationProps {
   collapsed?: boolean;
@@ -53,50 +51,15 @@ const ROUTE_CONFIG: RouteConfig[] = [
   { path: "/chat", Icon: Bot, labelKey: "sidebar.startChat", order: 1 },
   { path: "/setup", Icon: Zap, labelKey: "sidebar.quickConfig", order: 2 },
   { path: "/space", Icon: Globe, labelKey: "sidebar.agentSpace", order: 3 },
-  {
-    path: "/market",
-    Icon: ShoppingBag,
-    labelKey: "sidebar.agentMarket",
-    order: 4,
-  },
+  { path: "/market", Icon: ShoppingBag, labelKey: "sidebar.agentMarket", order: 4 },
   { path: "/agents", Icon: Code, labelKey: "sidebar.agentDev", order: 5 },
-  {
-    path: "/knowledges",
-    Icon: BookOpen,
-    labelKey: "sidebar.knowledgeBase",
-    order: 6,
-  },
-  {
-    path: "/mcp-tools",
-    Icon: Puzzle,
-    labelKey: "sidebar.mcpToolsManagement",
-    order: 7,
-  },
-  {
-    path: "/monitoring",
-    Icon: Activity,
-    labelKey: "sidebar.monitoringManagement",
-    order: 8,
-  },
-  {
-    path: "/models",
-    Icon: Settings,
-    labelKey: "sidebar.modelManagement",
-    order: 9,
-  },
-  {
-    path: "/memory",
-    Icon: Database,
-    labelKey: "sidebar.memoryManagement",
-    order: 10,
-  },
+  { path: "/knowledges", Icon: BookOpen, labelKey: "sidebar.knowledgeBase", order: 6 },
+  { path: "/mcp-tools", Icon: Puzzle, labelKey: "sidebar.mcpToolsManagement", order: 7 },
+  { path: "/monitoring", Icon: Activity, labelKey: "sidebar.monitoringManagement", order: 8 },
+  { path: "/models", Icon: Settings, labelKey: "sidebar.modelManagement", order: 9 },
+  { path: "/memory", Icon: Database, labelKey: "sidebar.memoryManagement", order: 10 },
   { path: "/users", Icon: User, labelKey: "sidebar.userManagement", order: 11 },
-  {
-    path: "/tenant-resources",
-    Icon: Building2,
-    labelKey: "sidebar.tenantResources",
-    order: 12,
-  },
+  { path: "/tenant-resources", Icon: Building2, labelKey: "sidebar.tenantResources", order: 12 },
   { path: "/asset-owner-resources", Icon: Building2, labelKey: "sidebar.assetOwnerResources", order: 13 },
 ];
 
@@ -109,7 +72,9 @@ const ROUTE_PATHS = ROUTE_CONFIG.map((route) => route.path);
  * Side navigation component with collapsible menu
  * Displays main navigation items for the application based on user's accessible routes
  */
-export function SideNavigation({ collapsed }: SideNavigationProps) {
+export function SideNavigation({
+  collapsed,
+}: SideNavigationProps) {
   const { t } = useTranslation("common");
   const { accessibleRoutes } = useAuthorizationContext();
   const { isAuthenticated, openAuthPromptModal } = useAuthenticationContext();
@@ -118,9 +83,7 @@ export function SideNavigation({ collapsed }: SideNavigationProps) {
   const pathname = usePathname();
 
   const [selectedKey, setSelectedKey] = useState("/");
-  const [pendingNavigationPath, setPendingNavigationPath] = useState<
-    string | null
-  >(null);
+  const [pendingNavigationPath, setPendingNavigationPath] = useState<string | null>(null);
   const isCollapsed = typeof collapsed === "boolean" ? collapsed : false;
 
   // Update selected key when pathname changes
@@ -142,10 +105,7 @@ export function SideNavigation({ collapsed }: SideNavigationProps) {
       }
     };
 
-    const cleanup = authEvents.on(
-      AUTH_EVENTS.LOGIN_SUCCESS,
-      handleLoginSuccess
-    );
+    const cleanup = authEvents.on(AUTH_EVENTS.LOGIN_SUCCESS, handleLoginSuccess);
     return cleanup;
   }, [pendingNavigationPath, isAuthenticated, router]);
 
@@ -188,17 +148,7 @@ export function SideNavigation({ collapsed }: SideNavigationProps) {
         // Pre-check authentication - show auth prompt if user is not authenticated
         if (!isAuthenticated && !isSpeedMode && route.path !== "/") {
           setPendingNavigationPath(route.path);
-          casService.getConfig().then((config) => {
-            if (
-              !authFlowState.isExplicitLogoutInProgress() &&
-              config.enabled &&
-              config.login_mode === "force"
-            ) {
-              casService.startLogin(route.path);
-              return;
-            }
-            openAuthPromptModal();
-          });
+          openAuthPromptModal();
           return; // Prevent navigation
         }
 
diff --git a/frontend/components/skill/InstallOfficialSkillsModal.tsx b/frontend/components/skill/InstallOfficialSkillsModal.tsx
index b8e8d4ce6..e3cc83d1f 100644
--- a/frontend/components/skill/InstallOfficialSkillsModal.tsx
+++ b/frontend/components/skill/InstallOfficialSkillsModal.tsx
@@ -1,12 +1,13 @@
 "use client";
 
 import React, { useState, useEffect } from "react";
-import { Modal, Spin, message, Tooltip } from "antd";
+import { Modal, Spin, message } from "antd";
 import { useTranslation } from "react-i18next";
 import { CircleCheckBig, CircleOff, CircleDot, LoaderCircle } from "lucide-react";
 
 import { fetchOfficialSkillsWithStatus, installOfficialSkills } from "@/services/skillService";
 import { InstallableSkill } from "@/types/agentConfig";
+import { Tooltip } from "@/components/ui/tooltip";
 
 interface InstallOfficialSkillsModalProps {
   open: boolean;
diff --git a/frontend/components/common/Diagram.tsx b/frontend/components/ui/Diagram.tsx
similarity index 100%
rename from frontend/components/common/Diagram.tsx
rename to frontend/components/ui/Diagram.tsx
diff --git a/frontend/components/common/PdfViewer.tsx b/frontend/components/ui/PdfViewer.tsx
similarity index 100%
rename from frontend/components/common/PdfViewer.tsx
rename to frontend/components/ui/PdfViewer.tsx
diff --git a/frontend/components/common/copyButton.tsx b/frontend/components/ui/copyButton.tsx
similarity index 100%
rename from frontend/components/common/copyButton.tsx
rename to frontend/components/ui/copyButton.tsx
diff --git a/frontend/components/common/filePreviewDrawer.tsx b/frontend/components/ui/filePreviewDrawer.tsx
similarity index 50%
rename from frontend/components/common/filePreviewDrawer.tsx
rename to frontend/components/ui/filePreviewDrawer.tsx
index 409352e15..7f7f08c4a 100644
--- a/frontend/components/common/filePreviewDrawer.tsx
+++ b/frontend/components/ui/filePreviewDrawer.tsx
@@ -1,28 +1,12 @@
 "use client";
 
-import {
-  useState,
-  useEffect,
-  useCallback,
-  useMemo,
-  useRef,
-  type PointerEvent as ReactPointerEvent,
-  type WheelEvent as ReactWheelEvent,
-} from "react";
-import { useTranslation } from "react-i18next";
-import dynamic from "next/dynamic";
-import { Drawer, Modal, Spin, Button, Table } from "antd";
-import {
-  Download,
-  Maximize2,
-  Minimize2,
-  Minus,
-  Plus,
-  RotateCw,
-  X,
-} from "lucide-react";
-import { FilePreviewProps } from "@/types/chat";
-import { DetectedFileType, ImageBaseMode } from "@/types/file";
+import { useState, useEffect, useCallback, useMemo, useRef, type PointerEvent as ReactPointerEvent, type WheelEvent as ReactWheelEvent } from 'react';
+import { useTranslation } from 'react-i18next';
+import dynamic from 'next/dynamic';
+import { Drawer, Spin, Button, Table } from 'antd';
+import { Download, Maximize2, Minimize2, Minus, Plus, RotateCw, X } from 'lucide-react';
+import { FilePreviewProps } from '@/types/chat';
+import { DetectedFileType, ImageBaseMode } from '@/types/file';
 import {
   CHUNK_SIZE,
   TEXT_RENDER_BLOCK_SIZE,
@@ -42,63 +26,40 @@ import {
   clamp,
   ignoreAbortError,
   getPageWrapperStyle,
-  fetchPreviewBlob,
-  PreviewAccessError,
-  getPreviewAccessReasonFromStatus,
-  type PreviewAccessReason,
-} from "@/lib/filePreviewUtils";
-import { storageService } from "@/services/storageService";
-import {
-  MarkdownRenderer,
-  extractMarkdownHeadings,
-  type MarkdownHeading,
-} from "@/components/common/markdownRenderer";
-import { formatFileSize } from "@/lib/utils";
-import log from "@/lib/logger";
-
-const PdfViewer = dynamic(
-  () =>
-    import("@/components/common/PdfViewer").then((mod) => ({
-      default: mod.PdfViewer,
-    })),
-  {
-    ssr: false,
-    loading: () => (
-      <div className="flex items-center justify-center h-full">
-        <Spin size="large" />
-      </div>
-    ),
-  }
-);
+} from '@/lib/filePreviewUtils';
+import { storageService } from '@/services/storageService';
+import { MarkdownRenderer, extractMarkdownHeadings, type MarkdownHeading } from '@/components/ui/markdownRenderer';
+import { formatFileSize } from '@/lib/utils';
+import log from '@/lib/logger';
+
+const PdfViewer = dynamic(() => import('@/components/ui/PdfViewer').then(mod => ({ default: mod.PdfViewer })), {
+  ssr: false,
+  loading: () => (
+    <div className="flex items-center justify-center h-full">
+      <Spin size="large" />
+    </div>
+  ),
+});
 
 export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
-  const { open, onClose, previewContext } = props;
-  const { t } = useTranslation("common");
-  const isLocalSource = props.source === "local";
+  const { open, onClose } = props;
+  const { t } = useTranslation('common');
+  const isLocalSource = props.source === 'local';
   const localFile = isLocalSource ? props.file : null;
-  const objectName = !isLocalSource ? props.objectName : "";
-  const fileName =
-    isLocalSource && localFile
-      ? localFile.name
-      : "fileName" in props
-        ? props.fileName
-        : "";
-  const providedFileType =
-    isLocalSource && localFile
-      ? localFile.type
-      : "fileType" in props
-        ? props.fileType
-        : undefined;
-  const fileSize =
-    isLocalSource && localFile
-      ? localFile.size
-      : "fileSize" in props
-        ? props.fileSize
-        : undefined;
+  const objectName = !isLocalSource ? props.objectName : '';
+  const fileName = isLocalSource && localFile
+    ? localFile.name
+    : ('fileName' in props ? props.fileName : '');
+  const providedFileType = isLocalSource && localFile
+    ? localFile.type
+    : ('fileType' in props ? props.fileType : undefined);
+  const fileSize = isLocalSource && localFile
+    ? localFile.size
+    : ('fileSize' in props ? props.fileSize : undefined);
   const [loading, setLoading] = useState(true);
   const [error, setError] = useState<string | null>(null);
-  const [textContent, setTextContent] = useState<string>("");
-  const [previewUrl, setPreviewUrl] = useState<string>("");
+  const [textContent, setTextContent] = useState<string>('');
+  const [previewUrl, setPreviewUrl] = useState<string>('');
   const [loadingMore, setLoadingMore] = useState(false);
   const [showMarkdownToc, setShowMarkdownToc] = useState(false);
 
@@ -112,15 +73,9 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
   const [imageScale, setImageScale] = useState(1);
   const [imageRotation, setImageRotation] = useState(0);
   const [imageLoadError, setImageLoadError] = useState(false);
-  const [imageNaturalSize, setImageNaturalSize] = useState({
-    width: 0,
-    height: 0,
-  });
-  const [imageViewportSize, setImageViewportSize] = useState({
-    width: 0,
-    height: 0,
-  });
-  const [imageBaseMode, setImageBaseMode] = useState<ImageBaseMode>("fit");
+  const [imageNaturalSize, setImageNaturalSize] = useState({ width: 0, height: 0 });
+  const [imageViewportSize, setImageViewportSize] = useState({ width: 0, height: 0 });
+  const [imageBaseMode, setImageBaseMode] = useState<ImageBaseMode>('fit');
   const imageViewportResizeObserverRef = useRef<ResizeObserver | null>(null);
   const [imagePan, setImagePan] = useState({ x: 0, y: 0 });
   const [isImageDragging, setIsImageDragging] = useState(false);
@@ -146,9 +101,9 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
 
   const byteOffsetRef = useRef(0);
   const totalBytesRef = useRef<number | null>(null);
-  const remainderRef = useRef("");
+  const remainderRef = useRef('');
   const isFetchingRef = useRef(false);
-  const previewUrlRef = useRef("");
+  const previewUrlRef = useRef('');
   const textDecoderRef = useRef<TextDecoder | null>(null);
   const decoderEncodingRef = useRef<string | null>(null);
   const decoderHasExplicitCharsetRef = useRef(false);
@@ -156,99 +111,71 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
   const observerRef = useRef<IntersectionObserver | null>(null);
   const markdownContainerRef = useRef<HTMLDivElement | null>(null);
   const textFetchSessionRef = useRef(0);
-  const csvDelimiterRef = useRef<string>(",");
-
-  const handleKnowledgePreviewAccessError = useCallback(
-    (reason: PreviewAccessReason) => {
-      if (previewContext !== "knowledgeBase") {
-        return false;
-      }
-      const key =
-        reason === "forbidden"
-          ? "filePreview.knowledge.accessDenied"
-          : "filePreview.knowledge.noStoredCopy";
-      Modal.info({
-        title: t(`${key}.title`),
-        content: t(`${key}.content`),
-        okText: t("common.confirm"),
-        centered: true,
-      });
-      onClose();
-      return true;
-    },
-    [previewContext, t, onClose]
-  );
+  const csvDelimiterRef = useRef<string>(',');
 
   const resetTextPreviewState = useCallback(() => {
-    setTextContent("");
+    setTextContent('');
     setTxtLines([]);
     setCsvRows([]);
     setLoadingMore(false);
 
     byteOffsetRef.current = 0;
     totalBytesRef.current = null;
-    remainderRef.current = "";
+    remainderRef.current = '';
     isFetchingRef.current = false;
     textDecoderRef.current = null;
     decoderEncodingRef.current = null;
     decoderHasExplicitCharsetRef.current = false;
     decoderAllowGbFallbackRef.current = false;
-    csvDelimiterRef.current = ",";
+    csvDelimiterRef.current = ',';
 
     observerRef.current?.disconnect();
     observerRef.current = null;
   }, []);
 
   const getDetectedFileType = useCallback((): DetectedFileType => {
-    const mime = providedFileType?.toLowerCase() || "";
-
-    if (mime === "application/pdf") return "pdf";
-
-    if (
-      mime === "application/msword" ||
-      mime ===
-        "application/vnd.openxmlformats-officedocument.wordprocessingml.document" ||
-      mime === "application/vnd.ms-excel" ||
-      mime ===
-        "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" ||
-      mime === "application/vnd.ms-powerpoint" ||
-      mime ===
-        "application/vnd.openxmlformats-officedocument.presentationml.presentation"
-    ) {
-      return isLocalSource ? "office" : "pdf";
+    const mime = providedFileType?.toLowerCase() || '';
+
+    if (mime === 'application/pdf') return 'pdf';
+    
+    if (mime === 'application/msword' || 
+        mime === 'application/vnd.openxmlformats-officedocument.wordprocessingml.document' ||
+        mime === 'application/vnd.ms-excel' || 
+        mime === 'application/vnd.openxmlformats-officedocument.spreadsheetml.sheet' ||
+        mime === 'application/vnd.ms-powerpoint' || 
+        mime === 'application/vnd.openxmlformats-officedocument.presentationml.presentation') {
+      return isLocalSource ? 'office' : 'pdf';
     }
+    
+    if (mime.startsWith('image/')) return 'image';
+    
+    if (mime === 'text/markdown') return 'markdown';
 
-    if (mime.startsWith("image/")) return "image";
-
-    if (mime === "text/markdown") return "markdown";
-
-    if (mime === "text/csv") return "csv";
+    if (mime === 'text/csv') return 'csv';
 
-    if (mime === "text/html") return "html";
+    if (mime === 'text/html') return 'html';
 
-    if (mime === "text/plain") return "text";
+    if (mime === 'text/plain') return 'text';
 
-    const extension = fileName.split(".").pop()?.toLowerCase() || "";
-
-    if (extension === "pdf") return "pdf";
-    if (["doc", "docx", "xls", "xlsx", "ppt", "pptx"].includes(extension)) {
-      return isLocalSource ? "office" : "pdf";
+    const extension = fileName.split('.').pop()?.toLowerCase() || '';
+    
+    if (extension === 'pdf') return 'pdf';
+    if (['doc', 'docx', 'xls', 'xlsx', 'ppt', 'pptx'].includes(extension)) {
+      return isLocalSource ? 'office' : 'pdf';
     }
-    if (["jpg", "jpeg", "png", "gif", "webp", "svg", "bmp"].includes(extension))
-      return "image";
-    if (["md", "markdown"].includes(extension)) return "markdown";
-    if (extension === "csv") return "csv";
-    if (["html", "htm"].includes(extension)) return "html";
-    if (["txt", "log", "json", "xml", "yaml", "yml"].includes(extension))
-      return "text";
-
-    return "unknown";
+    if (['jpg', 'jpeg', 'png', 'gif', 'webp', 'svg', 'bmp'].includes(extension)) return 'image';
+    if (['md', 'markdown'].includes(extension)) return 'markdown';
+    if (extension === 'csv') return 'csv';
+    if (['html', 'htm'].includes(extension)) return 'html';
+    if (['txt', 'log', 'json', 'xml', 'yaml', 'yml'].includes(extension)) return 'text';
+
+    return 'unknown';
   }, [providedFileType, fileName, isLocalSource]);
 
   const detectedFileType = getDetectedFileType();
 
   const markdownHeadings = useMemo<MarkdownHeading[]>(() => {
-    if (detectedFileType !== "markdown" || !textContent) {
+    if (detectedFileType !== 'markdown' || !textContent) {
       return [];
     }
     return extractMarkdownHeadings(textContent);
@@ -261,21 +188,16 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
     }
     return blocks;
   }, [txtLines]);
-
+  
   const isEmptyFile = fileSize === 0;
   const isTooLargeToPreview = !!(fileSize && fileSize > 100 * 1024 * 1024);
 
   const normalizedImageRotation = ((imageRotation % 360) + 360) % 360;
   const imageFitScale = useMemo(
-    () =>
-      computeRotateFitScale(
-        normalizedImageRotation,
-        imageNaturalSize,
-        imageViewportSize
-      ),
-    [imageNaturalSize, imageViewportSize, normalizedImageRotation]
+    () => computeRotateFitScale(normalizedImageRotation, imageNaturalSize, imageViewportSize),
+    [imageNaturalSize, imageViewportSize, normalizedImageRotation],
   );
-  const imageBaseScale = imageBaseMode === "fit" ? imageFitScale : 1;
+  const imageBaseScale = imageBaseMode === 'fit' ? imageFitScale : 1;
   const effectiveImageScale = imageScale * imageBaseScale;
   const imageScaleMin = imageBaseScale > 0 ? 0.25 / imageBaseScale : 0.25;
   const imageScaleMax = imageBaseScale > 0 ? 6 / imageBaseScale : 6;
@@ -285,38 +207,26 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
     if (naturalWidth <= 0 || naturalHeight <= 0) {
       return { width: 0, height: 0 };
     }
-    const isQuarterTurn =
-      normalizedImageRotation === 90 || normalizedImageRotation === 270;
-    const displayWidth =
-      (isQuarterTurn ? naturalHeight : naturalWidth) * effectiveImageScale;
-    const displayHeight =
-      (isQuarterTurn ? naturalWidth : naturalHeight) * effectiveImageScale;
+    const isQuarterTurn = normalizedImageRotation === 90 || normalizedImageRotation === 270;
+    const displayWidth = (isQuarterTurn ? naturalHeight : naturalWidth) * effectiveImageScale;
+    const displayHeight = (isQuarterTurn ? naturalWidth : naturalHeight) * effectiveImageScale;
     return { width: displayWidth, height: displayHeight };
   }, [imageNaturalSize, normalizedImageRotation, effectiveImageScale]);
 
-  const clampImagePan = useCallback(
-    (pan: { x: number; y: number }) => {
-      const { width: viewportWidth, height: viewportHeight } =
-        imageViewportSize;
-      const { width: displayWidth, height: displayHeight } = imageDisplaySize;
-      if (
-        viewportWidth <= 0 ||
-        viewportHeight <= 0 ||
-        displayWidth <= 0 ||
-        displayHeight <= 0
-      ) {
-        return { x: 0, y: 0 };
-      }
+  const clampImagePan = useCallback((pan: { x: number; y: number }) => {
+    const { width: viewportWidth, height: viewportHeight } = imageViewportSize;
+    const { width: displayWidth, height: displayHeight } = imageDisplaySize;
+    if (viewportWidth <= 0 || viewportHeight <= 0 || displayWidth <= 0 || displayHeight <= 0) {
+      return { x: 0, y: 0 };
+    }
 
-      const maxPanX = Math.max(0, (displayWidth - viewportWidth) / 2);
-      const maxPanY = Math.max(0, (displayHeight - viewportHeight) / 2);
-      return {
-        x: clamp(pan.x, -maxPanX, maxPanX),
-        y: clamp(pan.y, -maxPanY, maxPanY),
-      };
-    },
-    [imageDisplaySize, imageViewportSize]
-  );
+    const maxPanX = Math.max(0, (displayWidth - viewportWidth) / 2);
+    const maxPanY = Math.max(0, (displayHeight - viewportHeight) / 2);
+    return {
+      x: clamp(pan.x, -maxPanX, maxPanX),
+      y: clamp(pan.y, -maxPanY, maxPanY),
+    };
+  }, [imageDisplaySize, imageViewportSize]);
 
   useEffect(() => {
     imagePanRef.current = imagePan;
@@ -331,21 +241,13 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
     if (imageNaturalSize.width === 0 || imageNaturalSize.height === 0) return;
     if (imageViewportSize.width === 0 || imageViewportSize.height === 0) return;
     const normalizedRotation = ((imageRotation % 360) + 360) % 360;
-    const isQuarterTurn =
-      normalizedRotation === 90 || normalizedRotation === 270;
-    const rotatedWidth = isQuarterTurn
-      ? imageNaturalSize.height
-      : imageNaturalSize.width;
-    const rotatedHeight = isQuarterTurn
-      ? imageNaturalSize.width
-      : imageNaturalSize.height;
-    if (
-      rotatedWidth > imageViewportSize.width ||
-      rotatedHeight > imageViewportSize.height
-    ) {
-      setImageBaseMode("fit");
+    const isQuarterTurn = normalizedRotation === 90 || normalizedRotation === 270;
+    const rotatedWidth = isQuarterTurn ? imageNaturalSize.height : imageNaturalSize.width;
+    const rotatedHeight = isQuarterTurn ? imageNaturalSize.width : imageNaturalSize.height;
+    if (rotatedWidth > imageViewportSize.width || rotatedHeight > imageViewportSize.height) {
+      setImageBaseMode('fit');
     } else {
-      setImageBaseMode("actual");
+      setImageBaseMode('actual');
     }
   }, [open, imageNaturalSize, imageViewportSize, imageRotation]);
 
@@ -375,128 +277,109 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
     setIsImageDragging(false);
   }, []);
 
-  const applyImageScale = useCallback(
-    (nextScale: number, anchorX = 0, anchorY = 0) => {
-      const currentScale = imageScaleRef.current;
-      if (nextScale === currentScale) {
-        return;
-      }
-      const scaleRatio = nextScale / currentScale;
-      const currentPan = imagePanRef.current;
-      const nextPan = clampImagePan({
-        x: anchorX - scaleRatio * (anchorX - currentPan.x),
-        y: anchorY - scaleRatio * (anchorY - currentPan.y),
-      });
-      imagePanRef.current = nextPan;
-      setImagePan(nextPan);
-      imageScaleRef.current = nextScale;
-      setImageScale(nextScale);
-    },
-    [clampImagePan]
-  );
+  const applyImageScale = useCallback((nextScale: number, anchorX = 0, anchorY = 0) => {
+    const currentScale = imageScaleRef.current;
+    if (nextScale === currentScale) {
+      return;
+    }
+    const scaleRatio = nextScale / currentScale;
+    const currentPan = imagePanRef.current;
+    const nextPan = clampImagePan({
+      x: anchorX - scaleRatio * (anchorX - currentPan.x),
+      y: anchorY - scaleRatio * (anchorY - currentPan.y),
+    });
+    imagePanRef.current = nextPan;
+    setImagePan(nextPan);
+    imageScaleRef.current = nextScale;
+    setImageScale(nextScale);
+  }, [clampImagePan]);
 
-  const handleImageWheel = useCallback(
-    (event: ReactWheelEvent<HTMLDivElement>) => {
-      if (imageLoadError) {
-        return;
-      }
+  const handleImageWheel = useCallback((event: ReactWheelEvent<HTMLDivElement>) => {
+    if (imageLoadError) {
+      return;
+    }
 
-      event.preventDefault();
+    event.preventDefault();
 
-      const currentScale = imageScaleRef.current;
-      const zoomFactor = Math.exp(-event.deltaY * 0.0015);
-      const nextScale = clamp(
-        currentScale * zoomFactor,
-        imageScaleMin,
-        imageScaleMax
-      );
-      if (nextScale === currentScale) {
-        return;
-      }
+    const currentScale = imageScaleRef.current;
+    const zoomFactor = Math.exp(-event.deltaY * 0.0015);
+    const nextScale = clamp(currentScale * zoomFactor, imageScaleMin, imageScaleMax);
+    if (nextScale === currentScale) {
+      return;
+    }
 
-      const rect = event.currentTarget.getBoundingClientRect();
-      const cursorX = event.clientX - rect.left - rect.width / 2;
-      const cursorY = event.clientY - rect.top - rect.height / 2;
-      applyImageScale(nextScale, cursorX, cursorY);
-    },
-    [applyImageScale, imageLoadError, imageScaleMin, imageScaleMax]
-  );
+    const rect = event.currentTarget.getBoundingClientRect();
+    const cursorX = event.clientX - rect.left - rect.width / 2;
+    const cursorY = event.clientY - rect.top - rect.height / 2;
+    applyImageScale(nextScale, cursorX, cursorY);
+  }, [applyImageScale, imageLoadError, imageScaleMin, imageScaleMax]);
 
-  const handleImagePointerDown = useCallback(
-    (event: ReactPointerEvent<HTMLDivElement>) => {
-      if (imageLoadError || event.button !== 0) {
-        return;
-      }
+  const handleImagePointerDown = useCallback((event: ReactPointerEvent<HTMLDivElement>) => {
+    if (imageLoadError || event.button !== 0) {
+      return;
+    }
 
-      event.preventDefault();
-      event.currentTarget.setPointerCapture(event.pointerId);
-      setIsImageDragging(true);
-      dragStateRef.current = {
-        isDragging: true,
-        pointerId: event.pointerId,
-        startX: event.clientX,
-        startY: event.clientY,
-        startPanX: imagePanRef.current.x,
-        startPanY: imagePanRef.current.y,
-      };
-    },
-    [imageLoadError]
-  );
+    event.preventDefault();
+    event.currentTarget.setPointerCapture(event.pointerId);
+    setIsImageDragging(true);
+    dragStateRef.current = {
+      isDragging: true,
+      pointerId: event.pointerId,
+      startX: event.clientX,
+      startY: event.clientY,
+      startPanX: imagePanRef.current.x,
+      startPanY: imagePanRef.current.y,
+    };
+  }, [imageLoadError]);
 
-  const handleImagePointerMove = useCallback(
-    (event: ReactPointerEvent<HTMLDivElement>) => {
-      const dragState = dragStateRef.current;
-      if (!dragState.isDragging || dragState.pointerId !== event.pointerId) {
-        return;
-      }
+  const handleImagePointerMove = useCallback((event: ReactPointerEvent<HTMLDivElement>) => {
+    const dragState = dragStateRef.current;
+    if (!dragState.isDragging || dragState.pointerId !== event.pointerId) {
+      return;
+    }
 
-      event.preventDefault();
-      const nextPan = {
-        x: dragState.startPanX + (event.clientX - dragState.startX),
-        y: dragState.startPanY + (event.clientY - dragState.startY),
-      };
-      const clamped = clampImagePan(nextPan);
-      imagePanRef.current = clamped;
-      setImagePan(clamped);
-    },
-    [clampImagePan]
-  );
+    event.preventDefault();
+    const nextPan = {
+      x: dragState.startPanX + (event.clientX - dragState.startX),
+      y: dragState.startPanY + (event.clientY - dragState.startY),
+    };
+    const clamped = clampImagePan(nextPan);
+    imagePanRef.current = clamped;
+    setImagePan(clamped);
+  }, [clampImagePan]);
 
-  const handleImagePointerEnd = useCallback(
-    (event: ReactPointerEvent<HTMLDivElement>) => {
-      const dragState = dragStateRef.current;
-      if (dragState.pointerId !== event.pointerId) {
-        return;
-      }
+  const handleImagePointerEnd = useCallback((event: ReactPointerEvent<HTMLDivElement>) => {
+    const dragState = dragStateRef.current;
+    if (dragState.pointerId !== event.pointerId) {
+      return;
+    }
 
-      dragStateRef.current = {
-        isDragging: false,
-        pointerId: null,
-        startX: 0,
-        startY: 0,
-        startPanX: 0,
-        startPanY: 0,
-      };
-      setIsImageDragging(false);
-    },
-    []
-  );
+    dragStateRef.current = {
+      isDragging: false,
+      pointerId: null,
+      startX: 0,
+      startY: 0,
+      startPanX: 0,
+      startPanY: 0,
+    };
+    setIsImageDragging(false);
+  }, []);
 
   const handleImageDoubleClick = useCallback(() => {
-    if (imageScale !== 1 || imageBaseMode !== "fit") {
-      setImageBaseMode("fit");
+    if (imageScale !== 1 || imageBaseMode !== 'fit') {
+      setImageBaseMode('fit');
       setImageScale(1);
       imageScaleRef.current = 1;
     } else {
-      setImageBaseMode("actual");
+      setImageBaseMode('actual');
     }
   }, [imageBaseMode, imageScale]);
 
   const toggleImageBaseMode = useCallback(() => {
-    if (imageBaseMode === "fit") {
-      setImageBaseMode("actual");
+    if (imageBaseMode === 'fit') {
+      setImageBaseMode('actual');
     } else {
-      setImageBaseMode("fit");
+      setImageBaseMode('fit');
     }
     setImageScale(1);
     imageScaleRef.current = 1;
@@ -507,178 +390,118 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
     const clamped = clampImagePan(imagePanRef.current);
     imagePanRef.current = clamped;
     setImagePan(clamped);
-  }, [
-    clampImagePan,
-    effectiveImageScale,
-    normalizedImageRotation,
-    imageViewportSize,
-  ]);
-
-  const fetchTextChunk = useCallback(
-    async (
-      url: string,
-      isFirst = false,
-      sessionId?: number,
-      signal?: AbortSignal
-    ): Promise<void> => {
-      const activeSessionId = sessionId ?? textFetchSessionRef.current;
-      if (!url) {
-        if (isFirst) setLoading(false);
-        else setLoadingMore(false);
+  }, [clampImagePan, effectiveImageScale, normalizedImageRotation, imageViewportSize]);
+
+  const fetchTextChunk = useCallback(async (url: string, isFirst = false, sessionId?: number): Promise<void> => {
+    const activeSessionId = sessionId ?? textFetchSessionRef.current;
+    if (!url) {
+      if (isFirst) setLoading(false);
+      else setLoadingMore(false);
+      return;
+    }
+    if (isFetchingRef.current) return;
+    if (totalBytesRef.current !== null && byteOffsetRef.current >= totalBytesRef.current) return;
+
+    isFetchingRef.current = true;
+    if (!isFirst) setLoadingMore(true);
+
+    try {
+      const start = byteOffsetRef.current;
+      const end   = start + CHUNK_SIZE - 1;
+      const resp = await fetch(url, {
+        headers: { Range: `bytes=${start}-${end}` },
+        cache: 'no-store',
+      });
+      if (shouldStopFetchingChunk(activeSessionId, textFetchSessionRef.current)) return;
+      if (handlePreviewChunkBoundaryResponse(
+        resp.status,
+        isFirst,
+        setServerTooLarge,
+        setLoading,
+        setLoadingMore,
+        observerRef,
+        isFetchingRef,
+      )) {
         return;
       }
-      if (isFetchingRef.current) return;
-      if (
-        totalBytesRef.current !== null &&
-        byteOffsetRef.current >= totalBytesRef.current
-      )
+      if (!resp.ok && resp.status !== 206) throw new Error(`HTTP ${resp.status}`);
+
+      const contentRange = resp.headers.get('Content-Range');
+      const buf = await resp.arrayBuffer();
+      if (shouldStopFetchingChunk(activeSessionId, textFetchSessionRef.current)) return;
+      const hasMore = updateChunkRangeState(contentRange, buf.byteLength, byteOffsetRef, totalBytesRef);
+      ensurePreviewTextDecoder(
+        resp.headers.get('Content-Type'),
+        textDecoderRef,
+        decoderEncodingRef,
+        decoderHasExplicitCharsetRef,
+        decoderAllowGbFallbackRef,
+      );
+      const raw = decodePreviewChunk(
+        buf,
+        hasMore,
+        textDecoderRef,
+        decoderEncodingRef,
+        decoderAllowGbFallbackRef,
+      );
+      const { remainder, safeText } = splitPreviewSafeText(
+        raw,
+        remainderRef.current,
+        hasMore,
+        detectedFileType,
+      );
+      if (shouldStopFetchingChunk(activeSessionId, textFetchSessionRef.current)) return;
+      remainderRef.current = remainder;
+      appendTextPreviewContent({
+        detectedFileType,
+        safeText,
+        byteOffset: byteOffsetRef.current,
+        currentChunkLength: buf.byteLength,
+        csvDelimiterRef,
+        setTxtLines,
+        setCsvRows,
+        setTextContent,
+      });
+      if (!hasMore) observerRef.current?.disconnect();
+    } finally {
+      if (shouldStopFetchingChunk(activeSessionId, textFetchSessionRef.current)) {
         return;
+      }
+      isFetchingRef.current = false;
+      if (isFirst) setLoading(false);
+      else setLoadingMore(false);
+    }
+  }, [detectedFileType]);
 
-      isFetchingRef.current = true;
-      if (!isFirst) setLoadingMore(true);
-
-      try {
-        const start = byteOffsetRef.current;
-        const end = start + CHUNK_SIZE - 1;
-        const resp = await fetch(url, {
-          headers: { Range: `bytes=${start}-${end}` },
-          cache: "no-store",
-          credentials: "include",
-          signal,
-        });
-        if (
-          shouldStopFetchingChunk(activeSessionId, textFetchSessionRef.current)
-        )
-          return;
-        if (
-          handlePreviewChunkBoundaryResponse(
-            resp.status,
-            isFirst,
-            setServerTooLarge,
-            setLoading,
-            setLoadingMore,
-            observerRef,
-            isFetchingRef
-          )
-        ) {
-          return;
-        }
-        const accessReason = getPreviewAccessReasonFromStatus(resp.status);
-        if (accessReason) {
-          if (handleKnowledgePreviewAccessError(accessReason)) {
-            return;
-          }
-          throw new Error(`HTTP ${resp.status}`);
-        }
-        if (!resp.ok && resp.status !== 206)
-          throw new Error(`HTTP ${resp.status}`);
-
-        const contentRange = resp.headers.get("Content-Range");
-        const buf = await resp.arrayBuffer();
-        if (
-          shouldStopFetchingChunk(activeSessionId, textFetchSessionRef.current)
-        )
-          return;
-        const hasMore = updateChunkRangeState(
-          contentRange,
-          buf.byteLength,
-          byteOffsetRef,
-          totalBytesRef
-        );
-        ensurePreviewTextDecoder(
-          resp.headers.get("Content-Type"),
-          textDecoderRef,
-          decoderEncodingRef,
-          decoderHasExplicitCharsetRef,
-          decoderAllowGbFallbackRef
-        );
-        const raw = decodePreviewChunk(
-          buf,
-          hasMore,
-          textDecoderRef,
-          decoderEncodingRef,
-          decoderAllowGbFallbackRef
-        );
-        const { remainder, safeText } = splitPreviewSafeText(
-          raw,
-          remainderRef.current,
-          hasMore,
-          detectedFileType
-        );
-        if (
-          shouldStopFetchingChunk(activeSessionId, textFetchSessionRef.current)
-        )
-          return;
-        remainderRef.current = remainder;
-        appendTextPreviewContent({
-          detectedFileType,
-          safeText,
-          byteOffset: byteOffsetRef.current,
-          currentChunkLength: buf.byteLength,
-          csvDelimiterRef,
-          setTxtLines,
-          setCsvRows,
-          setTextContent,
-        });
-        if (!hasMore) observerRef.current?.disconnect();
-      } finally {
-        if (
-          shouldStopFetchingChunk(activeSessionId, textFetchSessionRef.current)
-        ) {
-          return;
+  const setupSentinelObserver = useCallback((node: HTMLDivElement | null) => {
+    observerRef.current?.disconnect();
+    observerRef.current = null;
+    if (!isValidContainerElement(node)) return;
+    const observer = new IntersectionObserver(entries => {
+      if (entries[0].isIntersecting) {
+        if (!isLocalSource && previewUrlRef.current && (totalBytesRef.current === null || byteOffsetRef.current < totalBytesRef.current)) {
+          fetchTextChunk(previewUrlRef.current).catch(err =>
+            log.error('Failed to fetch next text chunk:', err)
+          );
         }
-        isFetchingRef.current = false;
-        if (isFirst) setLoading(false);
-        else setLoadingMore(false);
       }
-    },
-    [detectedFileType, handleKnowledgePreviewAccessError]
-  );
-
-  const setupSentinelObserver = useCallback(
-    (node: HTMLDivElement | null) => {
-      observerRef.current?.disconnect();
-      observerRef.current = null;
-      if (!isValidContainerElement(node)) return;
-      const observer = new IntersectionObserver(
-        (entries) => {
-          if (entries[0].isIntersecting) {
-            if (
-              !isLocalSource &&
-              previewUrlRef.current &&
-              (totalBytesRef.current === null ||
-                byteOffsetRef.current < totalBytesRef.current)
-            ) {
-              fetchTextChunk(previewUrlRef.current).catch((err) =>
-                log.error("Failed to fetch next text chunk:", err)
-              );
-            }
-          }
-        },
-        { threshold: 0.1 }
-      );
-      observer.observe(node);
-      observerRef.current = observer;
-    },
-    [fetchTextChunk, isLocalSource]
-  );
+    }, { threshold: 0.1 });
+    observer.observe(node);
+    observerRef.current = observer;
+  }, [fetchTextChunk, isLocalSource]);
 
   useEffect(() => {
     if (!open || (!isLocalSource && !objectName)) {
       return;
     }
 
-    let cancelled = false;
-    const abortController = new AbortController();
-    const { signal } = abortController;
-
     const loadPreview = async () => {
       setLoading(true);
       setError(null);
 
       try {
         if (isEmptyFile) {
-          setPreviewUrl("");
+          setPreviewUrl('');
           setLoading(false);
           return;
         }
@@ -688,20 +511,17 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
         if (isLocalSource && localFile) {
           resetTextPreviewState();
           const previousPreviewUrl = previewUrlRef.current;
-          if (previousPreviewUrl.startsWith("blob:")) {
+          if (previousPreviewUrl.startsWith('blob:')) {
             URL.revokeObjectURL(previousPreviewUrl);
           }
-          previewUrlRef.current = "";
+          previewUrlRef.current = '';
 
-          if (
-            isTooLargeToPreview &&
-            ["text", "markdown", "csv", "html"].includes(detectedFileType)
-          ) {
+          if (isTooLargeToPreview && ['text', 'markdown', 'csv', 'html'].includes(detectedFileType)) {
             setLoading(false);
             return;
           }
-
-          if (detectedFileType === "image" || detectedFileType === "pdf") {
+          
+          if (detectedFileType === 'image' || detectedFileType === 'pdf') {
             localPreviewUrl = URL.createObjectURL(localFile);
             setPreviewUrl(localPreviewUrl);
             previewUrlRef.current = localPreviewUrl;
@@ -709,10 +529,10 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
             return;
           }
 
-          if (detectedFileType === "text") {
+          if (detectedFileType === 'text') {
             const text = await decodeLocalTextFile(localFile);
-            const newLines = text.split("\n");
-            if (newLines.at(-1) === "") {
+            const newLines = text.split('\n');
+            if (newLines.at(-1) === '') {
               newLines.pop();
             }
             setTxtLines(newLines);
@@ -720,26 +540,24 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
             return;
           }
 
-          if (detectedFileType === "markdown") {
+          if (detectedFileType === 'markdown') {
             setTextContent(await decodeLocalTextFile(localFile));
             setLoading(false);
             return;
           }
 
-          if (detectedFileType === "html") {
+          if (detectedFileType === 'html') {
             const html = await decodeLocalTextFile(localFile);
             setTextContent(html);
             setLoading(false);
             return;
           }
 
-          if (detectedFileType === "csv") {
+          if (detectedFileType === 'csv') {
             const text = await decodeLocalTextFile(localFile);
             const delimiter = detectCsvDelimiter(text);
             csvDelimiterRef.current = delimiter;
-            const newLines = text
-              .split("\n")
-              .filter((line) => line.trim().length > 0);
+            const newLines = text.split('\n').filter(line => line.trim().length > 0);
             setCsvRows(newLines.map((line) => parseCsvLine(line, delimiter)));
             setLoading(false);
             return;
@@ -751,87 +569,34 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
 
         const url = storageService.getPreviewUrl(objectName, fileName);
 
-        if (["markdown", "csv", "text", "html"].includes(detectedFileType)) {
-          if (cancelled) return;
-          textFetchSessionRef.current += 1;
-          const sessionId = textFetchSessionRef.current;
-          resetTextPreviewState();
-          setPreviewUrl(url);
-          previewUrlRef.current = url;
-          await fetchTextChunk(url, true, sessionId, signal);
-          return;
-        }
-
-        if (detectedFileType === "pdf" || detectedFileType === "image") {
-          if (cancelled) return;
-          if (isTooLargeToPreview) {
-            setLoading(false);
+          if (['markdown', 'csv', 'text', 'html'].includes(detectedFileType)) {
+            textFetchSessionRef.current += 1;
+            const sessionId = textFetchSessionRef.current;
+            resetTextPreviewState();
+            setPreviewUrl(url);
+            previewUrlRef.current = url;
+            await fetchTextChunk(url, true, sessionId);
             return;
           }
-          const previousPreviewUrl = previewUrlRef.current;
-          if (previousPreviewUrl.startsWith("blob:")) {
-            URL.revokeObjectURL(previousPreviewUrl);
-          }
-          previewUrlRef.current = "";
-
-          const blob = await fetchPreviewBlob(url, signal);
-          if (cancelled) return;
-
-          const blobUrl = URL.createObjectURL(blob);
-          previewUrlRef.current = blobUrl;
-          setPreviewUrl(blobUrl);
-          setLoading(false);
-          return;
-        }
 
         setPreviewUrl(url);
         previewUrlRef.current = url;
+
         setLoading(false);
       } catch (err) {
-        if (ignoreAbortError(err) || cancelled) {
-          return;
-        }
-        if (
-          err instanceof PreviewAccessError &&
-          handleKnowledgePreviewAccessError(err.reason)
-        ) {
-          setLoading(false);
-          return;
-        }
-        log.error("Failed to load preview:", err);
-        setError(
-          err instanceof Error ? err.message : t("filePreview.previewFailed")
-        );
+        log.error('Failed to load preview:', err);
+        setError(err instanceof Error ? err.message : t('filePreview.previewFailed'));
         setLoading(false);
       }
     };
 
     void loadPreview();
-
-    return () => {
-      cancelled = true;
-      abortController.abort();
-      textFetchSessionRef.current += 1;
-    };
-  }, [
-    open,
-    objectName,
-    fileName,
-    detectedFileType,
-    t,
-    fetchTextChunk,
-    resetTextPreviewState,
-    isEmptyFile,
-    isLocalSource,
-    localFile,
-    handleKnowledgePreviewAccessError,
-    isTooLargeToPreview,
-  ]);
+  }, [open, objectName, fileName, detectedFileType, t, fetchTextChunk, resetTextPreviewState, isEmptyFile, isLocalSource, localFile]);
 
   useEffect(() => {
     return () => {
       const currentPreviewUrl = previewUrlRef.current;
-      if (currentPreviewUrl.startsWith("blob:")) {
+      if (currentPreviewUrl.startsWith('blob:')) {
         URL.revokeObjectURL(currentPreviewUrl);
       }
     };
@@ -845,13 +610,13 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
       setImageRotation(0);
       setImageNaturalSize({ width: 0, height: 0 });
       setImageViewportSize({ width: 0, height: 0 });
-      setImageBaseMode("fit");
+      setImageBaseMode('fit');
       handleImagePanReset();
-      setTextContent("");
+      setTextContent('');
       setTxtLines([]);
       setCsvRows([]);
       setCsvTableHeight(400);
-      setPreviewUrl("");
+      setPreviewUrl('');
       setError(null);
       setImageLoadError(false);
       setLoadingMore(false);
@@ -859,7 +624,7 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
       textFetchSessionRef.current += 1;
       byteOffsetRef.current = 0;
       totalBytesRef.current = null;
-      remainderRef.current = "";
+      remainderRef.current = '';
       isFetchingRef.current = false;
       textDecoderRef.current = null;
       decoderEncodingRef.current = null;
@@ -869,10 +634,10 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
       observerRef.current = null;
       imageViewportResizeObserverRef.current?.disconnect();
       imageViewportResizeObserverRef.current = null;
-      if (previousPreviewUrl.startsWith("blob:")) {
+      if (previousPreviewUrl.startsWith('blob:')) {
         URL.revokeObjectURL(previousPreviewUrl);
       }
-      previewUrlRef.current = "";
+      previewUrlRef.current = '';
     }
   }, [open]);
 
@@ -887,20 +652,20 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
     if (!open) return;
 
     const handleKeyDown = (e: KeyboardEvent) => {
-      if (e.key === "Escape") {
+      if (e.key === 'Escape') {
         onClose();
       }
     };
 
-    globalThis.addEventListener("keydown", handleKeyDown);
-    return () => globalThis.removeEventListener("keydown", handleKeyDown);
+    globalThis.addEventListener('keydown', handleKeyDown);
+    return () => globalThis.removeEventListener('keydown', handleKeyDown);
   }, [open, onClose]);
 
   const handleDownload = async () => {
     try {
       if (isLocalSource && localFile) {
         const url = URL.createObjectURL(localFile);
-        const link = document.createElement("a");
+        const link = document.createElement('a');
         link.href = url;
         link.download = fileName;
         link.click();
@@ -910,7 +675,7 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
 
       await storageService.downloadFile(objectName, fileName);
     } catch (err) {
-      log.error("Failed to download file:", err);
+      log.error('Failed to download file:', err);
     }
   };
 
@@ -925,22 +690,19 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
 
     if (
       isFetchingRef.current ||
-      (totalBytesRef.current !== null &&
-        byteOffsetRef.current >= totalBytesRef.current)
+      (totalBytesRef.current !== null && byteOffsetRef.current >= totalBytesRef.current)
     ) {
       return;
     }
 
-    fetchTextChunk(previewUrlRef.current).catch((err) =>
-      log.error("Failed to fetch next text chunk:", err)
+    fetchTextChunk(previewUrlRef.current).catch(err =>
+      log.error('Failed to fetch next text chunk:', err)
     );
   }, [fetchTextChunk, isLocalSource]);
 
   const handleMarkdownHeadingClick = useCallback((headingId: string) => {
     const container = markdownContainerRef.current;
-    const target =
-      container?.querySelector<HTMLElement>(`#${CSS.escape(headingId)}`) ??
-      null;
+    const target = container?.querySelector<HTMLElement>(`#${CSS.escape(headingId)}`) ?? null;
 
     if (!container || !target) {
       return;
@@ -948,10 +710,9 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
 
     const containerRect = container.getBoundingClientRect();
     const targetRect = target.getBoundingClientRect();
-    const nextScrollTop =
-      container.scrollTop + targetRect.top - containerRect.top;
+    const nextScrollTop = container.scrollTop + targetRect.top - containerRect.top;
 
-    container.scrollTo({ top: Math.max(nextScrollTop, 0), behavior: "smooth" });
+    container.scrollTo({ top: Math.max(nextScrollTop, 0), behavior: 'smooth' });
 
     if (globalThis.innerWidth < 768) {
       setShowMarkdownToc(false);
@@ -962,7 +723,7 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
     <div className="flex items-center justify-center h-full">
       <div className="text-center">
         <div className="animate-spin rounded-full h-8 w-8 border-b-2 border-blue-500 mx-auto mb-2"></div>
-        <p className="text-sm text-gray-600">{t("filePreview.loading")}</p>
+        <p className="text-sm text-gray-600">{t('filePreview.loading')}</p>
       </div>
     </div>
   );
@@ -970,7 +731,7 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
   const renderCenteredErrorState = () => (
     <div className="flex items-center justify-center h-full">
       <div className="text-center max-w-md px-4">
-        <p className="text-red-500 text-sm">{t("filePreview.previewFailed")}</p>
+        <p className="text-red-500 text-sm">{t('filePreview.previewFailed')}</p>
       </div>
     </div>
   );
@@ -978,7 +739,10 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
   const renderError = () => renderCenteredErrorState();
 
   const renderPdfViewer = () => (
-    <PdfViewer url={previewUrl} fileName={fileName} />
+    <PdfViewer
+      url={previewUrl}
+      fileName={fileName}
+    />
   );
 
   const renderImageViewer = () => (
@@ -1001,16 +765,14 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
             <div
               className="absolute inset-0 flex items-center justify-center"
               style={{
-                perspective: "1000px",
+                perspective: '1000px',
               }}
             >
               <div
                 style={{
                   transform: `translate(${imagePan.x}px, ${imagePan.y}px) scale(${effectiveImageScale}) rotate(${imageRotation}deg)`,
-                  willChange: "transform",
-                  transition: isImageDragging
-                    ? "none"
-                    : "transform 0.2s ease-in-out",
+                  willChange: 'transform',
+                  transition: isImageDragging ? 'none' : 'transform 0.2s ease-in-out',
                 }}
               >
                 <img
@@ -1020,10 +782,7 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
                   draggable={false}
                   onLoad={(e) => {
                     const img = e.currentTarget;
-                    setImageNaturalSize({
-                      width: img.naturalWidth,
-                      height: img.naturalHeight,
-                    });
+                    setImageNaturalSize({ width: img.naturalWidth, height: img.naturalHeight });
                   }}
                   onError={() => setImageLoadError(true)}
                 />
@@ -1038,16 +797,12 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
           <div className="flex items-center gap-1 bg-white/70 backdrop-blur-sm border border-gray-200/60 rounded-full shadow-lg px-3 py-1">
             <button
               onClick={() => {
-                const nextScale = clamp(
-                  imageScaleRef.current - 0.25,
-                  imageScaleMin,
-                  imageScaleMax
-                );
+                const nextScale = clamp(imageScaleRef.current - 0.25, imageScaleMin, imageScaleMax);
                 applyImageScale(nextScale, 0, 0);
               }}
               disabled={effectiveImageScale <= 0.25}
               className="p-1.5 rounded-lg hover:bg-gray-100 transition-colors disabled:opacity-30 text-gray-600"
-              title={t("filePreview.zoomOut")}
+              title={t('filePreview.zoomOut')}
             >
               <Minus size={16} />
             </button>
@@ -1058,16 +813,12 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
 
             <button
               onClick={() => {
-                const nextScale = clamp(
-                  imageScaleRef.current + 0.25,
-                  imageScaleMin,
-                  imageScaleMax
-                );
+                const nextScale = clamp(imageScaleRef.current + 0.25, imageScaleMin, imageScaleMax);
                 applyImageScale(nextScale, 0, 0);
               }}
               disabled={effectiveImageScale >= 6}
               className="p-1.5 rounded-lg hover:bg-gray-100 transition-colors disabled:opacity-30 text-gray-600"
-              title={t("filePreview.zoomIn")}
+              title={t('filePreview.zoomIn')}
             >
               <Plus size={16} />
             </button>
@@ -1078,25 +829,21 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
               onClick={toggleImageBaseMode}
               className="p-1.5 rounded-lg hover:bg-gray-100 transition-colors text-gray-600"
               title={
-                imageBaseMode === "fit"
-                  ? t("filePreview.image.actualSize")
-                  : t("filePreview.image.fitPage")
+                imageBaseMode === 'fit'
+                  ? t('filePreview.image.actualSize')
+                  : t('filePreview.image.fitPage')
               }
             >
-              {imageBaseMode === "fit" ? (
-                <Maximize2 size={16} />
-              ) : (
-                <Minimize2 size={16} />
-              )}
+              {imageBaseMode === 'fit' ? <Maximize2 size={16} /> : <Minimize2 size={16} />}
             </button>
 
             <button
               onClick={() => {
-                setImageRotation((prev) => prev + 90);
+                setImageRotation(prev => prev + 90);
                 handleImagePanReset();
               }}
               className="p-1.5 rounded-lg hover:bg-gray-100 transition-colors text-gray-600"
-              title={t("filePreview.rotate")}
+              title={t('filePreview.rotate')}
             >
               <RotateCw size={16} />
             </button>
@@ -1109,12 +856,10 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
   const renderMarkdownViewer = () => (
     <div className="flex h-full min-h-0 bg-white">
       {markdownHeadings.length > 0 && (
-        <aside
-          className={`${showMarkdownToc ? "flex" : "hidden"} md:flex w-64 flex-shrink-0 flex-col border-r border-gray-200 bg-gray-50/70`}
-        >
+        <aside className={`${showMarkdownToc ? 'flex' : 'hidden'} md:flex w-64 flex-shrink-0 flex-col border-r border-gray-200 bg-gray-50/70`}>
           <div className="flex items-center justify-between border-b border-gray-200 px-3 py-3">
             <span className="text-sm font-medium text-gray-700">
-              {t("filePreview.markdownOutline", { defaultValue: "目录" })}
+              {t('filePreview.markdownOutline', { defaultValue: '目录' })}
             </span>
             <Button
               type="text"
@@ -1147,20 +892,13 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
       <div className="flex min-w-0 flex-1 flex-col">
         {markdownHeadings.length > 0 && (
           <div className="border-b border-gray-200 px-4 py-2 md:hidden">
-            <Button
-              type="default"
-              size="small"
-              onClick={() => setShowMarkdownToc((prev) => !prev)}
-            >
-              {t("filePreview.markdownOutline", { defaultValue: "目录" })}
+            <Button type="default" size="small" onClick={() => setShowMarkdownToc(prev => !prev)}>
+              {t('filePreview.markdownOutline', { defaultValue: '目录' })}
             </Button>
           </div>
         )}
-        <div
-          ref={markdownContainerRef}
-          className="flex-1 overflow-auto px-6 pb-6 pt-0"
-        >
-          <MarkdownRenderer
+        <div ref={markdownContainerRef} className="flex-1 overflow-auto px-6 pb-6 pt-0">
+          <MarkdownRenderer 
             content={textContent}
             enableMultimodal={true}
             resolveS3Media={false}
@@ -1184,11 +922,9 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
           const el = e.currentTarget;
           if (
             !isLocalSource &&
-            el.scrollTop + el.clientHeight >=
-              el.scrollHeight - el.clientHeight * 0.5 &&
+            el.scrollTop + el.clientHeight >= el.scrollHeight - el.clientHeight * 0.5 &&
             !isFetchingRef.current &&
-            (totalBytesRef.current === null ||
-              byteOffsetRef.current < totalBytesRef.current)
+            (totalBytesRef.current === null || byteOffsetRef.current < totalBytesRef.current)
           ) {
             fetchNextTextChunk();
           }
@@ -1218,16 +954,14 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
     const columns = headerRow.map((col, i) => ({
       key: String(i),
       dataIndex: String(i),
-      title: col || `${t("filePreview.csv.column")} ${i + 1}`,
+      title: col || `${t('filePreview.csv.column')} ${i + 1}`,
       ellipsis: true,
       width: 160,
     }));
 
     const dataSource = dataRows.map((row, rowIdx) => {
       const record: Record<string, string> = { _key: String(rowIdx) };
-      headerRow.forEach((_, i) => {
-        record[String(i)] = row[i] ?? "";
-      });
+      headerRow.forEach((_, i) => { record[String(i)] = row[i] ?? ''; });
       return record;
     });
 
@@ -1260,14 +994,12 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
             const el = e.currentTarget as HTMLElement;
             if (
               !isLocalSource &&
-              el.scrollTop + el.clientHeight >=
-                el.scrollHeight - CSV_ROW_HEIGHT * 30 &&
+              el.scrollTop + el.clientHeight >= el.scrollHeight - CSV_ROW_HEIGHT * 30 &&
               !isFetchingRef.current &&
-              (totalBytesRef.current === null ||
-                byteOffsetRef.current < totalBytesRef.current)
+              (totalBytesRef.current === null || byteOffsetRef.current < totalBytesRef.current)
             ) {
-              fetchTextChunk(previewUrlRef.current).catch((err) =>
-                log.error("Failed to fetch next CSV chunk:", err)
+              fetchTextChunk(previewUrlRef.current).catch(err =>
+                log.error('Failed to fetch next CSV chunk:', err)
               );
             }
           }}
@@ -1275,9 +1007,7 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
         {loadingMore && (
           <div className="flex items-center justify-center py-3 border-t border-gray-100">
             <div className="animate-spin rounded-full h-5 w-5 border-b-2 border-blue-500 mr-2" />
-            <span className="text-sm text-gray-500">
-              {t("filePreview.loading")}
-            </span>
+            <span className="text-sm text-gray-500">{t('filePreview.loading')}</span>
           </div>
         )}
         <div ref={setupSentinelObserver} className="h-1" />
@@ -1293,11 +1023,9 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
           const el = e.currentTarget;
           if (
             !isLocalSource &&
-            el.scrollTop + el.clientHeight >=
-              el.scrollHeight - el.clientHeight * 0.5 &&
+            el.scrollTop + el.clientHeight >= el.scrollHeight - el.clientHeight * 0.5 &&
             !isFetchingRef.current &&
-            (totalBytesRef.current === null ||
-              byteOffsetRef.current < totalBytesRef.current)
+            (totalBytesRef.current === null || byteOffsetRef.current < totalBytesRef.current)
           ) {
             fetchNextTextChunk();
           }
@@ -1309,11 +1037,11 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
               key={index}
               className="m-0 whitespace-pre-wrap break-words"
               style={{
-                contentVisibility: "auto",
+                contentVisibility: 'auto',
                 containIntrinsicSize: `${Math.max(block.length, 1) * 24}px`,
               }}
             >
-              {block.join("\n") || "\u00A0"}
+              {block.join('\n') || '\u00A0'}
             </pre>
           ))}
         </div>
@@ -1328,29 +1056,25 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
 
   const renderTooLarge = () => (
     <div className="flex items-center justify-center h-full">
-      <p className="text-gray-500">{t("filePreview.tooLargeToPreview")}</p>
+      <p className="text-gray-500">{t('filePreview.tooLargeToPreview')}</p>
     </div>
   );
 
   const renderEmptyFile = () => (
     <div className="flex items-center justify-center h-full">
-      <p className="text-gray-500 text-sm">{t("filePreview.emptyFile")}</p>
+      <p className="text-gray-500 text-sm">{t('filePreview.emptyFile')}</p>
     </div>
   );
 
   const renderUnsupported = () => (
     <div className="flex items-center justify-center h-full">
-      <p className="text-gray-500 text-sm">
-        {t("filePreview.unsupportedSingleLine")}
-      </p>
+      <p className="text-gray-500 text-sm">{t('filePreview.unsupportedSingleLine')}</p>
     </div>
   );
 
   const renderUploadToPreview = () => (
     <div className="flex items-center justify-center h-full">
-      <p className="text-gray-500 text-sm">
-        {t("filePreview.uploadToPreview")}
-      </p>
+      <p className="text-gray-500 text-sm">{t('filePreview.uploadToPreview')}</p>
     </div>
   );
 
@@ -1361,19 +1085,19 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
     if (error) return renderError();
 
     switch (detectedFileType) {
-      case "pdf":
+      case 'pdf':
         return renderPdfViewer();
-      case "image":
+      case 'image':
         return renderImageViewer();
-      case "markdown":
+      case 'markdown':
         return renderMarkdownViewer();
-      case "csv":
+      case 'csv':
         return renderCsvViewer();
-      case "text":
+      case 'text':
         return renderTextViewer();
-      case "html":
+      case 'html':
         return renderHtmlViewer();
-      case "office":
+      case 'office':
         return renderUploadToPreview();
       default:
         return renderUnsupported();
@@ -1387,14 +1111,8 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
       placement="right"
       size="65%"
       styles={{
-        body: {
-          padding: 0,
-          height: "100%",
-          minHeight: 0,
-          display: "flex",
-          flexDirection: "column",
-        },
-        header: { padding: "12px 16px", borderBottom: "1px solid #e5e7eb" },
+        body: { padding: 0, height: '100%', minHeight: 0, display: 'flex', flexDirection: 'column' },
+        header: { padding: '12px 16px', borderBottom: '1px solid #e5e7eb' },
       }}
       closeIcon={<X size={20} />}
       title={
@@ -1415,12 +1133,14 @@ export function FilePreviewDrawer(props: Readonly<FilePreviewProps>) {
           icon={<Download size={14} />}
           onClick={handleDownload}
         >
-          {t("filePreview.download")}
+          {t('filePreview.download')}
         </Button>
       }
     >
       <div className="flex h-full flex-col">
-        <div className="flex-1 min-h-0 overflow-hidden">{renderContent()}</div>
+        <div className="flex-1 min-h-0 overflow-hidden">
+        {renderContent()}
+        </div>
       </div>
     </Drawer>
   );
diff --git a/frontend/components/common/markdownRenderer.tsx b/frontend/components/ui/markdownRenderer.tsx
similarity index 99%
rename from frontend/components/common/markdownRenderer.tsx
rename to frontend/components/ui/markdownRenderer.tsx
index 93dbcce11..53dfb6962 100644
--- a/frontend/components/common/markdownRenderer.tsx
+++ b/frontend/components/ui/markdownRenderer.tsx
@@ -16,8 +16,8 @@ import { visit } from "unist-util-visit";
 import { SearchResult } from "@/types/chat";
 import { resolveS3UrlToDataUrl } from "@/services/storageService";
 import { Tooltip, TooltipProvider } from "@/components/ui/tooltip";
-import { CopyButton } from "@/components/common/copyButton";
-import { Diagram } from "@/components/common/Diagram";
+import { CopyButton } from "@/components/ui/copyButton";
+import { Diagram } from "@/components/ui/Diagram";
 
 interface MarkdownRendererProps {
   content: string;
diff --git a/frontend/components/common/tokenUsageIndicator.tsx b/frontend/components/ui/tokenUsageIndicator.tsx
similarity index 98%
rename from frontend/components/common/tokenUsageIndicator.tsx
rename to frontend/components/ui/tokenUsageIndicator.tsx
index adde20fbf..826787e2b 100644
--- a/frontend/components/common/tokenUsageIndicator.tsx
+++ b/frontend/components/ui/tokenUsageIndicator.tsx
@@ -1,8 +1,8 @@
 "use client";
 
 import React from "react";
+import { Tooltip } from "@/components/ui/tooltip";
 import { TokenMetrics } from "@/types/chat";
-import { Tooltip } from "antd"
 
 interface TokenUsageIndicatorProps {
   latestMetrics: TokenMetrics | null;
diff --git a/frontend/const/agentConfig.ts b/frontend/const/agentConfig.ts
index 4c8b96a7f..aed7b6404 100644
--- a/frontend/const/agentConfig.ts
+++ b/frontend/const/agentConfig.ts
@@ -53,8 +53,6 @@ export const GENERATE_PROMPT_STREAM_TYPES = {
   AGENT_VAR_NAME: "agent_var_name",
   AGENT_DESCRIPTION: "agent_description",
   AGENT_DISPLAY_NAME: "agent_display_name",
-  GREETING_MESSAGE: "greeting_message",
-  EXAMPLE_QUESTIONS: "example_questions",
 } as const;
 
 export const TOOL_PARAM_TYPES = {
diff --git a/frontend/const/chatConfig.ts b/frontend/const/chatConfig.ts
index c206fa752..27b3b887d 100644
--- a/frontend/const/chatConfig.ts
+++ b/frontend/const/chatConfig.ts
@@ -117,11 +117,9 @@ messageTypes: {
   STEP_COUNT: "step_count" as const,
   TOKEN_COUNT: "token_count" as const,
   MAX_STEPS_REACHED: "max_steps_reached" as const,
-  VERIFICATION: "verification" as const,
   SEARCH_CONTENT_PLACEHOLDER: "search_content_placeholder" as const,
   VIRTUAL: "virtual" as const,
   PREPROCESS: "preprocess" as const,
-  SKILL_FILES: "skill_files" as const,
 },
 
 // Content type constants for last content type tracking
@@ -135,7 +133,6 @@ contentTypes: {
   SEARCH_CONTENT: "search_content" as const,
   CARD: "card" as const,
   MEMORY_SEARCH: "memory_search" as const,
-  VERIFICATION: "verification" as const,
   PREPROCESS: "preprocess" as const,
 },
 
diff --git a/frontend/hooks/agent/useAgentGeneration.ts b/frontend/hooks/agent/useAgentGeneration.ts
index cfd350e91..4ffa31adb 100644
--- a/frontend/hooks/agent/useAgentGeneration.ts
+++ b/frontend/hooks/agent/useAgentGeneration.ts
@@ -151,16 +151,11 @@ export function useAgentGeneration({
               }
               break;
             case GENERATE_PROMPT_STREAM_TYPES.AGENT_DISPLAY_NAME:
+              // Only save to cache if user hasn't filled in agent display name themselves
               if (!editedAgent.display_name) {
                 saveGeneratedField(generationAgentId, 'agentDisplayName', data.content);
               }
               break;
-            case GENERATE_PROMPT_STREAM_TYPES.GREETING_MESSAGE:
-              saveGeneratedField(generationAgentId, 'greetingMessage', data.content);
-              break;
-            case GENERATE_PROMPT_STREAM_TYPES.EXAMPLE_QUESTIONS:
-              saveGeneratedField(generationAgentId, 'exampleQuestions', data.content);
-              break;
           }
         },
         (error) => {
@@ -216,12 +211,6 @@ export function useAgentGeneration({
             duty_prompt: cached?.dutyPrompt || editedAgent.duty_prompt || "",
             constraint_prompt: cached?.constraintPrompt || editedAgent.constraint_prompt || "",
             few_shots_prompt: cached?.fewShotsPrompt || editedAgent.few_shots_prompt || "",
-            greeting_message: cached?.greetingMessage || editedAgent.greeting_message || "",
-            example_questions: cached?.exampleQuestions
-              ? (typeof cached.exampleQuestions === "string"
-                ? (() => { try { return JSON.parse(cached.exampleQuestions); } catch { return []; } })()
-                : cached.exampleQuestions)
-              : editedAgent.example_questions || [],
           };
           // Update agent config in store
           updateAgentConfig(configUpdates);
diff --git a/frontend/hooks/agent/useSaveGuard.ts b/frontend/hooks/agent/useSaveGuard.ts
index 2f644e0bc..6d948deff 100644
--- a/frontend/hooks/agent/useSaveGuard.ts
+++ b/frontend/hooks/agent/useSaveGuard.ts
@@ -135,7 +135,6 @@ export const useSaveGuard = () => {
         model_id: currentEditedAgent.model_id ?? undefined,
         max_steps: currentEditedAgent.max_step,
         provide_run_summary: currentEditedAgent.provide_run_summary,
-        verification_config: currentEditedAgent.verification_config,
         enabled: true,
         business_description: currentEditedAgent.business_description,
         duty_prompt: currentEditedAgent.duty_prompt,
@@ -150,8 +149,6 @@ export const useSaveGuard = () => {
         related_agent_ids: relatedAgentIds,
         related_external_agent_ids: relatedExternalAgentIds,
         ingroup_permission: currentEditedAgent.ingroup_permission ?? "READ_ONLY",
-        greeting_message: currentEditedAgent.greeting_message,
-        example_questions: currentEditedAgent.example_questions,
       });
 
       if (result.success) {
diff --git a/frontend/hooks/auth/useAuthenticationState.ts b/frontend/hooks/auth/useAuthenticationState.ts
index 402b5c717..3f8923ca7 100644
--- a/frontend/hooks/auth/useAuthenticationState.ts
+++ b/frontend/hooks/auth/useAuthenticationState.ts
@@ -1,20 +1,13 @@
 "use client";
 
-import { useState, useEffect, useCallback, useRef } from "react";
+import { useState, useEffect, useCallback } from "react";
 import { useTranslation } from "react-i18next";
 import { App } from "antd";
 
 import { useDeployment } from "@/components/providers/deploymentProvider";
 import { useQueryClient } from "@tanstack/react-query";
 import { authService } from "@/services/authService";
-import { casService } from "@/services/casService";
-import {
-  getSessionFromStorage,
-  removeSessionFromStorage,
-  checkSessionValid,
-  getTokenExpiresAt,
-} from "@/lib/session";
-import { authFlowState } from "@/lib/authFlow";
+import { getSessionFromStorage, removeSessionFromStorage, checkSessionValid, hasAuthCookies } from "@/lib/session";
 import { Session, AuthenticationStateReturn } from "@/types/auth";
 import { STATUS_CODES } from "@/const/auth";
 import { authEventUtils } from "@/lib/authEvents";
@@ -37,7 +30,6 @@ export function useAuthenticationState(): AuthenticationStateReturn {
   const [session, setSession] = useState<Session | null>(null);
   const [authServiceUnavailable, setAuthServiceUnavailable] =
     useState<boolean>(false);
-  const isCasLoginInProgressRef = useRef(false);
 
   // Speed mode: skip authentication checks, consider user as authenticated
   useEffect(() => {
@@ -59,68 +51,6 @@ export function useAuthenticationState(): AuthenticationStateReturn {
     setIsAuthChecking(false);
   }, [isSpeedMode]);
 
-  useEffect(() => {
-    if (isSpeedMode || isAuthChecking || isAuthenticated) return;
-    if (isCasLoginInProgressRef.current) return;
-    if (authFlowState.isExplicitLogoutInProgress()) return;
-    if (typeof window === "undefined") return;
-
-    const pathname = window.location.pathname;
-    if (pathname.includes("/oauth/complete")) return;
-
-    let cancelled = false;
-    casService.getConfig().then((config) => {
-      if (
-        cancelled ||
-        isCasLoginInProgressRef.current ||
-        authFlowState.isExplicitLogoutInProgress() ||
-        !config.enabled ||
-        config.login_mode !== "force"
-      ) {
-        return;
-      }
-
-      isCasLoginInProgressRef.current = true;
-      casService.startLogin();
-    });
-
-    return () => {
-      cancelled = true;
-    };
-  }, [isSpeedMode, isAuthChecking, isAuthenticated]);
-
-  useEffect(() => {
-    if (isSpeedMode || !isAuthenticated) return;
-
-    let timeoutId: ReturnType<typeof setTimeout> | null = null;
-    let cancelled = false;
-
-    casService.getConfig().then((config) => {
-      if (cancelled || !config.enabled || config.login_mode === "disabled")
-        return;
-      const expiresAt = getTokenExpiresAt();
-      if (!expiresAt) return;
-
-      const renewAtMs = expiresAt * 1000 - config.renew_before_seconds * 1000;
-      const delayMs = Math.max(0, renewAtMs - Date.now());
-      timeoutId = setTimeout(async () => {
-        const ok = await casService.renewInIframe(config.renew_timeout_seconds);
-        if (!ok || cancelled) return;
-        const renewedSession = getSessionFromStorage();
-        if (renewedSession) {
-          setSession(renewedSession);
-          setIsAuthenticated(true);
-          authEventUtils.emitTokenRefreshed();
-        }
-      }, delayMs);
-    });
-
-    return () => {
-      cancelled = true;
-      if (timeoutId) clearTimeout(timeoutId);
-    };
-  }, [isAuthenticated, session?.expires_at, isSpeedMode]);
-
   const clearLocalSession = useCallback(() => {
     removeSessionFromStorage();
     setSession(null);
@@ -184,7 +114,11 @@ export function useAuthenticationState(): AuthenticationStateReturn {
 
   // Register method
   const register = useCallback(
-    async (email: string, password: string, inviteCode?: string) => {
+    async (
+      email: string,
+      password: string,
+      inviteCode?: string
+    ) => {
       setIsLoading(true);
 
       try {
@@ -223,44 +157,47 @@ export function useAuthenticationState(): AuthenticationStateReturn {
   );
 
   // Logout method
-  const logout = useCallback(async (options: { silent?: boolean } = {}) => {
-    const { silent = false } = options;
+  const logout = useCallback(
+    async (options: { silent?: boolean } = {}) => {
+      const { silent = false } = options;
 
-    try {
-      setIsLoading(true);
+      try {
+        setIsLoading(true);
 
-      if (!silent) {
-        // Call logout API
-        await authService.signOut();
-      }
+        if (!silent) {
+          // Call logout API
+          await authService.signOut();
+        }
 
-      // Clear local session
-      removeSessionFromStorage();
-      setSession(null);
-      setIsAuthenticated(false);
+        // Clear local session
+        removeSessionFromStorage();
+        setSession(null);
+        setIsAuthenticated(false);
 
-      queryClient.clear();
-      if (!silent) {
-        message.success(t("auth.logoutSuccess"));
-      }
+        queryClient.clear();
+        if (!silent) {
+          message.success(t("auth.logoutSuccess"));
+        }
 
-      // Emit logout event
-      authEventUtils.emitLogout();
-    } catch (error: any) {
-      log.error("Logout failed:", error?.message || error);
-      // Even if API call fails, clear local session
-      removeSessionFromStorage();
-      setSession(null);
-      setIsAuthenticated(false);
+        // Emit logout event
+        authEventUtils.emitLogout();
+      } catch (error: any) {
+        log.error("Logout failed:", error?.message || error);
+        // Even if API call fails, clear local session
+        removeSessionFromStorage();
+        setSession(null);
+        setIsAuthenticated(false);
 
-      queryClient.clear();
-      if (!silent) {
-        message.error(t("auth.logoutFailed"));
+        queryClient.clear();
+        if (!silent) {
+          message.error(t("auth.logoutFailed"));
+        }
+      } finally {
+        setIsLoading(false);
       }
-    } finally {
-      setIsLoading(false);
-    }
-  }, []);
+    },
+    []
+  );
 
   // Revoke method
   const revoke = useCallback(async () => {
@@ -296,6 +233,6 @@ export function useAuthenticationState(): AuthenticationStateReturn {
     register,
     logout,
     clearLocalSession,
-    revoke,
+    revoke
   };
 }
diff --git a/frontend/hooks/auth/useAuthenticationUI.ts b/frontend/hooks/auth/useAuthenticationUI.ts
index 748d6d359..2b42641da 100644
--- a/frontend/hooks/auth/useAuthenticationUI.ts
+++ b/frontend/hooks/auth/useAuthenticationUI.ts
@@ -1,6 +1,6 @@
 "use client";
 
-import { useState, useCallback, useEffect, useRef } from "react";
+import { useState, useCallback, useEffect } from "react";
 import { useRouter, usePathname, useSearchParams } from "next/navigation";
 import { App } from "antd";
 import { useTranslation } from "react-i18next";
@@ -9,8 +9,6 @@ import { useDeployment } from "@/components/providers/deploymentProvider";
 import { AUTH_EVENTS } from "@/const/auth";
 import { getEffectiveRoutePath } from "@/lib/auth";
 import { authEvents, authEventUtils } from "@/lib/authEvents";
-import { authFlowState } from "@/lib/authFlow";
-import { casService } from "@/services/casService";
 import { AuthenticationUIReturn, RegisterModalOptions } from "@/types/auth";
 
 /**
@@ -35,7 +33,6 @@ export function useAuthenticationUI({
   const { message } = App.useApp();
   const effectivePath = pathname ? getEffectiveRoutePath(pathname) : "/";
   const isOAuthCompletePage = effectivePath === "/oauth/complete";
-  const isRedirectingToCasRef = useRef(false);
 
   // UI state for modals - managed locally within the hook
   const [isLoginModalOpen, setIsLoginModalOpen] = useState(false);
@@ -43,12 +40,12 @@ export function useAuthenticationUI({
   const [registerModalOptions, setRegisterModalOptions] =
     useState<RegisterModalOptions | null>(null);
   const [isAuthPromptModalOpen, setIsAuthPromptModalOpen] = useState(false);
-  const [isSessionExpiredModalOpen, setIsSessionExpiredModalOpen] =
-    useState(false);
+  const [isSessionExpiredModalOpen, setIsSessionExpiredModalOpen] = useState(false);
 
-  const handleUnauthenticatedModalClose = () => {
+  const handleUnauthenticatedModalClose = (() => {
     // Only emit back to home event and redirect if user is not authenticated
     if (!isAuthenticated && !isSpeedMode) {
+        
       // Emit event to notify SideNavigation to reset selected key
       authEventUtils.emitBackToHome();
       // Redirect to home page if not already there
@@ -56,7 +53,7 @@ export function useAuthenticationUI({
         router.push("/");
       }
     }
-  };
+  });
 
   // Modal control functions
   const openLoginModal = useCallback(() => setIsLoginModalOpen(true), []);
@@ -77,37 +74,14 @@ export function useAuthenticationUI({
     handleUnauthenticatedModalClose();
   }, [handleUnauthenticatedModalClose]);
 
-  const redirectToCasIfForced = useCallback(
-    async (redirect?: string): Promise<boolean> => {
-      if (isRedirectingToCasRef.current) return true;
-      if (authFlowState.isExplicitLogoutInProgress()) return true;
-
-      const config = await casService.getConfig();
-      if (authFlowState.isExplicitLogoutInProgress()) return true;
-      if (!config.enabled || config.login_mode !== "force") return false;
-
-      isRedirectingToCasRef.current = true;
-      casService.startLogin(redirect);
-      return true;
-    },
-    []
-  );
-
-  const openAuthPromptModal = useCallback(() => {
-    redirectToCasIfForced(effectivePath).then((redirected) => {
-      if (!redirected) setIsAuthPromptModalOpen(true);
-    });
-  }, [effectivePath, redirectToCasIfForced]);
+  const openAuthPromptModal = useCallback(() => setIsAuthPromptModalOpen(true), []);
 
   const closeAuthPromptModal = useCallback(() => {
     setIsAuthPromptModalOpen(false);
     handleUnauthenticatedModalClose();
   }, [handleUnauthenticatedModalClose]);
 
-  const openSessionExpiredModal = useCallback(
-    () => setIsSessionExpiredModalOpen(true),
-    []
-  );
+  const openSessionExpiredModal = useCallback(() => setIsSessionExpiredModalOpen(true), []);
 
   const closeSessionExpiredModal = useCallback(() => {
     clearLocalSession();
@@ -131,15 +105,13 @@ export function useAuthenticationUI({
     if (isSpeedMode) return;
 
     const handleSessionExpired = () => {
-      // Prevent showing session expired modal when login/register modal is already open.
-      // This avoids race conditions while the user is filling in an auth form.
+      // Prevent showing session expired modal when login/register modal is already open
+      // This avoids race conditions when mousemove events trigger session checks
+      // while the user is already filling in the login form
       if (isLoginModalOpen || isRegisterModalOpen) {
         return;
       }
-
-      redirectToCasIfForced(effectivePath).then((redirected) => {
-        if (!redirected) setIsSessionExpiredModalOpen(true);
-      });
+      setIsSessionExpiredModalOpen(true);
     };
 
     const handleRegisterSuccess = () => {
@@ -162,13 +134,7 @@ export function useAuthenticationUI({
       cleanup();
       cleanupRegister();
     };
-  }, [
-    effectivePath,
-    isSpeedMode,
-    redirectToCasIfForced,
-    isLoginModalOpen,
-    isRegisterModalOpen,
-  ]);
+  }, [isSpeedMode, isLoginModalOpen, isRegisterModalOpen]);
 
   // Auto-open login modal when returning from a failed OAuth redirect
   useEffect(() => {
@@ -188,17 +154,7 @@ export function useAuthenticationUI({
     if (oauthError && !isLoginModalOpen) {
       setIsLoginModalOpen(true);
     }
-  }, [
-    searchParams,
-    isAuthChecking,
-    isAuthenticated,
-    isSpeedMode,
-    isLoginModalOpen,
-    router,
-    isOAuthCompletePage,
-    message,
-    getOAuthErrorMessage,
-  ]);
+  }, [searchParams, isAuthChecking, isAuthenticated, isSpeedMode, isLoginModalOpen, router, isOAuthCompletePage, message, getOAuthErrorMessage]);
 
   useEffect(() => {
     if (!isOAuthCompletePage) return;
@@ -219,28 +175,9 @@ export function useAuthenticationUI({
     if (isSessionExpiredModalOpen) return;
     if (isLoginModalOpen) return;
     if (isRegisterModalOpen) return;
-    let cancelled = false;
+    openAuthPromptModal();
+  }, [pathname, isAuthenticated, isSpeedMode, isAuthChecking, isSessionExpiredModalOpen, openAuthPromptModal, isOAuthCompletePage]);
 
-    redirectToCasIfForced(effectivePath).then((redirected) => {
-      if (!cancelled && !redirected) {
-        setIsAuthPromptModalOpen(true);
-      }
-    });
-
-    return () => {
-      cancelled = true;
-    };
-  }, [
-    effectivePath,
-    isAuthenticated,
-    isSpeedMode,
-    isAuthChecking,
-    isSessionExpiredModalOpen,
-    isLoginModalOpen,
-    isRegisterModalOpen,
-    isOAuthCompletePage,
-    redirectToCasIfForced,
-  ]);
 
   return {
     // Login/Register Modal
diff --git a/frontend/lib/agentGenerationCache.ts b/frontend/lib/agentGenerationCache.ts
index d8dbfb045..6799f3d2f 100644
--- a/frontend/lib/agentGenerationCache.ts
+++ b/frontend/lib/agentGenerationCache.ts
@@ -30,10 +30,6 @@ export interface AgentGenerationCache {
   agentDisplayName: string;
   /** Generated agent description */
   agentDescription: string;
-  /** Generated greeting message */
-  greetingMessage: string;
-  /** Generated example questions */
-  exampleQuestions: string;
 }
 
 /**
@@ -50,8 +46,6 @@ const DEFAULT_CACHE: AgentGenerationCache = {
   agentName: "",
   agentDisplayName: "",
   agentDescription: "",
-  greetingMessage: "",
-  exampleQuestions: "",
 };
 
 /**
@@ -179,7 +173,7 @@ export function setAgentGenerationStatus(
 export function saveGeneratedField<
   K extends keyof Pick<
     AgentGenerationCache,
-    'dutyPrompt' | 'constraintPrompt' | 'fewShotsPrompt' | 'agentName' | 'agentDisplayName' | 'agentDescription' | 'greetingMessage' | 'exampleQuestions'
+    'dutyPrompt' | 'constraintPrompt' | 'fewShotsPrompt' | 'agentName' | 'agentDisplayName' | 'agentDescription'
   >
 >(
   agentId: number,
diff --git a/frontend/lib/auth.ts b/frontend/lib/auth.ts
index 330028bc3..7c6cafa11 100644
--- a/frontend/lib/auth.ts
+++ b/frontend/lib/auth.ts
@@ -15,7 +15,6 @@ import {
   hasAuthCookies,
   handleSessionExpired,
 } from "@/lib/session";
-import { authFlowState } from "@/lib/authFlow";
 
 /**
  * Role color mapping - Ant Design color presets
@@ -50,11 +49,7 @@ export function generateAvatarUrl(email: string): string {
 export const fetchWithAuth = async (url: string, options: RequestInit = {}) => {
   // Frontend pre-check: detect session expiry without hitting backend
   if (typeof window !== "undefined") {
-    if (
-      !authFlowState.isExplicitLogoutInProgress() &&
-      hasAuthCookies() &&
-      !checkSessionValid()
-    ) {
+    if (hasAuthCookies() && !checkSessionValid()) {
       handleSessionExpired();
       throw new ApiError(
         STATUS_CODES.TOKEN_EXPIRED,
diff --git a/frontend/lib/authFlow.ts b/frontend/lib/authFlow.ts
deleted file mode 100644
index 329157120..000000000
--- a/frontend/lib/authFlow.ts
+++ /dev/null
@@ -1,13 +0,0 @@
-let explicitLogoutInProgress = false;
-
-export const authFlowState = {
-  beginExplicitLogout: (): void => {
-    explicitLogoutInProgress = true;
-  },
-
-  endExplicitLogout: (): void => {
-    explicitLogoutInProgress = false;
-  },
-
-  isExplicitLogoutInProgress: (): boolean => explicitLogoutInProgress,
-};
diff --git a/frontend/lib/chat/chatMessageExtractor.ts b/frontend/lib/chat/chatMessageExtractor.ts
new file mode 100644
index 000000000..f7d172be4
--- /dev/null
+++ b/frontend/lib/chat/chatMessageExtractor.ts
@@ -0,0 +1,292 @@
+import { chatConfig, MESSAGE_ROLES } from "@/const/chatConfig";
+import {
+  ApiMessage,
+  SearchResult,
+  AgentStep,
+  ApiMessageItem,
+  ChatMessageType,
+  MinioFileItem,
+} from "@/types/chat";
+import log from "@/lib/logger";
+
+// Swap content that is exactly "<user_break>" for its localized text from t(); anything else passes through.
+const processSpecialTag = (content: string, t: any): string => {
+  if (!content || typeof content !== "string") {
+    return content; // empty or non-string input is returned untouched
+  }
+
+  if (content === "<user_break>") { // strict equality: both operands are strings at this point
+    return t("chatStreamHandler.userInterrupted");
+  }
+
+  return content;
+};
+
+export function extractAssistantMsgFromResponse(
+  dialog_msg: ApiMessage,
+  index: number,
+  create_time: number,
+  t: any
+) { // Builds an assistant ChatMessageType (steps, final answer, search results, images) from one dialog record.
+  let searchResultsContent: SearchResult[] = []; // copy of dialog_msg.search with fallbacks for missing fields
+  if (
+    dialog_msg.search &&
+    Array.isArray(dialog_msg.search) &&
+    dialog_msg.search.length > 0
+  ) {
+    searchResultsContent = dialog_msg.search.map((item) => ({
+      title: item.title || t("extractMsg.unknownTitle"),
+      url: item.url || "#",
+      text: item.text || t("extractMsg.noContentDescription"),
+      published_date: item.published_date || "",
+      source_type: item.source_type || "",
+      filename: item.filename || "",
+      score: typeof item.score === "number" ? item.score : undefined,
+      score_details: item.score_details || {},
+      tool_sign: item.tool_sign || "",
+      cite_index: typeof item.cite_index === "number" ? item.cite_index : -1,
+    }));
+  }
+
+  // Images: dialog_msg.picture is passed through as-is when it is a non-empty array
+  let imagesContent: string[] = [];
+  if (
+    dialog_msg.picture &&
+    Array.isArray(dialog_msg.picture) &&
+    dialog_msg.picture.length > 0
+  ) {
+    imagesContent = dialog_msg.picture;
+  }
+
+  // Walk the message items in order: STEP_COUNT opens a new step, most other items attach to the newest step
+  let finalAnswer = "";
+  let steps: AgentStep[] = [];
+  if (dialog_msg.message && Array.isArray(dialog_msg.message)) {
+    dialog_msg.message.forEach((msg: ApiMessageItem) => {
+      switch (msg.type) {
+        case chatConfig.messageTypes.FINAL_ANSWER: {
+          finalAnswer += processSpecialTag(msg.content, t); // concatenated across all FINAL_ANSWER items
+          break;
+        }
+
+        case chatConfig.messageTypes.STEP_COUNT: {
+          steps.push({
+            id: `step-${steps.length + 1}`,
+            title: msg.content.trim(),
+            content: "",
+            expanded: false,
+            contents: [],
+            metrics: null,
+            thinking: { content: "", expanded: false },
+            code: { content: "", expanded: false },
+            output: { content: "", expanded: false },
+          });
+          break;
+        }
+
+        case chatConfig.messageTypes.MODEL_OUTPUT_THINKING: {
+          const currentStep = steps[steps.length - 1]; // undefined when no STEP_COUNT item came first
+          if (currentStep) { // without an open step the item is dropped
+            const contentId = `model-${Date.now()}-${Math.random()
+              .toString(36)
+              .substring(2, 7)}`;
+            currentStep.contents.push({
+              id: contentId,
+              type: "model_output",
+              subType: "thinking",
+              content: msg.content,
+              expanded: true,
+              timestamp: Date.now(),
+            });
+          }
+          break;
+        }
+
+        case chatConfig.messageTypes.EXECUTION_LOGS: {
+          const currentStep = steps[steps.length - 1];
+          if (currentStep) {
+            const contentId = `execution-${Date.now()}-${Math.random()
+              .toString(36)
+              .substring(2, 7)}`;
+            currentStep.contents.push({
+              id: contentId,
+              type: "execution",
+              content: msg.content,
+              expanded: true,
+              timestamp: Date.now(),
+            });
+          }
+          break;
+        }
+
+        case chatConfig.messageTypes.ERROR: {
+          const currentStep = steps[steps.length - 1];
+          if (currentStep) {
+            const contentId = `error-${Date.now()}-${Math.random()
+              .toString(36)
+              .substring(2, 7)}`;
+            currentStep.contents.push({
+              id: contentId,
+              type: "error",
+              content: msg.content,
+              expanded: true,
+              timestamp: Date.now(),
+            });
+          }
+          break;
+        }
+
+        case chatConfig.messageTypes.SEARCH_CONTENT_PLACEHOLDER: {
+          const currentStep = steps[steps.length - 1];
+          if (currentStep) {
+            try {
+              const placeholderData = JSON.parse(msg.content); // content is JSON carrying a unit_id
+              const unitId = placeholderData.unit_id;
+
+              if (
+                unitId &&
+                dialog_msg.search_unit_id &&
+                dialog_msg.search_unit_id[unitId.toString()]
+              ) {
+                const unitSearchResults =
+                  dialog_msg.search_unit_id[unitId.toString()];
+                const searchContent = JSON.stringify(unitSearchResults); // stored on the step as a JSON string
+
+                const contentId = `search-content-${Date.now()}-${Math.random()
+                  .toString(36)
+                  .substring(2, 7)}`;
+                currentStep.contents.push({
+                  id: contentId,
+                  type: "search_content",
+                  content: searchContent,
+                  expanded: true,
+                  timestamp: Date.now(),
+                });
+              }
+            } catch (e) {
+              log.error(t("extractMsg.cannotParseSearchPlaceholder"), e); // a bad placeholder is logged and skipped
+            }
+          }
+          break;
+        }
+
+        case chatConfig.messageTypes.TOKEN_COUNT: {
+          const currentStep = steps[steps.length - 1];
+          if (currentStep) {
+            try {
+              currentStep.metrics = JSON.parse(msg.content);
+            } catch {
+              currentStep.metrics = null; // unparseable metrics are treated as absent
+            }
+          }
+          break;
+        }
+
+        case chatConfig.messageTypes.CARD: {
+          const currentStep = steps[steps.length - 1];
+          if (currentStep) {
+            const contentId = `card-${Date.now()}-${Math.random()
+              .toString(36)
+              .substring(2, 7)}`;
+            currentStep.contents.push({
+              id: contentId,
+              type: "card",
+              content: msg.content,
+              expanded: true,
+              timestamp: Date.now(),
+            });
+          }
+          break;
+        }
+
+        case chatConfig.messageTypes.TOOL: {
+          const currentStep = steps[steps.length - 1];
+          if (currentStep) {
+            const contentId = `tool-${Date.now()}-${Math.random()
+              .toString(36)
+              .substring(2, 7)}`;
+            currentStep.contents.push({
+              id: contentId,
+              type: "executing", // reuse the existing "executing" content type to represent a tool call
+              content: msg.content,
+              expanded: true,
+              timestamp: Date.now(),
+            });
+          }
+          break;
+        }
+
+        default: // every other message type is ignored
+          break;
+      }
+    });
+  }
+
+  const formattedAssistantMsg: ChatMessageType = {
+    id: `assistant-${index}-${Date.now()}`,
+    role: MESSAGE_ROLES.ASSISTANT,
+    message_id: dialog_msg.message_id,
+    content: "",
+    opinion_flag: dialog_msg.opinion_flag,
+    timestamp: new Date(create_time),
+    steps: steps,
+    finalAnswer: finalAnswer,
+    agentRun: "",
+    isComplete: true,
+    showRawContent: false,
+    searchResults: searchResultsContent,
+    images: imagesContent,
+    attachments: undefined,
+  };
+  return formattedAssistantMsg;
+}
+
+// Build a ChatMessageType with the USER role from one dialog record.
+export function extractUserMsgFromResponse(
+  dialog_msg: ApiMessage,
+  index: number,
+  create_time: number
+) {
+  // The payload may be an item list, a bare string, or a single object;
+  // pull the user's text out of whichever shape arrived.
+  const payload = dialog_msg.message;
+  let text = "";
+  if (Array.isArray(payload)) {
+    const textItem = payload.find(
+      (m: { type: string; content: string }) => m.type === "string"
+    );
+    text = textItem?.content || "";
+  } else if (typeof payload === "string") {
+    text = payload;
+  } else if (payload && typeof payload === "object") {
+    text = (payload as { content?: string }).content || "";
+  }
+
+  // Copy uploaded-file entries, defaulting type, name and size when they are falsy.
+  const files = dialog_msg.minio_files;
+  let attachments: MinioFileItem[] = [];
+  if (files && Array.isArray(files) && files.length > 0) {
+    attachments = files.map((file) => ({
+      type: file.type || "",
+      name: file.name || "",
+      size: file.size || 0,
+      object_name: file.object_name,
+      url: file.url,
+      description: file.description,
+    }));
+  }
+
+  // An empty attachment list is reported as undefined rather than [].
+  const userMessage: ChatMessageType = {
+    id: `user-${index}-${Date.now()}`,
+    role: MESSAGE_ROLES.USER,
+    message_id: dialog_msg.message_id,
+    content: text,
+    opinion_flag: dialog_msg.opinion_flag,
+    timestamp: new Date(create_time),
+    showRawContent: true,
+    isComplete: true,
+    attachments: attachments.length > 0 ? attachments : undefined,
+  };
+  return userMessage;
+}
diff --git a/frontend/lib/chatMessageExtractor.ts b/frontend/lib/chatMessageExtractor.ts
index eb0f79aec..08f73de82 100644
--- a/frontend/lib/chatMessageExtractor.ts
+++ b/frontend/lib/chatMessageExtractor.ts
@@ -22,40 +22,6 @@ const processSpecialTag = (content: string, t: any): string => {
   return content;
 };
 
-const createAgentStep = (
-  id: string,
-  title: string,
-  expanded = false
-): AgentStep => ({
-  id,
-  title,
-  content: "",
-  expanded,
-  contents: [],
-  metrics: null,
-  thinking: { content: "", expanded },
-  code: { content: "", expanded },
-  output: { content: "", expanded },
-});
-
-const getOrCreateCurrentStep = (
-  steps: AgentStep[],
-  fallbackTitle: string
-): AgentStep => {
-  const currentStep = steps[steps.length - 1];
-  if (currentStep) {
-    return currentStep;
-  }
-
-  const recoveredStep = createAgentStep(
-    `step-history-${Date.now()}-${Math.random().toString(36).substring(2, 9)}`,
-    fallbackTitle,
-    true
-  );
-  steps.push(recoveredStep);
-  return recoveredStep;
-};
-
 export function extractAssistantMsgFromResponse(
   dialog_msg: ApiMessage,
   index: number,
@@ -104,9 +70,17 @@ export function extractAssistantMsgFromResponse(
         }
 
         case chatConfig.messageTypes.STEP_COUNT: {
-          steps.push(
-            createAgentStep(`step-${steps.length + 1}`, msg.content.trim())
-          );
+          steps.push({
+            id: `step-${steps.length + 1}`,
+            title: msg.content.trim(),
+            content: "",
+            expanded: false,
+            contents: [],
+            metrics: null,
+            thinking: { content: "", expanded: false },
+            code: { content: "", expanded: false },
+            output: { content: "", expanded: false },
+          });
           break;
         }
 
@@ -242,22 +216,6 @@ export function extractAssistantMsgFromResponse(
           break;
         }
 
-        case chatConfig.messageTypes.VERIFICATION: {
-          const currentStep = getOrCreateCurrentStep(steps, "Verification");
-          const contentId = `verification-${Date.now()}-${Math.random()
-            .toString(36)
-            .substring(2, 7)}`;
-          currentStep.contents.push({
-            id: contentId,
-            type: chatConfig.messageTypes.VERIFICATION,
-            subType: "verification",
-            content: msg.content,
-            expanded: true,
-            timestamp: Date.now(),
-          });
-          break;
-        }
-
         case chatConfig.messageTypes.MAX_STEPS_REACHED: {
           // Parse the max steps reached event data for historical messages
           try {
@@ -292,24 +250,6 @@ export function extractAssistantMsgFromResponse(
     });
   }
 
-  let assistantAttachments: MinioFileItem[] = [];
-  if (
-    dialog_msg.minio_files &&
-    Array.isArray(dialog_msg.minio_files) &&
-    dialog_msg.minio_files.length > 0
-  ) {
-    assistantAttachments = dialog_msg.minio_files.map((item) => {
-      return {
-        type: item.type || "",
-        name: item.name || "",
-        size: item.size || 0,
-        object_name: item.object_name,
-        url: item.url,
-        description: item.description,
-      };
-    });
-  }
-
   const formattedAssistantMsg: ChatMessageType = {
     id: `assistant-${index}-${Date.now()}`,
     role: MESSAGE_ROLES.ASSISTANT,
@@ -324,7 +264,7 @@ export function extractAssistantMsgFromResponse(
     showRawContent: false,
     searchResults: searchResultsContent,
     images: imagesContent,
-    attachments: assistantAttachments.length > 0 ? assistantAttachments : undefined,
+    attachments: undefined,
   };
   return formattedAssistantMsg;
 }
@@ -360,7 +300,7 @@ export function extractUserMsgFromResponse(
         size: item.size || 0,
         object_name: item.object_name,
         url: item.url,
-        presigned_url: item.presigned_url, // Preserve presigned_url for MCP tool access
+        presigned_url: item.presigned_url,  // Preserve presigned_url for MCP tool access
         description: item.description,
       };
     });
diff --git a/frontend/lib/filePreviewUtils.ts b/frontend/lib/filePreviewUtils.ts
index 929f01446..0126241bf 100644
--- a/frontend/lib/filePreviewUtils.ts
+++ b/frontend/lib/filePreviewUtils.ts
@@ -353,43 +353,3 @@ export function getPageWrapperStyle(
 
   return { minHeight: placeholderHeight, width: placeholderWidth };
 }
-
-export type PreviewAccessReason = 'forbidden' | 'not_found';
-
-export class PreviewAccessError extends Error {
-  readonly reason: PreviewAccessReason;
-
-  constructor(reason: PreviewAccessReason) {
-    super(reason);
-    this.name = 'PreviewAccessError';
-    this.reason = reason;
-  }
-}
-
-export function getPreviewAccessReasonFromStatus(
-  status: number,
-): PreviewAccessReason | null {
-  if (status === 403) return 'forbidden';
-  if (status === 404) return 'not_found';
-  return null;
-}
-
-/** Fetch remote preview content; throws PreviewAccessError on 403/404. */
-export async function fetchPreviewBlob(
-  url: string,
-  signal?: AbortSignal,
-): Promise<Blob> {
-  const resp = await fetch(url, {
-    cache: 'no-store',
-    credentials: 'include',
-    signal,
-  });
-  const accessReason = getPreviewAccessReasonFromStatus(resp.status);
-  if (accessReason) {
-    throw new PreviewAccessError(accessReason);
-  }
-  if (!resp.ok) {
-    throw new Error(`HTTP ${resp.status}`);
-  }
-  return resp.blob();
-}
diff --git a/frontend/pnpm-workspace.yaml b/frontend/pnpm-workspace.yaml
index 07399aa05..3d5d51424 100644
--- a/frontend/pnpm-workspace.yaml
+++ b/frontend/pnpm-workspace.yaml
@@ -1,4 +1,2 @@
-allowBuilds:
-  core-js: true
-  sharp: true
-  unrs-resolver: true
+ignoredBuiltDependencies:
+  - unrs-resolver
diff --git a/frontend/public/locales/en/common.json b/frontend/public/locales/en/common.json
index c3ccbd6c0..9e1d3d8b8 100644
--- a/frontend/public/locales/en/common.json
+++ b/frontend/public/locales/en/common.json
@@ -17,10 +17,6 @@
   "filePreview.loadingDocument": "Loading document...",
   "filePreview.loadingPage": "Loading page...",
   "filePreview.previewFailed": "File preview failed",
-  "filePreview.knowledge.accessDenied.title": "Cannot preview",
-  "filePreview.knowledge.accessDenied.content": "You do not have permission to preview this document.",
-  "filePreview.knowledge.noStoredCopy.title": "Cannot preview",
-  "filePreview.knowledge.noStoredCopy.content": "This knowledge base does not keep a copy of the document; preview is unavailable.",
   "filePreview.emptyFile": "This file content is empty",
   "filePreview.uploadToPreview": "Please upload the file before previewing",
   "filePreview.download": "Download",
@@ -278,13 +274,6 @@
   "chatStreamHandler.parseMaxStepsDataFailed": "Failed to parse max steps data:",
 
   "taskWindow.maxStepsReached": "Max steps limit reached ({{completedSteps}} steps), summarizing current work...",
-  "taskWindow.verification.start": "Self-checking...",
-  "taskWindow.verification.pass": "Self-check passed",
-  "taskWindow.verification.warning": "Self-check needs attention",
-  "taskWindow.verification.blocked": "Self-check blocked this action",
-  "taskWindow.verification.repair": "Self-check failed, revising",
-  "taskWindow.verification.finalPass": "Final self-check passed",
-  "taskWindow.verification.finalFail": "Final self-check did not pass",
   "taskWindow.unknownSource": "Unknown Source",
   "taskWindow.knowledgeFile": "Knowledge Base File",
   "taskWindow.urlParseError": "URL parsing error:",
@@ -326,12 +315,6 @@
   "agent.contextMenu.copy": "Copy",
   "agent.copySuffix": "Copy",
   "agent.info.title": "Agent Information",
-  "agent.greeting.tabTitle": "Greeting",
-  "agent.greeting.messageTitle": "Greeting Message",
-  "agent.greeting.messagePlaceholder": "Enter agent greeting, e.g., Hello! I'm your data analysis assistant",
-  "agent.greeting.questionsTitle": "Example Questions",
-  "agent.greeting.addQuestion": "Add Example Question",
-  "agent.greeting.removeQuestion": "Remove",
   "agent.info.name.error.empty": "Name cannot be empty",
   "agent.info.name.error.format": "Name can only contain letters, numbers and underscores, and must start with a letter or underscore",
   "agent.info.name.error.length": "Name length cannot exceed 50 characters",
@@ -344,8 +327,6 @@
   "agent.author.hint": "Default: {{email}}",
   "agent.provideRunSummary": "Provide Run Summary",
   "agent.provideRunSummary.error": "Please select whether to provide run summary",
-  "agent.verification": "Self Verification",
-  "agent.verification.error": "Please select whether to enable self verification",
   "agent.description": "Agent Description",
   "agent.descriptionPlaceholder": "Please enter agent description",
   "agent.userGroup": "User Group",
@@ -386,10 +367,6 @@
   "agent.debug.stop": "Stop",
   "agent.debug.clear": "Clear",
   "agent.debug.send": "Send",
-  "agent.debug.optimizeTitle": "Prompt optimization",
-  "agent.debug.optimizeHint": "Select a reply and provide feedback. The system will optimize the agent's full system prompt.",
-  "agent.debug.selectedQuestion": "Selected question",
-  "agent.debug.selectedAnswer": "Selected answer",
   "agent.debug.userStop": "User manually stopped debugging",
   "agent.debug.cancelError": "Error while canceling request",
   "agent.debug.stopError": "Failed to stop debug mode Agent run, but frontend has stopped:",
@@ -408,11 +385,6 @@
   "agent.debug.compareEmpty": "No output yet",
   "agent.debug.defaultMode": "Default mode",
   "agent.debug.compareMode": "Compare mode",
-  "agent.debug.promptCompare.title": "Prompt compare",
-  "agent.debug.promptCompare.close": "Close",
-  "agent.debug.promptCompare.apply": "Replace with Optimized Content",
-  "agent.debug.promptCompare.original": "Original",
-  "agent.debug.promptCompare.optimized": "Optimized",
 
   "guide.steps.describeBusinessLogic.title": "Describe Business Logic",
 
@@ -434,25 +406,6 @@
   "systemPrompt.optimize.empty": "No optimized content yet",
   "systemPrompt.optimize.replace": "Replace with Optimized Content",
   "systemPrompt.optimize.error": "Failed to optimize this section",
-  "systemPrompt.optimize.generating": "Generating optimized prompt template...",
-  "systemPrompt.optimize.generatingPlaceholder": "Generating, please wait...",
-  "systemPrompt.button.badcase": "Bad Case Optimize",
-  "systemPrompt.finetune.title": "Fine-Tune",
-  "systemPrompt.finetune.modeLabel": "Adjustment Mode",
-  "systemPrompt.finetune.modeGeneral": "Global Optimize",
-  "systemPrompt.finetune.modeGeneralDesc": "Optimize the entire section based on feedback",
-  "systemPrompt.finetune.modeInsert": "Insert Content",
-  "systemPrompt.finetune.modeInsertDesc": "Insert new content at a specific position",
-  "systemPrompt.finetune.modeSelect": "Replace Selection",
-  "systemPrompt.finetune.modeSelectDesc": "Replace the selected range of content",
-  "systemPrompt.finetune.insertPositionLabel": "Insert Position (character index)",
-  "systemPrompt.finetune.insertPositionPlaceholder": "e.g. 50",
-  "systemPrompt.finetune.selectStartLabel": "Selection Start (character index)",
-  "systemPrompt.finetune.selectStartPlaceholder": "e.g. 10",
-  "systemPrompt.finetune.selectEndLabel": "Selection End (character index)",
-  "systemPrompt.finetune.selectEndPlaceholder": "e.g. 100",
-  "systemPrompt.finetune.selectTip": "Select text in the editor below to get position",
-  "systemPrompt.finetune.positionError": "Please enter a valid position number",
   "systemPrompt.expandEdit.backgroundInfo": "Background Info",
   "systemPrompt.expandEdit.close": "Save & Close",
   "systemPrompt.nonEditing.title": "Please Select an Agent First",
@@ -617,7 +570,6 @@
   "knowledgeBase.tag.createdAt": "Created on {{date}}",
   "knowledgeBase.tag.model": "{{model}} Model",
   "knowledgeBase.tag.modelMismatch": "Model Mismatch",
-  "knowledgeBase.tag.noPreserveSourceFile": "Document copy not preserved",
   "knowledgeBase.upload.modelMismatch.description": "The model of the current knowledge base does not match the configured model, file upload is not allowed, please switch the knowledge base or adjust the model configuration",
   "knowledgeBase.list.empty": "No knowledge bases yet, please create one first",
   "knowledgeBase.list.noResults": "No matching knowledge bases found",
@@ -666,7 +618,6 @@
   "knowledgeBase.name.new": "new_base",
   "knowledgeBase.message.getDocumentsFailed": "Failed to get documents",
   "knowledgeBase.create.permission.groupPlaceholder": "No user group",
-  "knowledgeBase.create.preserveSourceFile": "Preserve document copy",
   "knowledgeBase.ingroup.permission.EDIT": "In Group Read/Write",
   "knowledgeBase.ingroup.permission.READ_ONLY": "In Group Read Only",
   "knowledgeBase.ingroup.permission.PRIVATE": "Personal Private",
@@ -1108,7 +1059,6 @@
   "auth.accessDenied": "You do not have permission to access this page",
   "auth.oauthDivider": "or continue with",
   "auth.oauthLogin": "{{provider}} Login",
-  "auth.casLogin": "{{provider}} Login",
   "auth.oauthLoginFailed": "Third-party login failed: {{error}}",
   "auth.oauthLoginFailedGeneric": "Third-party login failed. Please try again.",
   "auth.oauthCompleteTitle": "Complete Account Setup",
diff --git a/frontend/public/locales/zh/common.json b/frontend/public/locales/zh/common.json
index 09b8bcd4a..114984215 100644
--- a/frontend/public/locales/zh/common.json
+++ b/frontend/public/locales/zh/common.json
@@ -17,10 +17,6 @@
   "filePreview.loadingDocument": "文档加载中...",
   "filePreview.loadingPage": "页面加载中...",
   "filePreview.previewFailed": "文件预览失败",
-  "filePreview.knowledge.accessDenied.title": "无法预览",
-  "filePreview.knowledge.accessDenied.content": "您没有权限访问该文档。",
-  "filePreview.knowledge.noStoredCopy.title": "无法预览",
-  "filePreview.knowledge.noStoredCopy.content": "当前知识库未保存该文档副本，无法预览。",
   "filePreview.emptyFile": "文件内容为空",
   "filePreview.uploadToPreview": "请上传文件后预览",
   "filePreview.download": "下载",
@@ -279,13 +275,6 @@
   "chatStreamHandler.parseMaxStepsDataFailed": "解析最大步数数据失败:",
 
   "taskWindow.maxStepsReached": "已达到最大步数限制（{{completedSteps}} 步），正在总结当前工作...",
-  "taskWindow.verification.start": "正在自检...",
-  "taskWindow.verification.pass": "自检通过",
-  "taskWindow.verification.warning": "自检发现需关注项",
-  "taskWindow.verification.blocked": "自检已阻断当前动作",
-  "taskWindow.verification.repair": "自检未通过，正在修正",
-  "taskWindow.verification.finalPass": "最终自检通过",
-  "taskWindow.verification.finalFail": "最终自检未通过",
   "taskWindow.unknownSource": "未知来源",
   "taskWindow.knowledgeFile": "知识库文件",
   "taskWindow.urlParseError": "URL解析错误:",
@@ -328,12 +317,6 @@
   "agent.contextMenu.copy": "复制",
   "agent.copySuffix": "副本",
   "agent.info.title": "智能体信息",
-  "agent.greeting.tabTitle": "开场白",
-  "agent.greeting.messageTitle": "问候语",
-  "agent.greeting.messagePlaceholder": "请输入智能体问候语，例如：你好！我是你的数据分析助手",
-  "agent.greeting.questionsTitle": "示例问题",
-  "agent.greeting.addQuestion": "添加示例问题",
-  "agent.greeting.removeQuestion": "删除",
   "agent.info.name.error.empty": "名称不能为空",
   "agent.info.name.error.format": "名称只能包含字母、数字和下划线，且必须以字母或下划线开头",
   "agent.info.name.error.length": "名称长度不能超过50个字符",
@@ -346,8 +329,6 @@
   "agent.author.hint": "默认：{{email}}",
   "agent.provideRunSummary": "提供运行摘要",
   "agent.provideRunSummary.error": "请选择是否提供运行摘要",
-  "agent.verification": "自验证",
-  "agent.verification.error": "请选择是否启用自验证",
   "agent.description": "智能体描述",
   "agent.userGroup": "用户组",
   "agent.userGroup.empty": "暂无用户组",
@@ -388,10 +369,6 @@
   "agent.debug.stop": "停止",
   "agent.debug.clear": "清空",
   "agent.debug.send": "发送",
-  "agent.debug.optimizeTitle": "提示词优化",
-  "agent.debug.optimizeHint": "选择一条回复，输入优化反馈，系统将自动优化智能体的完整系统提示词。",
-  "agent.debug.selectedQuestion": "选中的问题",
-  "agent.debug.selectedAnswer": "选中的回复",
   "agent.debug.userStop": "用户手动停止调试",
   "agent.debug.cancelError": "取消请求时出错",
   "agent.debug.stopError": "停止调试模式智能体运行失败，但前端已停止:",
@@ -410,11 +387,6 @@
   "agent.debug.compareEmpty": "暂无输出",
   "agent.debug.defaultMode": "默认模式",
   "agent.debug.compareMode": "对比模式",
-  "agent.debug.promptCompare.title": "提示词对比",
-  "agent.debug.promptCompare.close": "关闭",
-  "agent.debug.promptCompare.apply": "一键替换",
-  "agent.debug.promptCompare.original": "优化前",
-  "agent.debug.promptCompare.optimized": "优化后",
 
   "guide.steps.describeBusinessLogic.title": "描述业务逻辑",
 
@@ -590,7 +562,6 @@
   "knowledgeBase.tag.createdAt": "创建于{{date}}",
   "knowledgeBase.tag.model": "{{model}}模型",
   "knowledgeBase.tag.modelMismatch": "模型不匹配",
-  "knowledgeBase.tag.noPreserveSourceFile": "不保留文档副本",
   "knowledgeBase.upload.modelMismatch.description": "当前知识库的模型与配置模型不匹配，无法上传文件，请切换知识库或调整模型配置",
   "knowledgeBase.list.empty": "暂无知识库，请先创建知识库",
   "knowledgeBase.list.noResults": "没有找到匹配的知识库",
@@ -637,7 +608,6 @@
   "knowledgeBase.name.new": "新知识库",
   "knowledgeBase.message.getDocumentsFailed": "获取文档列表失败",
   "knowledgeBase.create.permission.groupPlaceholder": "无所属用户组",
-  "knowledgeBase.create.preserveSourceFile": "保留文档副本",
   "knowledgeBase.ingroup.permission.EDIT": "同组可编辑",
   "knowledgeBase.ingroup.permission.READ_ONLY": "同组只读",
   "knowledgeBase.ingroup.permission.PRIVATE": "私有",
@@ -1079,7 +1049,6 @@
   "auth.accessDenied": "您没有权限访问此页面",
   "auth.oauthDivider": "或使用第三方登录",
   "auth.oauthLogin": "{{provider}} 登录",
-  "auth.casLogin": "{{provider}} 登录",
   "auth.oauthLoginFailed": "第三方登录失败：{{error}}",
   "auth.oauthLoginFailedGeneric": "第三方登录失败，请重试",
   "auth.oauthCompleteTitle": "补充账号信息",
@@ -2833,16 +2802,5 @@
   "systemPrompt.optimize.optimized": "优化后",
   "systemPrompt.optimize.empty": "暂未生成优化内容",
   "systemPrompt.optimize.replace": "一键替换",
-  "systemPrompt.optimize.error": "该部分优化失败",
-  "systemPrompt.optimize.generating": "正在生成优化后的 prompt 模板...",
-  "systemPrompt.optimize.generatingPlaceholder": "正在生成中，请稍候...",
-
-  "systemPrompt.finetune.modeLabel": "使用要求",
-  "systemPrompt.finetune.modeGeneral": "全局优化",
-  "systemPrompt.finetune.modeGeneralDesc": "基于评价反馈对整个部分进行优化",
-  "systemPrompt.finetune.modeInsert": "插入内容",
-  "systemPrompt.finetune.modeInsertDesc": "在指定位置插入新的内容",
-  "systemPrompt.finetune.modeSelect": "替换选中",
-  "systemPrompt.finetune.modeSelectDesc": "替换选中的内容范围"
-
+  "systemPrompt.optimize.error": "该部分优化失败"
 }
diff --git a/frontend/server.js b/frontend/server.js
index e88304b8b..f0e615577 100644
--- a/frontend/server.js
+++ b/frontend/server.js
@@ -87,10 +87,14 @@ function setAuthCookies(res, session) {
 
   if (session.expires_at) {
     cookies.push(
-      cookie.serialize(COOKIE_NAMES.EXPIRES_AT, String(session.expires_at), {
-        ...buildCookieOptions(false), // readable by frontend JS
-        maxAge: expiresInSeconds, // Same as access token
-      })
+      cookie.serialize(
+        COOKIE_NAMES.EXPIRES_AT,
+        String(session.expires_at),
+        {
+          ...buildCookieOptions(false), // readable by frontend JS
+          maxAge: expiresInSeconds, // Same as access token
+        }
+      )
     );
   }
 
@@ -102,19 +106,10 @@ function setAuthCookies(res, session) {
 function clearAuthCookies(res) {
   const expired = { maxAge: 0, path: "/" };
   res.setHeader("Set-Cookie", [
-    cookie.serialize(COOKIE_NAMES.ACCESS_TOKEN, "", {
-      ...expired,
-      httpOnly: true,
-    }),
-    cookie.serialize(COOKIE_NAMES.REFRESH_TOKEN, "", {
-      ...expired,
-      httpOnly: true,
-    }),
+    cookie.serialize(COOKIE_NAMES.ACCESS_TOKEN, "", { ...expired, httpOnly: true }),
+    cookie.serialize(COOKIE_NAMES.REFRESH_TOKEN, "", { ...expired, httpOnly: true }),
     cookie.serialize(COOKIE_NAMES.EXPIRES_AT, "", expired),
-    cookie.serialize(COOKIE_NAMES.OAUTH_PENDING, "", {
-      ...expired,
-      httpOnly: true,
-    }),
+    cookie.serialize(COOKIE_NAMES.OAUTH_PENDING, "", { ...expired, httpOnly: true }),
   ]);
 }
 
@@ -159,12 +154,6 @@ const AUTH_INTERCEPT_ENDPOINTS = new Set([
   "/api/user/oauth/link",
   "/api/user/oauth/pending",
   "/api/user/oauth/complete",
-  "/api/user/cas/config",
-  "/api/user/cas/login",
-  "/api/user/cas/callback",
-  "/api/user/cas/renew",
-  "/api/user/cas/renew_callback",
-  "/api/user/cas/logout_callback",
 ]);
 
 function collectRequestBody(req) {
@@ -182,11 +171,8 @@ function collectRequestBody(req) {
  * If no refresh_token cookie exists, return 401 immediately.
  */
 function prepareAuthRequestBody(pathname, body, cookies, res) {
-  if (
-    pathname === "/api/user/refresh_token" ) {
-    const refreshToken =
-    cookies[COOKIE_NAMES.REFRESH_TOKEN]
-  ;
+  if (pathname === "/api/user/refresh_token") {
+    const refreshToken = cookies[COOKIE_NAMES.REFRESH_TOKEN];
     if (!refreshToken) {
       res.writeHead(401, { "Content-Type": "application/json" });
       res.end(JSON.stringify({ detail: "No refresh token cookie found" }));
@@ -208,204 +194,144 @@ function forwardAuthRequest(req, res, targetUrl) {
   const transport = parsedTarget.protocol === "https:" ? https : http;
   const cookies = parseCookies(req);
 
-  if (
-    req.parsedPathname === "/api/user/refresh_token" &&
-    !cookies[COOKIE_NAMES.REFRESH_TOKEN]
-  ) {
-    res.writeHead(204);
-    res.end();
-    return;
-  }
-
-  collectRequestBody(req)
-    .then((rawBody) => {
-      const body = prepareAuthRequestBody(req.parsedPathname, rawBody, cookies, res);
+  collectRequestBody(req).then((rawBody) => {
+    const body = prepareAuthRequestBody(req.parsedPathname, rawBody, cookies, res);
 
     // If body is null, prepareAuthRequestBody already sent the error response
     if (body === null) {
       return;
     }
 
-      const forwardHeaders = { ...req.headers, host: parsedTarget.host };
+    const forwardHeaders = { ...req.headers, host: parsedTarget.host };
 
-      // Inject access_token from cookie as Authorization header for the backend
-      if (
-        cookies[COOKIE_NAMES.ACCESS_TOKEN] &&
-        !forwardHeaders["authorization"]
-      ) {
-        forwardHeaders["authorization"] =
-          `Bearer ${cookies[COOKIE_NAMES.ACCESS_TOKEN]}`;
-      }
+    // Inject access_token from cookie as Authorization header for the backend
+    if (cookies[COOKIE_NAMES.ACCESS_TOKEN] && !forwardHeaders["authorization"]) {
+      forwardHeaders["authorization"] = `Bearer ${cookies[COOKIE_NAMES.ACCESS_TOKEN]}`;
+    }
 
-      if (
-        cookies[COOKIE_NAMES.OAUTH_PENDING] &&
-        (req.parsedPathname === "/api/user/oauth/pending" ||
-          req.parsedPathname === "/api/user/oauth/complete")
-      ) {
-        forwardHeaders["x-oauth-pending-token"] =
-          cookies[COOKIE_NAMES.OAUTH_PENDING];
-      }
+    if (
+      cookies[COOKIE_NAMES.OAUTH_PENDING] &&
+      (req.parsedPathname === "/api/user/oauth/pending" ||
+        req.parsedPathname === "/api/user/oauth/complete")
+    ) {
+      forwardHeaders["x-oauth-pending-token"] = cookies[COOKIE_NAMES.OAUTH_PENDING];
+    }
 
-      // Update content-length if body was modified
-      if (body.length !== rawBody.length) {
-        forwardHeaders["content-length"] = String(body.length);
-      }
+    // Update content-length if body was modified
+    if (body.length !== rawBody.length) {
+      forwardHeaders["content-length"] = String(body.length);
+    }
 
-      const options = {
-        hostname: parsedTarget.hostname,
-        port: parsedTarget.port,
-        path: req.url,
-        method: req.method,
-        headers: forwardHeaders,
-      };
-
-      const proxyReq = transport.request(options, (proxyRes) => {
-        const responseChunks = [];
-        proxyRes.on("data", (chunk) => responseChunks.push(chunk));
-        proxyRes.on("end", () => {
-          const responseBody = Buffer.concat(responseChunks);
-          let finalBody = responseBody;
-
-          try {
-            const contentType = proxyRes.headers["content-type"] || "";
-            if (
-              contentType.includes("application/json") &&
-              responseBody.length > 0
+    const options = {
+      hostname: parsedTarget.hostname,
+      port: parsedTarget.port,
+      path: req.url,
+      method: req.method,
+      headers: forwardHeaders,
+    };
+
+    const proxyReq = transport.request(options, (proxyRes) => {
+      const responseChunks = [];
+      proxyRes.on("data", (chunk) => responseChunks.push(chunk));
+      proxyRes.on("end", () => {
+        const responseBody = Buffer.concat(responseChunks);
+        let finalBody = responseBody;
+
+        try {
+          const contentType = proxyRes.headers["content-type"] || "";
+          if (contentType.includes("application/json") && responseBody.length > 0) {
+            const data = JSON.parse(responseBody.toString());
+
+            const isLogout = req.parsedPathname === "/api/user/logout";
+            const isRevoke = req.parsedPathname === "/api/user/revoke";
+
+            if (isLogout || isRevoke) {
+              clearAuthCookies(res);
+            } else if (
+              req.parsedPathname === "/api/user/oauth/callback" &&
+              data.data &&
+              data.data.requires_account_completion &&
+              data.data.pending_token
             ) {
-              const data = JSON.parse(responseBody.toString());
-
-              const isLogout = req.parsedPathname === "/api/user/logout";
-              const isRevoke = req.parsedPathname === "/api/user/revoke";
-
-              if (isLogout || isRevoke) {
-                clearAuthCookies(res);
-              } else if (
-                req.parsedPathname === "/api/user/oauth/callback" &&
-                data.data &&
-                data.data.requires_account_completion &&
-                data.data.pending_token
-              ) {
-                setPendingOAuthCookie(res, data.data.pending_token);
-                const locale = getPreferredLocale(cookies);
-                res.writeHead(302, { Location: `/${locale}/oauth/complete` });
-                res.end();
-                return;
-              } else if (data.data && data.data.session) {
-                const session = data.data.session;
-                setAuthCookies(res, session);
-
-                const isOAuthCallback =
-                  req.parsedPathname === "/api/user/oauth/callback";
-                const isCasCallback =
-                  req.parsedPathname === "/api/user/cas/callback";
-                const isCasRenewCallback =
-                  req.parsedPathname === "/api/user/cas/renew_callback";
-                if (isOAuthCallback) {
-                  res.writeHead(302, { Location: "/" });
-                  res.end();
-                  return;
-                }
-                if (isCasCallback) {
-                  res.writeHead(302, {
-                    Location: data.data.redirect_url || "/",
-                  });
-                  res.end();
-                  return;
-                }
-                if (isCasRenewCallback) {
-                  const html = Buffer.from(`<!doctype html><html><body><script>
-window.parent && window.parent.postMessage({ type: "cas-renew-success" }, window.location.origin);
-</script></body></html>`);
-                  const responseHeaders = {
-                    "content-type": "text/html; charset=utf-8",
-                    "content-length": String(html.length),
-                  };
-                  const existingSetCookie = res.getHeader("Set-Cookie") || [];
-                  const cookiesToSend = Array.isArray(existingSetCookie)
-                    ? existingSetCookie
-                    : [existingSetCookie];
-                  if (cookiesToSend.filter(Boolean).length > 0) {
-                    responseHeaders["set-cookie"] =
-                      cookiesToSend.filter(Boolean);
-                  }
-                  res.writeHead(200, responseHeaders);
-                  res.end(html);
-                  return;
-                }
-
-                if (req.parsedPathname === "/api/user/oauth/complete") {
-                  clearPendingOAuthCookie(res);
-                }
-
-                const sanitized = { ...data };
-                sanitized.data = { ...data.data };
-                sanitized.data.session = {
-                  expires_at: session.expires_at,
-                  expires_in_seconds: session.expires_in_seconds,
-                };
-                finalBody = Buffer.from(JSON.stringify(sanitized));
-              } else if (
-                req.parsedPathname === "/api/user/oauth/callback" &&
-                data.data &&
-                data.data.oauth_error
-              ) {
-                const errorParams = new URLSearchParams({
-                  oauth_error: data.data.oauth_error,
-                  oauth_error_description:
-                    data.data.oauth_error_description || "",
-                });
-                res.writeHead(302, { Location: `/?${errorParams.toString()}` });
+              setPendingOAuthCookie(res, data.data.pending_token);
+              const locale = getPreferredLocale(cookies);
+              res.writeHead(302, { Location: `/${locale}/oauth/complete` });
+              res.end();
+              return;
+            } else if (data.data && data.data.session) {
+              const session = data.data.session;
+              setAuthCookies(res, session);
+
+              const isOAuthCallback = req.parsedPathname === "/api/user/oauth/callback";
+              if (isOAuthCallback) {
+                res.writeHead(302, { Location: "/" });
                 res.end();
                 return;
               }
-            }
-          } catch {
-            // If JSON parsing fails, pass through unchanged
-          }
 
-          // Copy response headers, but override content-length and set cookies
-          const responseHeaders = { ...proxyRes.headers };
-          responseHeaders["content-length"] = String(finalBody.length);
-          // Merge Set-Cookie: proxyRes cookies + our auth cookies
-          const existingSetCookie = res.getHeader("Set-Cookie") || [];
-          const upstreamSetCookie = proxyRes.headers["set-cookie"] || [];
-          const mergedCookies = [
-            ...(Array.isArray(existingSetCookie)
-              ? existingSetCookie
-              : [existingSetCookie]),
-            ...(Array.isArray(upstreamSetCookie)
-              ? upstreamSetCookie
-              : [upstreamSetCookie]),
-          ].filter(Boolean);
-
-          delete responseHeaders["set-cookie"];
-          if (mergedCookies.length > 0) {
-            responseHeaders["set-cookie"] = mergedCookies;
-          }
+              if (req.parsedPathname === "/api/user/oauth/complete") {
+                clearPendingOAuthCookie(res);
+              }
 
-          res.writeHead(proxyRes.statusCode, responseHeaders);
-          res.end(finalBody);
-        });
-      });
+              const sanitized = { ...data };
+              sanitized.data = { ...data.data };
+              sanitized.data.session = {
+                expires_at: session.expires_at,
+                expires_in_seconds: session.expires_in_seconds,
+              };
+              finalBody = Buffer.from(JSON.stringify(sanitized));
+            } else if (req.parsedPathname === "/api/user/oauth/callback" && data.data && data.data.oauth_error) {
+              const errorParams = new URLSearchParams({
+                oauth_error: data.data.oauth_error,
+                oauth_error_description: data.data.oauth_error_description || "",
+              });
+              res.writeHead(302, { Location: `/?${errorParams.toString()}` });
+              res.end();
+              return;
+            }
+          }
+        } catch {
+          // If JSON parsing fails, pass through unchanged
+        }
 
-      proxyReq.on("error", (err) => {
-        console.error("[Auth Proxy] Forward error:", err.message);
-        if (!res.headersSent) {
-          res.writeHead(502, { "Content-Type": "application/json" });
-          res.end(JSON.stringify({ detail: "Backend unavailable" }));
+        // Copy response headers, but override content-length and set cookies
+        const responseHeaders = { ...proxyRes.headers };
+        responseHeaders["content-length"] = String(finalBody.length);
+        // Merge Set-Cookie: proxyRes cookies + our auth cookies
+        const existingSetCookie = res.getHeader("Set-Cookie") || [];
+        const upstreamSetCookie = proxyRes.headers["set-cookie"] || [];
+        const mergedCookies = [
+          ...(Array.isArray(existingSetCookie) ? existingSetCookie : [existingSetCookie]),
+          ...(Array.isArray(upstreamSetCookie) ? upstreamSetCookie : [upstreamSetCookie]),
+        ].filter(Boolean);
+
+        delete responseHeaders["set-cookie"];
+        if (mergedCookies.length > 0) {
+          responseHeaders["set-cookie"] = mergedCookies;
         }
+
+        res.writeHead(proxyRes.statusCode, responseHeaders);
+        res.end(finalBody);
       });
+    });
 
-      proxyReq.write(body);
-      proxyReq.end();
-    })
-    .catch((err) => {
-      console.error("[Auth Proxy] Body read error:", err.message);
+    proxyReq.on("error", (err) => {
+      console.error("[Auth Proxy] Forward error:", err.message);
       if (!res.headersSent) {
-        res.writeHead(500, { "Content-Type": "application/json" });
-        res.end(JSON.stringify({ detail: "Internal proxy error" }));
+        res.writeHead(502, { "Content-Type": "application/json" });
+        res.end(JSON.stringify({ detail: "Backend unavailable" }));
       }
     });
+
+    proxyReq.write(body);
+    proxyReq.end();
+  }).catch((err) => {
+    console.error("[Auth Proxy] Body read error:", err.message);
+    if (!res.headersSent) {
+      res.writeHead(500, { "Content-Type": "application/json" });
+      res.end(JSON.stringify({ detail: "Internal proxy error" }));
+    }
+  });
 }
 
 // ============================================================================
@@ -413,14 +339,8 @@ window.parent && window.parent.postMessage({ type: "cas-renew-success" }, window
 // ============================================================================
 proxy.on("proxyReq", (proxyReq, req) => {
   const cookies = parseCookies(req);
-  if (
-    cookies[COOKIE_NAMES.ACCESS_TOKEN] &&
-    !proxyReq.getHeader("authorization")
-  ) {
-    proxyReq.setHeader(
-      "Authorization",
-      `Bearer ${cookies[COOKIE_NAMES.ACCESS_TOKEN]}`
-    );
+  if (cookies[COOKIE_NAMES.ACCESS_TOKEN] && !proxyReq.getHeader("authorization")) {
+    proxyReq.setHeader("Authorization", `Bearer ${cookies[COOKIE_NAMES.ACCESS_TOKEN]}`);
   }
 });
 
@@ -455,18 +375,12 @@ app.prepare().then(() => {
           pathname.startsWith("/api/file/storage") ||
           pathname.startsWith("/api/file/preprocess");
         if (isRuntime) {
-          proxy.web(req, res, {
-            target: RUNTIME_HTTP_BACKEND,
-            changeOrigin: true,
-          });
+          proxy.web(req, res, { target: RUNTIME_HTTP_BACKEND, changeOrigin: true });
         } else if (
           pathname === "/api/skills/create" ||
           pathname.startsWith("/api/skills/stop/")
         ) {
-          proxy.web(req, res, {
-            target: RUNTIME_HTTP_BACKEND,
-            changeOrigin: true,
-          });
+          proxy.web(req, res, { target: RUNTIME_HTTP_BACKEND, changeOrigin: true });
         } else {
           proxy.web(req, res, { target: HTTP_BACKEND, changeOrigin: true });
         }
diff --git a/frontend/services/agentConfigService.ts b/frontend/services/agentConfigService.ts
index a955aa410..8e0f9da0d 100644
--- a/frontend/services/agentConfigService.ts
+++ b/frontend/services/agentConfigService.ts
@@ -200,9 +200,7 @@ export const fetchPublishedAgentList = async () => {
       group_ids: agent.group_ids || [],
       is_new: agent.is_new || false,
       permission: agent.permission,
-      current_version_no: agent.current_version_no,
-      greeting_message: agent.greeting_message,
-      example_questions: agent.example_questions || [],
+      published_version_no: agent.published_version_no,
     }));
 
     return {
@@ -409,7 +407,6 @@ export interface UpdateAgentInfoPayload {
   max_steps?: number;
   provide_run_summary?: boolean;
   enable_context_manager?: boolean;
-  verification_config?: Record<string, any>;
   enabled?: boolean;
   business_description?: string;
   business_logic_model_name?: string;
@@ -421,8 +418,6 @@ export interface UpdateAgentInfoPayload {
   related_agent_ids?: number[];
   related_external_agent_ids?: number[];
   ingroup_permission?: string;
-  greeting_message?: string;
-  example_questions?: string[];
 }
 
 export const updateAgentInfo = async (payload: UpdateAgentInfoPayload) => {
@@ -774,7 +769,6 @@ export const searchAgentInfo = async (
       prompt_template_id: data.prompt_template_id ?? 0,
       prompt_template_name: data.prompt_template_name ?? "system_default",
       provide_run_summary: data.provide_run_summary,
-      verification_config: data.verification_config,
       enabled: data.enabled,
       is_available: data.is_available,
       unavailable_reasons: data.unavailable_reasons || [],
@@ -812,8 +806,6 @@ export const searchAgentInfo = async (
           })
         : [],
       skills: data.skills || [],
-      greeting_message: data.greeting_message || "",
-      example_questions: data.example_questions || [],
       current_version_no: data.current_version_no,
     };
 
diff --git a/frontend/services/agentVersionService.ts b/frontend/services/agentVersionService.ts
index d520e05cb..31dec3eb0 100644
--- a/frontend/services/agentVersionService.ts
+++ b/frontend/services/agentVersionService.ts
@@ -33,7 +33,6 @@ export interface Agent {
   tenant_id: string;
   enabled: boolean;
   provide_run_summary: boolean;
-  verification_config?: Record<string, any>;
   business_description?: string;
   business_logic_model_name?: string;
   business_logic_model_id?: number;
@@ -548,4 +547,4 @@ export async function updateVersion(
       message: error instanceof Error ? error.message : "Failed to update version",
     };
   }
-}
+}
\ No newline at end of file
diff --git a/frontend/services/api.ts b/frontend/services/api.ts
index ef8b97ff4..490b3c56d 100644
--- a/frontend/services/api.ts
+++ b/frontend/services/api.ts
@@ -30,11 +30,6 @@ export const API_ENDPOINTS = {
     accounts: `${API_BASE_URL}/user/oauth/accounts`,
     unlink: (provider: string) => `${API_BASE_URL}/user/oauth/accounts/${provider}`,
   },
-  cas: {
-    config: `${API_BASE_URL}/user/cas/config`,
-    login: `${API_BASE_URL}/user/cas/login`,
-    renew: `${API_BASE_URL}/user/cas/renew`,
-  },
   conversation: {
     list: `${API_BASE_URL}/conversation/list`,
     create: `${API_BASE_URL}/conversation/create`,
diff --git a/frontend/services/authService.ts b/frontend/services/authService.ts
index 7589622b4..1735adc1a 100644
--- a/frontend/services/authService.ts
+++ b/frontend/services/authService.ts
@@ -14,7 +14,6 @@ import { ASSET_OWNER_TENANT_ID, STATUS_CODES, USER_ROLES } from "@/const/auth";
 
 import { generateAvatarUrl } from "@/lib/auth";
 import { fetchWithAuth } from "@/lib/auth";
-import { authFlowState } from "@/lib/authFlow";
 import {
   removeSessionFromStorage,
   getSessionFromStorage,
@@ -163,9 +162,7 @@ export const authService = {
       return {
         error: {
           message:
-            error instanceof Error
-              ? error.message
-              : "Network error, please try again later",
+            error instanceof Error ? error.message : "Network error, please try again later",
           code:
             error instanceof Error && "code" in error
               ? (error as any).code
@@ -271,29 +268,19 @@ export const authService = {
   },
 
   signOut: async (): Promise<{ error: null }> => {
-    authFlowState.beginExplicitLogout();
     try {
-      const response = await fetchWithAuth(API_ENDPOINTS.user.logout, {
+      await fetchWithAuth(API_ENDPOINTS.user.logout, {
         method: "POST",
-        keepalive: true,
       });
-      const data = await response.json().catch(() => null);
-      const casLogoutUrl = data?.data?.cas_logout_url;
 
       // server.js clears HttpOnly cookies; clear local user info
       removeSessionFromStorage();
-      if (casLogoutUrl && typeof window !== "undefined") {
-        window.location.href = casLogoutUrl;
-      } else {
-        authFlowState.endExplicitLogout();
-      }
 
       return { error: null };
     } catch (error) {
       log.error("Logout failed:", error);
 
       removeSessionFromStorage();
-      authFlowState.endExplicitLogout();
 
       return { error: null };
     }
@@ -344,16 +331,11 @@ export const authService = {
           ),
           email: data.data.user.user_email,
           role: data.data.user.user_role,
-          authProvider: data.data.user.auth_provider,
           avatarUrl: data.data.user.avatarUrl,
-          permissions: data.data.user.permissions.map((permission: string) =>
-            permission.toLowerCase()
-          ),
-          accessibleRoutes: data.data.user.accessibleRoutes.map(
-            (router: string) => router.toLowerCase()
-          ),
-        },
-      };
+          permissions: data.data.user.permissions.map((permission:string) => permission.toLowerCase()),
+          accessibleRoutes: data.data.user.accessibleRoutes.map((router:string) => router.toLowerCase()),
+        }
+      }
       return userData as AuthInfoResponse;
     } catch (error) {
       log.error("Failed to get user Info:", error);
@@ -392,9 +374,7 @@ export const authService = {
       if (errorCode === ErrorCode.INVALID_CREDENTIALS) {
         return {
           errorCode: ErrorCode.INVALID_CREDENTIALS,
-          error:
-            error?.message ||
-            getI18nErrorMessage(ErrorCode.INVALID_CREDENTIALS),
+          error: error?.message || getI18nErrorMessage(ErrorCode.INVALID_CREDENTIALS),
         };
       }
       if (errorCode === ErrorCode.PASSWORD_WEAK) {
@@ -406,9 +386,7 @@ export const authService = {
       if (errorCode === ErrorCode.PASSWORD_SAME_AS_OLD) {
         return {
           errorCode: ErrorCode.PASSWORD_SAME_AS_OLD,
-          error:
-            error?.message ||
-            getI18nErrorMessage(ErrorCode.PASSWORD_SAME_AS_OLD),
+          error: error?.message || getI18nErrorMessage(ErrorCode.PASSWORD_SAME_AS_OLD),
         };
       }
 
diff --git a/frontend/services/casService.ts b/frontend/services/casService.ts
deleted file mode 100644
index 2c2dd2cb0..000000000
--- a/frontend/services/casService.ts
+++ /dev/null
@@ -1,69 +0,0 @@
-import { API_ENDPOINTS } from "@/services/api";
-import log from "@/lib/logger";
-
-export interface CasConfig {
-  enabled: boolean;
-  login_mode: "button" | "force" | "disabled";
-  renew_before_seconds: number;
-  renew_timeout_seconds: number;
-  display_name: string;
-}
-
-const disabledConfig: CasConfig = {
-  enabled: false,
-  login_mode: "disabled",
-  renew_before_seconds: 300,
-  renew_timeout_seconds: 10,
-  display_name: "CAS",
-};
-
-export const casService = {
-  getConfig: async (): Promise<CasConfig> => {
-    try {
-      const response = await fetch(API_ENDPOINTS.cas.config);
-      if (!response.ok) return disabledConfig;
-      const data = await response.json();
-      return { ...disabledConfig, ...(data.data || {}) };
-    } catch (error) {
-      log.warn("Failed to fetch CAS config:", error);
-      return disabledConfig;
-    }
-  },
-
-  startLogin: (redirect?: string): void => {
-    const target = redirect || window.location.pathname + window.location.search;
-    window.location.href = `${API_ENDPOINTS.cas.login}?redirect=${encodeURIComponent(target)}`;
-  },
-
-  renewInIframe: (timeoutSeconds: number): Promise<boolean> => {
-    if (typeof window === "undefined") return Promise.resolve(false);
-
-    return new Promise((resolve) => {
-      const iframe = document.createElement("iframe");
-      iframe.src = API_ENDPOINTS.cas.renew;
-      iframe.style.display = "none";
-      iframe.setAttribute("aria-hidden", "true");
-
-      let settled = false;
-      const cleanup = () => {
-        window.removeEventListener("message", onMessage);
-        iframe.remove();
-      };
-      const finish = (ok: boolean) => {
-        if (settled) return;
-        settled = true;
-        cleanup();
-        resolve(ok);
-      };
-      const onMessage = (event: MessageEvent) => {
-        if (event.origin !== window.location.origin) return;
-        if (event.data?.type === "cas-renew-success") finish(true);
-        if (event.data?.type === "cas-renew-failed") finish(false);
-      };
-
-      window.addEventListener("message", onMessage);
-      document.body.appendChild(iframe);
-      window.setTimeout(() => finish(false), Math.max(1, timeoutSeconds) * 1000);
-    });
-  },
-};
diff --git a/frontend/services/knowledgeBaseService.ts b/frontend/services/knowledgeBaseService.ts
index da760e0bf..bd13de32d 100644
--- a/frontend/services/knowledgeBaseService.ts
+++ b/frontend/services/knowledgeBaseService.ts
@@ -155,10 +155,7 @@ class KnowledgeBaseService {
     userId: string
   ): Promise<Array<{ id: string; name: string }>> {
     try {
-      const url = new URL(
-        API_ENDPOINTS.idata.knowledgeSpaces,
-        window.location.origin
-      );
+      const url = new URL(API_ENDPOINTS.idata.knowledgeSpaces, window.location.origin);
       url.searchParams.set("idata_api_base", idataApiBase);
       url.searchParams.set("api_key", apiKey);
       url.searchParams.set("user_id", userId);
@@ -173,12 +170,8 @@ class KnowledgeBaseService {
       // Check for error response from middleware (has code field)
       if (result.code !== undefined && result.code !== 0) {
         const errorCode = result.code || response.status;
-        const errorMessage =
-          result.message || "Failed to fetch iData knowledge spaces";
-        log.error("iData API error:", {
-          code: errorCode,
-          message: errorMessage,
-        });
+        const errorMessage = result.message || "Failed to fetch iData knowledge spaces";
+        log.error("iData API error:", { code: errorCode, message: errorMessage });
         throw new ApiError(errorCode, errorMessage);
       }
 
@@ -219,10 +212,7 @@ class KnowledgeBaseService {
       if (result.code !== undefined && result.code !== 0) {
         const errorCode = result.code || response.status;
         const errorMessage = result.message || "Failed to fetch iData datasets";
-        log.error("iData API error:", {
-          code: errorCode,
-          message: errorMessage,
-        });
+        log.error("iData API error:", { code: errorCode, message: errorMessage });
         throw new ApiError(errorCode, errorMessage);
       }
 
@@ -377,10 +367,7 @@ class KnowledgeBaseService {
   /**
    * Fetch Haotian knowledge sets via backend proxy.
    */
-  async getHaotianKnowledgeSets(
-    listUrl: string,
-    externalAuthorization: string
-  ): Promise<{
+  async getHaotianKnowledgeSets(listUrl: string, externalAuthorization: string): Promise<{
     knowledge_sets: Array<{
       name: string;
       knowledge_bases: Array<{ dify_dataset_id: string; name: string }>;
@@ -407,10 +394,7 @@ class KnowledgeBaseService {
   /**
    * Test Haotian connection via backend proxy.
    */
-  async testHaotianConnection(
-    listUrl: string,
-    externalAuthorization: string
-  ): Promise<{
+  async testHaotianConnection(listUrl: string, externalAuthorization: string): Promise<{
     success: boolean;
     error?: string;
   }> {
@@ -432,8 +416,7 @@ class KnowledgeBaseService {
     } catch (error) {
       return {
         success: false,
-        error:
-          error instanceof Error ? error.message : "Connection test failed",
+        error: error instanceof Error ? error.message : "Connection test failed",
       };
     }
   }
@@ -578,10 +561,7 @@ class KnowledgeBaseService {
                       null,
                     is_multimodal: resolveIsMultimodal(indexInfo, stats),
                     // Use embedding_model_name (display_name) from backend, fallback to ES stats
-                    embeddingModel:
-                      indexInfo.embedding_model_name ||
-                      stats.embedding_model ||
-                      "unknown",
+                    embeddingModel: indexInfo.embedding_model_name || stats.embedding_model || "unknown",
                     summaryFrequency: indexInfo.summary_frequency || null,
                     lastSummaryTime: indexInfo.last_summary_time || null,
                     knowledge_sources:
@@ -599,7 +579,6 @@ class KnowledgeBaseService {
                     tokenNum: 0,
                     source: "nexent",
                     tenant_id: indexInfo.tenant_id,
-                    preserve_source_file: indexInfo.preserve_source_file ?? true,
                   };
                 }
               );
@@ -779,7 +758,6 @@ class KnowledgeBaseService {
         ingroup_permission?: string;
         group_ids?: number[];
         is_multimodal?: boolean;
-        preserve_source_file?: boolean;
       } = {
         name: params.name,
         description: params.description || "",
@@ -794,9 +772,6 @@ class KnowledgeBaseService {
       if (params.group_ids && params.group_ids.length > 0) {
         requestBody.group_ids = params.group_ids;
       }
-      if (params.preserve_source_file !== undefined) {
-        requestBody.preserve_source_file = params.preserve_source_file;
-      }
 
       const response = await fetch(
         API_ENDPOINTS.knowledgeBase.indexDetail(params.name),
@@ -1550,7 +1525,9 @@ class KnowledgeBaseService {
   }
 
   // Embedding model status and configuration
-  async getEmbeddingModelStatus(indexName: string): Promise<{
+  async getEmbeddingModelStatus(
+    indexName: string
+  ): Promise<{
     status: "configured" | "legacy" | "missing";
     needs_config: boolean;
     index_name: string;
@@ -1577,9 +1554,7 @@ class KnowledgeBaseService {
         const errorData = await response.json().catch(() => ({}));
         throw new ApiError(
           response.status,
-          errorData.detail ||
-            errorData.message ||
-            "Failed to get embedding model status"
+          errorData.detail || errorData.message || "Failed to get embedding model status"
         );
       }
 
diff --git a/frontend/services/promptService.ts b/frontend/services/promptService.ts
index 399511a72..2899fd370 100644
--- a/frontend/services/promptService.ts
+++ b/frontend/services/promptService.ts
@@ -4,8 +4,6 @@ import {
   GeneratePromptParams,
   OptimizePromptSectionParams,
   OptimizePromptSectionResponse,
-  OptimizePromptBadCaseParams,
-  OptimizePromptBadCaseResponse,
   StreamResponseData,
 } from '@/types/agentConfig';
 import { fetchWithAuth, getAuthHeaders } from '@/lib/auth';
@@ -83,5 +81,3 @@ export const optimizePromptSection = async (
   const result = await response.json();
   return result.data as OptimizePromptSectionResponse;
 };
-
-// optimizePromptBadCase removed: badcase optimization is now fully automated in agent debug.
diff --git a/frontend/services/sessionService.ts b/frontend/services/sessionService.ts
index 817eede03..273f3c9bd 100644
--- a/frontend/services/sessionService.ts
+++ b/frontend/services/sessionService.ts
@@ -26,10 +26,6 @@ export const sessionService = {
         body: JSON.stringify({}),
       });
 
-      if (response.status === 204) {
-        return null;
-      }
-
       if (!response.ok) {
         return null;
       }
diff --git a/frontend/stores/agentConfigStore.ts b/frontend/stores/agentConfigStore.ts
index e1a1b9545..bdbf54cac 100644
--- a/frontend/stores/agentConfigStore.ts
+++ b/frontend/stores/agentConfigStore.ts
@@ -10,13 +10,7 @@
 
 import { create } from "zustand";
 
-import {
-  Agent,
-  Tool,
-  AgentConfigUpdate,
-  Skill,
-  DEFAULT_AGENT_VERIFICATION_CONFIG,
-} from "@/types/agentConfig";
+import { Agent, Tool, AgentConfigUpdate, Skill } from "@/types/agentConfig";
 import { getAgentGenerationCache } from "@/lib/agentGenerationCache";
 
 /**
@@ -44,12 +38,9 @@ export type EditableAgent = Pick<
   | "business_logic_model_id"
   | "prompt_template_id"
   | "prompt_template_name"
-  | "verification_config"
   | "sub_agent_id_list"
   | "group_ids"
   | "ingroup_permission"
-  | "greeting_message"
-  | "example_questions"
 > & {
   skills: Skill[];
   external_sub_agent_id_list?: number[];
@@ -177,12 +168,9 @@ function createEmptyEditableAgent(llmConfig?: { id: number | null; name: string;
     business_logic_model_id: llmConfig?.id || 0,
     prompt_template_id: 0,
     prompt_template_name: "system_default",
-    verification_config: { ...DEFAULT_AGENT_VERIFICATION_CONFIG },
     sub_agent_id_list: [],
     group_ids: [],
     ingroup_permission: "READ_ONLY",
-    greeting_message: "",
-    example_questions: [],
   };
 }
 
@@ -209,14 +197,11 @@ const toEditable = (agent: Agent | null): EditableAgent =>
         business_logic_model_id: agent.business_logic_model_id || 0,
         prompt_template_id: agent.prompt_template_id ?? 0,
         prompt_template_name: agent.prompt_template_name || "system_default",
-        verification_config: agent.verification_config || { ...DEFAULT_AGENT_VERIFICATION_CONFIG },
         sub_agent_id_list: agent.sub_agent_id_list || [],
         external_sub_agent_id_list: agent.external_sub_agent_id_list || [],
         group_ids: agent.group_ids || [],
         ingroup_permission: agent.ingroup_permission || "READ_ONLY",
         prompts_hidden: agent.prompts_hidden,
-        greeting_message: agent.greeting_message || "",
-        example_questions: agent.example_questions || [],
       }
     : { ...emptyEditableAgent };
 
@@ -327,16 +312,12 @@ const isDirty = (
       editedAgent.business_logic_model_id !== 0 ||
       (editedAgent.prompt_template_id ?? 0) !== 0 ||
       (editedAgent.prompt_template_name || "system_default") !== "system_default" ||
-      JSON.stringify(editedAgent.verification_config || DEFAULT_AGENT_VERIFICATION_CONFIG) !==
-        JSON.stringify(DEFAULT_AGENT_VERIFICATION_CONFIG) ||
       normalizeArray(editedAgent.group_ids || []).length > 0 ||
       normalizeArray(editedAgent.sub_agent_id_list || []).length > 0 ||
       normalizeArray(editedAgent.external_sub_agent_id_list || []).length > 0 ||
       editedAgent.tools.length > 0 ||
       editedAgent.skills.length > 0 ||
-      editedAgent.ingroup_permission !== "READ_ONLY" ||
-      editedAgent.greeting_message !== "" ||
-      (editedAgent.example_questions || []).length > 0
+      editedAgent.ingroup_permission !== "READ_ONLY"
     );
   }
 
@@ -357,8 +338,6 @@ const isDirty = (
     baselineAgent.business_logic_model_id !== editedAgent.business_logic_model_id ||
     (baselineAgent.prompt_template_id ?? 0) !== (editedAgent.prompt_template_id ?? 0) ||
     (baselineAgent.prompt_template_name || "system_default") !== (editedAgent.prompt_template_name || "system_default") ||
-    JSON.stringify(baselineAgent.verification_config || DEFAULT_AGENT_VERIFICATION_CONFIG) !==
-      JSON.stringify(editedAgent.verification_config || DEFAULT_AGENT_VERIFICATION_CONFIG) ||
     JSON.stringify(normalizeArray(baselineAgent.group_ids ?? [])) !==
       JSON.stringify(normalizeArray(editedAgent.group_ids ?? [])) ||
     JSON.stringify(normalizeArray(baselineAgent.sub_agent_id_list ?? [])) !==
@@ -367,9 +346,7 @@ const isDirty = (
       JSON.stringify(normalizeArray(editedAgent.external_sub_agent_id_list ?? [])) ||
     isToolsDirty(baselineAgent.tools, editedAgent.tools) ||
     isSkillsDirty(baselineAgent.skills, editedAgent.skills) ||
-    baselineAgent.ingroup_permission !== editedAgent.ingroup_permission ||
-    baselineAgent.greeting_message !== editedAgent.greeting_message ||
-    JSON.stringify(baselineAgent.example_questions ?? []) !== JSON.stringify(editedAgent.example_questions ?? [])
+    baselineAgent.ingroup_permission !== editedAgent.ingroup_permission
   );
 };
 
@@ -407,12 +384,6 @@ export const useAgentConfigStore = create<AgentConfigStoreState>((set, get) => (
         if (cached.dutyPrompt) cacheUpdates.duty_prompt = cached.dutyPrompt;
         if (cached.constraintPrompt) cacheUpdates.constraint_prompt = cached.constraintPrompt;
         if (cached.fewShotsPrompt) cacheUpdates.few_shots_prompt = cached.fewShotsPrompt;
-        if (cached.greetingMessage) cacheUpdates.greeting_message = cached.greetingMessage;
-        if (cached.exampleQuestions) {
-          cacheUpdates.example_questions = typeof cached.exampleQuestions === "string"
-            ? (() => { try { return JSON.parse(cached.exampleQuestions); } catch { return []; } })()
-            : cached.exampleQuestions;
-        }
         
         // Only restore agent metadata if not already set in baseline
         if (cached.agentName && !editedAgent.name) cacheUpdates.name = cached.agentName;
@@ -537,3 +508,4 @@ export const useAgentConfigStore = create<AgentConfigStoreState>((set, get) => (
     return get().baselineAgent;
   },
 }));
+
diff --git a/frontend/types/agentConfig.ts b/frontend/types/agentConfig.ts
index e717da7cd..0287fbff9 100644
--- a/frontend/types/agentConfig.ts
+++ b/frontend/types/agentConfig.ts
@@ -24,51 +24,10 @@ export type AgentConfigUpdate = Partial<Pick<
   | "business_logic_model_name"
   | "prompt_template_id"
   | "prompt_template_name"
-  | "verification_config"
   | "group_ids"
   | "ingroup_permission"
-  | "greeting_message"
-  | "example_questions"
 >>;
 
-export interface AgentVerificationConfig {
-  enabled: boolean;
-  step_verification_enabled: boolean;
-  final_verification_enabled: boolean;
-  llm_verification_enabled?: boolean;
-  max_final_rounds: number;
-  strictness: "lenient" | "balanced" | "strict";
-  fail_policy: "repair_then_controlled_summary" | "warn";
-  pass_score?: number;
-  critical_events: Array<
-    | "tool_precheck"
-    | "tool_result"
-    | "retrieval"
-    | "code_execution"
-    | "handoff"
-    | "final_answer"
-  >;
-}
-
-export const DEFAULT_AGENT_VERIFICATION_CONFIG: AgentVerificationConfig = {
-  enabled: true,
-  step_verification_enabled: true,
-  final_verification_enabled: true,
-  llm_verification_enabled: true,
-  max_final_rounds: 2,
-  strictness: "balanced",
-  fail_policy: "repair_then_controlled_summary",
-  pass_score: 0.75,
-  critical_events: [
-    "tool_precheck",
-    "tool_result",
-    "retrieval",
-    "code_execution",
-    "handoff",
-    "final_answer",
-  ],
-};
-
 // ========== Core Interfaces ==========
 
 export interface Agent {
@@ -83,7 +42,6 @@ export interface Agent {
   max_step: number;
   provide_run_summary: boolean;
   enable_context_manager?: boolean;
-  verification_config?: AgentVerificationConfig;
   tools: Tool[];
   skills?: Skill[];  // Skills configured for this agent
   duty_prompt?: string;
@@ -109,8 +67,6 @@ export interface Agent {
   prompts_hidden?: boolean;
   current_version_no?: number;
   is_a2a_server?: boolean;
-  greeting_message?: string;
-  example_questions?: string[];
 }
 
 export interface Tool {
@@ -504,14 +460,11 @@ export interface GeneratePromptParams {
 export interface OptimizePromptSectionParams {
   agent_id: number;
   task_description: string;
-  model_id: number;
+  model_id: string;
   section_type: "duty" | "constraint" | "few_shots";
   section_title: string;
   current_content: string;
   feedback: string;
-  mode?: "general" | "insert" | "select";
-  start_pos?: number;
-  end_pos?: number;
   tool_ids?: number[];
   sub_agent_ids?: number[];
   knowledge_base_display_names?: string[];
@@ -524,32 +477,6 @@ export interface OptimizePromptSectionResponse {
   optimized_content: string;
 }
 
-export interface BadCaseItem {
-  question: string;
-  answer: string;
-  label?: string;
-  reason?: string;
-}
-
-export interface OptimizePromptBadCaseParams {
-  agent_id: number;
-  model_id: number;
-  current_content: string;
-  bad_cases: BadCaseItem[];
-  section_type: string;
-  section_title: string;
-  tool_ids?: number[];
-  sub_agent_ids?: number[];
-  knowledge_base_display_names?: string[];
-}
-
-export interface OptimizePromptBadCaseResponse {
-  section_type: string;
-  section_title: string;
-  original_content: string;
-  optimized_content: string;
-}
-
 /**
  * Stream Response Data Structure
  */
diff --git a/frontend/types/auth.ts b/frontend/types/auth.ts
index f7781e6eb..69d0d436c 100644
--- a/frontend/types/auth.ts
+++ b/frontend/types/auth.ts
@@ -9,7 +9,6 @@ export interface User {
   role: UserRole;
   avatarUrl?: string;
   tenantId?: string;
-  authProvider?: "local" | "cas";
 }
 
 // Session type definition
diff --git a/frontend/types/chat.ts b/frontend/types/chat.ts
index 60778e98c..dca79e3dc 100644
--- a/frontend/types/chat.ts
+++ b/frontend/types/chat.ts
@@ -36,12 +36,11 @@ export interface StepContent {
         typeof chatConfig.messageTypes.VIRTUAL |
         typeof chatConfig.messageTypes.MEMORY_SEARCH |
         typeof chatConfig.messageTypes.PREPROCESS |
-        typeof chatConfig.messageTypes.VERIFICATION |
         typeof chatConfig.messageTypes.MAX_STEPS_REACHED
   content: string
   expanded: boolean
   timestamp: number
-  subType?: "thinking" | "code" | "deep_thinking" | "progress" | "file_processed" | "truncation" | "complete" | "error" | "verification"
+  subType?: "thinking" | "code" | "deep_thinking" | "progress" | "file_processed" | "truncation" | "complete" | "error"
   isLoading?: boolean
   _preserve?: boolean
   _messageContainer?: {
@@ -75,7 +74,7 @@ metrics: TokenMetrics | null
 
 export interface ChatAgentSelectorProps {
   selectedAgentId: string | null;
-  onAgentSelect: (agentId: string | null, greetingMessage?: string, exampleQuestions?: string[]) => void;
+  onAgentSelect: (agentId: string | null) => void;
   disabled?: boolean;
   isInitialMode?: boolean;
 }
@@ -140,7 +139,6 @@ type LocalFilePreviewSource = {
 export type FilePreviewProps = {
   open: boolean;
   onClose: () => void;
-  previewContext?: 'knowledgeBase';
 } & (RemoteFilePreviewSource | LocalFilePreviewSource);
 
 // Main chat message type
@@ -206,11 +204,9 @@ export interface ChatStreamMainProps {
   currentConversationId?: number;
   shouldScrollToBottom?: boolean;
   selectedAgentId?: string | null;
-  onAgentSelect?: (agentId: string | null, greetingMessage?: string, exampleQuestions?: string[]) => void;
+  onAgentSelect?: (agentId: string | null) => void;
   onCitationHover?: () => void;
   onScroll?: () => void;
-  agentGreeting?: string | null;
-  agentExampleQuestions?: string[];
 }
 
 // Card item type for task window
diff --git a/frontend/types/knowledgeBase.ts b/frontend/types/knowledgeBase.ts
index ed32fad3d..7caf4986c 100644
--- a/frontend/types/knowledgeBase.ts
+++ b/frontend/types/knowledgeBase.ts
@@ -37,7 +37,6 @@ export interface KnowledgeBase {
   tenant_id?: string;
   summaryFrequency?: string | null;
   lastSummaryTime?: string | null;
-  preserve_source_file?: boolean;
 }
 
 // Create knowledge base parameter type
@@ -50,7 +49,6 @@ export interface KnowledgeBaseCreateParams {
   ingroup_permission?: string;
   group_ids?: number[];
   is_multimodal?: boolean;
-  preserve_source_file?: boolean;
 }
 
 // Document type
diff --git a/k8s/helm/deploy.sh b/k8s/helm/deploy.sh
index 07522d22c..7a583307d 100755
--- a/k8s/helm/deploy.sh
+++ b/k8s/helm/deploy.sh
@@ -611,7 +611,7 @@ apply() {
                 sleep 5
                 for svc in $backend_services; do
                     echo "  Waiting for nexent-$svc..."
-                    if kubectl rollout status "deployment/nexent-$svc" -n "$NAMESPACE" --timeout=300s >/dev/null 2>&1; then
+                    if kubectl wait --for=condition=ready pod -l app=nexent-$svc -n $NAMESPACE --timeout=300s 2>/dev/null; then
                         echo "  nexent-$svc is ready."
                     else
                         echo "  Error: nexent-$svc did not become ready within timeout."
diff --git a/k8s/helm/nexent/charts/nexent-common/files/init.sql b/k8s/helm/nexent/charts/nexent-common/files/init.sql
index 399c50917..f27f2ad85 100644
--- a/k8s/helm/nexent/charts/nexent-common/files/init.sql
+++ b/k8s/helm/nexent/charts/nexent-common/files/init.sql
@@ -337,12 +337,9 @@ CREATE TABLE IF NOT EXISTS nexent.ag_tenant_agent_t (
     is_new BOOLEAN DEFAULT FALSE,
     provide_run_summary BOOLEAN DEFAULT FALSE,
     enable_context_manager BOOLEAN DEFAULT FALSE,
-    verification_config JSONB,
     version_no INTEGER DEFAULT 0 NOT NULL,
     current_version_no INTEGER NULL,
     ingroup_permission VARCHAR(30),
-    greeting_message TEXT,
-    example_questions JSONB,
     create_time TIMESTAMP WITHOUT TIME ZONE DEFAULT CURRENT_TIMESTAMP,
     update_time TIMESTAMP WITHOUT TIME ZONE DEFAULT CURRENT_TIMESTAMP,
     created_by VARCHAR(100),
@@ -400,9 +397,6 @@ COMMENT ON COLUMN nexent.ag_tenant_agent_t.version_no IS 'Version number. 0 = dr
 COMMENT ON COLUMN nexent.ag_tenant_agent_t.current_version_no IS 'Current published version number. NULL means no version published yet';
 COMMENT ON COLUMN nexent.ag_tenant_agent_t.ingroup_permission IS 'In-group permission: EDIT, READ_ONLY, PRIVATE';
 COMMENT ON COLUMN nexent.ag_tenant_agent_t.enable_context_manager IS 'Whether to enable context management (compression) for this agent';
-COMMENT ON COLUMN nexent.ag_tenant_agent_t.verification_config IS 'Layered ReAct self-verification configuration';
-COMMENT ON COLUMN nexent.ag_tenant_agent_t.greeting_message IS 'Agent greeting message displayed on chat initial screen';
-COMMENT ON COLUMN nexent.ag_tenant_agent_t.example_questions IS 'List of example questions for starting a conversation with this agent';
 
 -- Create index for is_new queries
 CREATE INDEX IF NOT EXISTS idx_ag_tenant_agent_t_is_new
@@ -1868,238 +1862,3 @@ FOR EACH ROW
 EXECUTE FUNCTION update_mcp_community_record_update_time();
 
 COMMENT ON TRIGGER update_mcp_community_record_update_time_trigger ON nexent.mcp_community_record_t IS 'Trigger to maintain update_time';
-
-CREATE TABLE IF NOT EXISTS nexent.user_cas_session_t (
-    cas_session_id SERIAL PRIMARY KEY,
-    session_id VARCHAR(100) NOT NULL UNIQUE,
-    user_id VARCHAR(100) NOT NULL,
-    cas_user_id VARCHAR(200) NOT NULL,
-    cas_session_index VARCHAR(500),
-    status VARCHAR(30) NOT NULL DEFAULT 'active',
-    expires_at TIMESTAMP NOT NULL,
-    revoked_at TIMESTAMP,
-    create_time TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
-    update_time TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
-    created_by VARCHAR(100),
-    updated_by VARCHAR(100),
-    delete_flag VARCHAR(1) DEFAULT 'N'
-);
-
-CREATE INDEX IF NOT EXISTS ix_user_cas_session_session_id
-    ON nexent.user_cas_session_t (session_id);
-CREATE INDEX IF NOT EXISTS ix_user_cas_session_user_id
-    ON nexent.user_cas_session_t (user_id);
-CREATE INDEX IF NOT EXISTS ix_user_cas_session_cas_user_id
-    ON nexent.user_cas_session_t (cas_user_id);
-
-COMMENT ON TABLE nexent.user_cas_session_t IS 'Server-side session records for CAS SSO login and logout synchronization';
-COMMENT ON COLUMN nexent.user_cas_session_t.session_id IS 'JWT sid claim for revocation checks';
-COMMENT ON COLUMN nexent.user_cas_session_t.cas_user_id IS 'User identifier returned by CAS';
-COMMENT ON COLUMN nexent.user_cas_session_t.cas_session_index IS 'CAS SessionIndex or service ticket';
-
--- Rename params -> config_values, add config_schemas to ag_skill_info_t
--- Add tenant_id column for multi-tenancy support
-ALTER TABLE nexent.ag_skill_info_t ADD COLUMN IF NOT EXISTS tenant_id VARCHAR(100);
-
--- Add config_values and config_schemas to ag_skill_info_t
-DO $$
-BEGIN
-    IF EXISTS (
-        SELECT 1 FROM information_schema.columns
-        WHERE table_schema = 'nexent'
-          AND table_name   = 'ag_skill_info_t'
-          AND column_name  = 'params'
-    ) THEN
-        ALTER TABLE nexent.ag_skill_info_t RENAME COLUMN params TO config_values;
-    END IF;
-END $$;
-ALTER TABLE nexent.ag_skill_info_t ADD COLUMN IF NOT EXISTS config_schemas JSON;
-
--- Comments for ag_skill_info_t columns
-COMMENT ON COLUMN nexent.ag_skill_info_t.tenant_id IS 'Tenant ID for multi-tenancy. NULL for pre-existing skills.';
-COMMENT ON COLUMN nexent.ag_skill_info_t.config_values IS 'Runtime parameter values from config/config.yaml';
-COMMENT ON COLUMN nexent.ag_skill_info_t.config_schemas IS 'Parameter metadata list from config/schema.yaml';
-
--- Add config_values and config_schemas to ag_skill_instance_t
-ALTER TABLE nexent.ag_skill_instance_t ADD COLUMN IF NOT EXISTS config_values JSON;
-ALTER TABLE nexent.ag_skill_instance_t ADD COLUMN IF NOT EXISTS config_schemas JSON;
-
--- Comments for ag_skill_instance_t columns
-COMMENT ON COLUMN nexent.ag_skill_instance_t.config_values IS 'Per-agent runtime parameter values from config/config.yaml';
-COMMENT ON COLUMN nexent.ag_skill_instance_t.config_schemas IS 'Per-agent parameter schema overrides from config/schema.yaml';
-
--- Migration: ASSET_OWNER role permissions and invitation type comment
--- Date: 2026-05-29
--- Description: Add ASSET_OWNER role permissions, SU asset-owner invite permissions,
---              update invitation code_type comment, and ensure ag_skill_info_t.tenant_id exists
--- Source: commit 15cece97692db2372a978cbdf21b5d5316e79f30 (init.sql)
-
-SET search_path TO nexent;
-
-BEGIN;
-
-COMMENT ON COLUMN nexent.tenant_invitation_code_t.code_type IS
-    'Invitation code type: ADMIN_INVITE, DEV_INVITE, USER_INVITE, ASSET_OWNER_INVITE';
-
-INSERT INTO nexent.role_permission_t
-    (role_permission_id, user_role, permission_category, permission_type, permission_subtype)
-VALUES
-    (188, 'SU', 'RESOURCE', 'INVITE.ASSET_OWNER', 'CREATE'),
-    (189, 'SU', 'RESOURCE', 'INVITE.ASSET_OWNER', 'READ'),
-    (190, 'SU', 'RESOURCE', 'INVITE.ASSET_OWNER', 'UPDATE'),
-    (191, 'SU', 'RESOURCE', 'INVITE.ASSET_OWNER', 'DELETE'),
-    (192, 'ASSET_OWNER', 'VISIBILITY', 'LEFT_NAV_MENU', '/'),
-    (193, 'ASSET_OWNER', 'VISIBILITY', 'LEFT_NAV_MENU', '/agents'),
-    (194, 'ASSET_OWNER', 'VISIBILITY', 'LEFT_NAV_MENU', '/knowledges'),
-    (195, 'ASSET_OWNER', 'VISIBILITY', 'LEFT_NAV_MENU', '/chat'),
-    (196, 'ASSET_OWNER', 'VISIBILITY', 'LEFT_NAV_MENU', '/space'),
-    (197, 'ASSET_OWNER', 'VISIBILITY', 'LEFT_NAV_MENU', '/market'),
-    (198, 'ASSET_OWNER', 'VISIBILITY', 'LEFT_NAV_MENU', '/models'),
-    (199, 'ASSET_OWNER', 'RESOURCE', 'AGENT', 'CREATE'),
-    (200, 'ASSET_OWNER', 'RESOURCE', 'AGENT', 'READ'),
-    (201, 'ASSET_OWNER', 'RESOURCE', 'AGENT', 'UPDATE'),
-    (202, 'ASSET_OWNER', 'RESOURCE', 'AGENT', 'DELETE'),
-    (203, 'ASSET_OWNER', 'RESOURCE', 'SKILL', 'CREATE'),
-    (204, 'ASSET_OWNER', 'RESOURCE', 'SKILL', 'READ'),
-    (205, 'ASSET_OWNER', 'RESOURCE', 'SKILL', 'UPDATE'),
-    (206, 'ASSET_OWNER', 'RESOURCE', 'SKILL', 'DELETE'),
-    (207, 'ASSET_OWNER', 'RESOURCE', 'KB', 'CREATE'),
-    (208, 'ASSET_OWNER', 'RESOURCE', 'KB', 'READ'),
-    (209, 'ASSET_OWNER', 'RESOURCE', 'KB', 'UPDATE'),
-    (210, 'ASSET_OWNER', 'RESOURCE', 'KB', 'DELETE'),
-    (211, 'ASSET_OWNER', 'RESOURCE', 'MCP', 'CREATE'),
-    (212, 'ASSET_OWNER', 'RESOURCE', 'MCP', 'READ'),
-    (213, 'ASSET_OWNER', 'RESOURCE', 'MCP', 'UPDATE'),
-    (214, 'ASSET_OWNER', 'RESOURCE', 'MCP', 'DELETE'),
-    (215, 'ASSET_OWNER', 'RESOURCE', 'MODEL', 'CREATE'),
-    (216, 'ASSET_OWNER', 'RESOURCE', 'MODEL', 'READ'),
-    (217, 'ASSET_OWNER', 'RESOURCE', 'MODEL', 'UPDATE'),
-    (218, 'ASSET_OWNER', 'RESOURCE', 'MODEL', 'DELETE'),
-    (219, 'ASSET_OWNER', 'RESOURCE', 'USER.ROLE', 'READ'),
-    (220, 'ASSET_OWNER', 'VISIBILITY', 'LEFT_NAV_MENU', '/users'),
-    (221, 'SU', 'VISIBILITY', 'LEFT_NAV_MENU', '/asset-owner-resources')
-ON CONFLICT (role_permission_id) DO NOTHING;
-
-COMMIT;
-
--- Migration: Add preserve_source_file to knowledge_record_t table
--- Date: 2026-06-01
--- Description: Whether to preserve uploaded source documents after vectorization (default: true)
-
-ALTER TABLE nexent.knowledge_record_t
-ADD COLUMN IF NOT EXISTS preserve_source_file BOOLEAN NOT NULL DEFAULT true;
-
-COMMENT ON COLUMN nexent.knowledge_record_t.preserve_source_file IS 'Whether to preserve uploaded source documents after vectorization';
-
--- Migration: Add ag_agent_repository_t table
--- Date: 2026-06-05
--- Description: Agent marketplace repository for frozen shareable agent snapshots.
-
-SET search_path TO nexent;
-
-BEGIN;
-
-CREATE SEQUENCE IF NOT EXISTS nexent.ag_agent_repository_t_agent_repository_id_seq;
-
-CREATE TABLE IF NOT EXISTS nexent.ag_agent_repository_t (
-    agent_repository_id BIGINT NOT NULL DEFAULT nextval('nexent.ag_agent_repository_t_agent_repository_id_seq'),
-    publisher_tenant_id VARCHAR(100) NOT NULL,
-    publisher_user_id VARCHAR(100) NOT NULL,
-    agent_id INTEGER NOT NULL,
-    source_version_no INTEGER NOT NULL,
-    name VARCHAR(100) NOT NULL,
-    display_name VARCHAR(100),
-    description TEXT,
-    author VARCHAR(100),
-    category_id INTEGER,
-    tags TEXT[],
-    tool_count INTEGER,
-    version_label VARCHAR(100),
-    agent_info_json JSONB NOT NULL,
-    status VARCHAR(30) DEFAULT 'NOT_SHARED',
-    create_time TIMESTAMP WITHOUT TIME ZONE DEFAULT CURRENT_TIMESTAMP,
-    update_time TIMESTAMP WITHOUT TIME ZONE DEFAULT CURRENT_TIMESTAMP,
-    created_by VARCHAR(100),
-    updated_by VARCHAR(100),
-    delete_flag VARCHAR(1) DEFAULT 'N',
-    CONSTRAINT ag_agent_repository_t_pkey PRIMARY KEY (agent_repository_id)
-);
-
-ALTER SEQUENCE nexent.ag_agent_repository_t_agent_repository_id_seq
-    OWNED BY nexent.ag_agent_repository_t.agent_repository_id;
-
-ALTER TABLE nexent.ag_agent_repository_t OWNER TO root;
-
-COMMENT ON TABLE nexent.ag_agent_repository_t IS 'Agent marketplace repository for frozen shareable agent snapshots';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.agent_repository_id IS 'Agent repository listing ID, unique primary key';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.publisher_tenant_id IS 'Publisher tenant ID';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.publisher_user_id IS 'Publisher user ID';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.agent_id IS 'Root agent ID from ag_tenant_agent_t; upsert key with publisher_tenant_id';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.source_version_no IS 'Published version number frozen at share time';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.name IS 'Root agent programmatic name for display and search';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.display_name IS 'Root agent display name';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.description IS 'Root agent description';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.author IS 'Agent author';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.category_id IS 'Optional marketplace category ID';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.tags IS 'Marketplace tags';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.tool_count IS 'Total tool count across all agents in the bundle (display only)';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.version_label IS 'Repository entry version label for display (e.g. v1.0)';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.agent_info_json IS 'Frozen ExportAndImportDataFormat snapshot with optional skills';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.status IS 'Listing status: NOT_SHARED (未共享) / PENDING_REVIEW (待审核) / REJECTED (审核驳回) / SHARED (已共享)';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.create_time IS 'Creation time';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.update_time IS 'Update time';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.created_by IS 'Creator ID';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.updated_by IS 'Updater ID';
-COMMENT ON COLUMN nexent.ag_agent_repository_t.delete_flag IS 'Soft delete flag: Y/N';
-
-CREATE UNIQUE INDEX IF NOT EXISTS uq_agent_repository_tenant_agent_active
-    ON nexent.ag_agent_repository_t (publisher_tenant_id, agent_id)
-    WHERE delete_flag = 'N';
-
-CREATE INDEX IF NOT EXISTS idx_agent_repository_publisher_delete
-    ON nexent.ag_agent_repository_t (publisher_tenant_id, delete_flag);
-
-CREATE INDEX IF NOT EXISTS idx_agent_repository_status_delete
-    ON nexent.ag_agent_repository_t (status, delete_flag);
-
-CREATE INDEX IF NOT EXISTS idx_agent_repository_name_delete
-    ON nexent.ag_agent_repository_t (name, delete_flag);
-
-CREATE INDEX IF NOT EXISTS idx_agent_repository_tags_gin
-    ON nexent.ag_agent_repository_t USING GIN (tags);
-
-CREATE OR REPLACE FUNCTION update_ag_agent_repository_update_time()
-RETURNS TRIGGER AS $$
-BEGIN
-    NEW.update_time = CURRENT_TIMESTAMP;
-    RETURN NEW;
-END;
-$$ LANGUAGE plpgsql;
-
-COMMENT ON FUNCTION update_ag_agent_repository_update_time() IS 'Auto-update update_time for ag_agent_repository_t';
-
-DROP TRIGGER IF EXISTS update_ag_agent_repository_update_time_trigger ON nexent.ag_agent_repository_t;
-CREATE TRIGGER update_ag_agent_repository_update_time_trigger
-BEFORE UPDATE ON nexent.ag_agent_repository_t
-FOR EACH ROW
-EXECUTE FUNCTION update_ag_agent_repository_update_time();
-
-COMMENT ON TRIGGER update_ag_agent_repository_update_time_trigger ON nexent.ag_agent_repository_t IS 'Trigger to maintain update_time';
-
-COMMIT;
-
--- Migration: Add selected_agent_version_no to ag_agent_relation_t
--- Date: 2026-06-09
--- Description: Pin child agent version on parent-child relations at publish time.
-
-SET search_path TO nexent;
-
-BEGIN;
-
-ALTER TABLE nexent.ag_agent_relation_t
-    ADD COLUMN IF NOT EXISTS selected_agent_version_no INTEGER;
-
-COMMENT ON COLUMN nexent.ag_agent_relation_t.selected_agent_version_no IS
-    'Pinned version of selected_agent_id. NULL = use child current published version at runtime (legacy/draft).';
-
-COMMIT;
diff --git a/k8s/helm/nexent/charts/nexent-common/templates/configmap.yaml b/k8s/helm/nexent/charts/nexent-common/templates/configmap.yaml
index 0f1a4a5a3..1b473b633 100644
--- a/k8s/helm/nexent/charts/nexent-common/templates/configmap.yaml
+++ b/k8s/helm/nexent/charts/nexent-common/templates/configmap.yaml
@@ -166,23 +166,3 @@ data:
   OAUTH_SSL_VERIFY: {{ .Values.config.oauth.sslVerify | quote }}
   OAUTH_CA_BUNDLE: {{ .Values.config.oauth.caBundle | quote }}
   OAUTH_CALLBACK_BASE_URL: {{ .Values.config.oauth.callbackBaseUrl | quote }}
-
-  # ===== CAS SSO Configuration =====
-  CAS_ENABLED: {{ .Values.config.cas.enabled | quote }}
-  CAS_SERVER_URL: {{ .Values.config.cas.serverUrl | quote }}
-  CAS_VALIDATE_PATH: {{ .Values.config.cas.validatePath | quote }}
-  CAS_CALLBACK_BASE_URL: {{ .Values.config.cas.callbackBaseUrl | quote }}
-  CAS_LOGIN_MODE: {{ .Values.config.cas.loginMode | quote }}
-  CAS_USER_ATTRIBUTE: {{ .Values.config.cas.userAttribute | quote }}
-  CAS_EMAIL_ATTRIBUTE: {{ .Values.config.cas.emailAttribute | quote }}
-  CAS_ROLE_ATTRIBUTE: {{ .Values.config.cas.roleAttribute | quote }}
-  CAS_TENANT_ATTRIBUTE: {{ .Values.config.cas.tenantAttribute | quote }}
-  CAS_ROLE_MAP_JSON: {{ .Values.config.cas.roleMapJson | quote }}
-  CAS_SESSION_MAX_AGE_SECONDS: {{ .Values.config.cas.sessionMaxAgeSeconds | quote }}
-  LOCAL_SESSION_MAX_AGE_SECONDS: {{ .Values.config.cas.localSessionMaxAgeSeconds | quote }}
-  CAS_RENEW_BEFORE_SECONDS: {{ .Values.config.cas.renewBeforeSeconds | quote }}
-  CAS_RENEW_TIMEOUT_SECONDS: {{ .Values.config.cas.renewTimeoutSeconds | quote }}
-  CAS_SYNTHETIC_EMAIL_DOMAIN: {{ .Values.config.cas.syntheticEmailDomain | quote }}
-  CAS_LOGOUT_URL: {{ .Values.config.cas.logoutUrl | quote }}
-  CAS_SSL_VERIFY: {{ .Values.config.cas.sslVerify | quote }}
-  CAS_CA_BUNDLE: {{ .Values.config.cas.caBundle | quote }}
diff --git a/k8s/helm/nexent/charts/nexent-common/values.yaml b/k8s/helm/nexent/charts/nexent-common/values.yaml
index 7b27ba302..788ae7290 100644
--- a/k8s/helm/nexent/charts/nexent-common/values.yaml
+++ b/k8s/helm/nexent/charts/nexent-common/values.yaml
@@ -139,29 +139,6 @@ config:
     sslVerify: "true"
     caBundle: ""
     callbackBaseUrl: "http://localhost:30000"
-  cas:
-    enabled: "false"
-    serverUrl: ""
-    validatePath: "/p3/serviceValidate"
-    callbackBaseUrl: "http://localhost:30000"
-    # Supported values:
-    # - disabled: disable CAS login entry and automatic CAS redirects.
-    # - button: show CAS as an optional login entry.
-    # - force: automatically redirect unauthenticated users to CAS login.
-    loginMode: "disabled"
-    userAttribute: ""
-    emailAttribute: "email"
-    roleAttribute: "role"
-    tenantAttribute: "tenant_id"
-    roleMapJson: ""
-    sessionMaxAgeSeconds: "3600"
-    localSessionMaxAgeSeconds: "3600"
-    renewBeforeSeconds: "300"
-    renewTimeoutSeconds: "10"
-    syntheticEmailDomain: "cas.local"
-    logoutUrl: ""
-    sslVerify: "true"
-    caBundle: ""
 
 # Secrets used by common templates
 secrets:
diff --git a/k8s/helm/nexent/charts/nexent-data-process/values.yaml b/k8s/helm/nexent/charts/nexent-data-process/values.yaml
index d6bb70a7f..189292667 100644
--- a/k8s/helm/nexent/charts/nexent-data-process/values.yaml
+++ b/k8s/helm/nexent/charts/nexent-data-process/values.yaml
@@ -12,7 +12,7 @@ resources:
       memory: 512Mi
       cpu: 0.5
     limits:
-      memory: 64Gi
+      memory: 4Gi
       cpu: 8
 
 config:
diff --git a/k8s/helm/nexent/values.yaml b/k8s/helm/nexent/values.yaml
index 6224d0949..ce5bc454a 100644
--- a/k8s/helm/nexent/values.yaml
+++ b/k8s/helm/nexent/values.yaml
@@ -40,33 +40,6 @@ global:
 
 # Optional monitoring stack. Set provider to one of:
 # otlp, phoenix, langfuse, langsmith, grafana, zipkin.
-nexent-common:
-  # Shared ConfigMap values rendered into the Kubernetes nexent-config ConfigMap.
-  config:
-    cas:
-      enabled: "false"
-      serverUrl: ""
-      validatePath: "/p3/serviceValidate"
-      callbackBaseUrl: "http://localhost:30000"
-      # Supported values:
-      # - disabled: disable CAS login entry and automatic CAS redirects.
-      # - button: show CAS as an optional login entry.
-      # - force: automatically redirect unauthenticated users to CAS login.
-      loginMode: "disabled"
-      userAttribute: ""
-      emailAttribute: "email"
-      roleAttribute: "role"
-      tenantAttribute: "tenant_id"
-      roleMapJson: ""
-      sessionMaxAgeSeconds: "3600"
-      localSessionMaxAgeSeconds: "3600"
-      renewBeforeSeconds: "300"
-      renewTimeoutSeconds: "10"
-      syntheticEmailDomain: "cas.local"
-      logoutUrl: ""
-      sslVerify: "true"
-      caBundle: ""
-
 nexent-elasticsearch:
   enabled: true
 nexent-postgresql:
diff --git a/make/data_process/Dockerfile b/make/data_process/Dockerfile
index 998e2352a..8d9a8a723 100644
--- a/make/data_process/Dockerfile
+++ b/make/data_process/Dockerfile
@@ -1,4 +1,4 @@
-FROM python:3.11-slim
+FROM python:3.10-slim
 ARG MIRROR
 ARG APT_MIRROR
 LABEL authors="nexent"
@@ -45,12 +45,11 @@ RUN uv sync --no-cache-dir --extra data-process $(test -n "$MIRROR" && echo "-i
     uv cache clean
 # Layer 2: install sdk in link mode
 COPY sdk /opt/sdk
-RUN uv pip install --no-cache-dir "/opt/sdk[performance]" $(test -n "$MIRROR" && echo "-i $MIRROR") && \
+RUN uv pip install --no-cache-dir /opt/sdk $(test -n "$MIRROR" && echo "-i $MIRROR") && \
     uv cache clean
 
 # Pre-download tiktoken cl100k_base model to avoid network issues during runtime
 RUN uv run python -c "import tiktoken; enc = tiktoken.get_encoding('cl100k_base')"
-
 # Layer 3: copy backend code
 COPY backend /opt/backend
 
diff --git a/make/main/Dockerfile b/make/main/Dockerfile
index 0e32b04b7..0f4027619 100644
--- a/make/main/Dockerfile
+++ b/make/main/Dockerfile
@@ -1,4 +1,4 @@
-FROM python:3.11-slim
+FROM python:3.10-slim
 ARG MIRROR
 ARG APT_MIRROR
 LABEL authors="nexent"
diff --git a/make/mcp/Dockerfile b/make/mcp/Dockerfile
index e011bf5fe..03cb3f1c3 100644
--- a/make/mcp/Dockerfile
+++ b/make/mcp/Dockerfile
@@ -1,4 +1,4 @@
-FROM python:3.11-slim
+FROM python:3.10-slim
 
 ARG MIRROR
 ARG APT_MIRROR
@@ -38,7 +38,7 @@ RUN if [ -n "$MCP_PROXY_VERSION" ]; then \
 
 # Install Node.js 20 from official binaries (pin exact version to avoid repo issues)
 ARG NODE_VERSION=20.17.0
-RUN set -eu && \
+RUN set -euo pipefail && \
     arch="$(dpkg --print-architecture)" && \
     case "${arch}" in \
         amd64) node_arch="x64" ;; \
diff --git a/scripts/deployment/common.sh b/scripts/deployment/common.sh
index 006561553..5855af1a0 100755
--- a/scripts/deployment/common.sh
+++ b/scripts/deployment/common.sh
@@ -319,6 +319,11 @@ deployment_validate() {
     deployment_error "Local config schemaVersion $DEPLOYMENT_LOADED_SCHEMA_VERSION is incompatible with $DEPLOYMENT_SCHEMA_VERSION. Re-run with --reconfigure."
     return 1
   fi
+  if [ -n "$DEPLOYMENT_LOADED_APP_VERSION" ] && [ -n "${APP_VERSION:-}" ] && [ -z "${DEPLOYMENT_APP_VERSION_EXPLICIT:-}" ] && [ "$DEPLOYMENT_LOADED_APP_VERSION" != "$APP_VERSION" ]; then
+    deployment_error "Local config appVersion $DEPLOYMENT_LOADED_APP_VERSION does not match current appVersion $APP_VERSION. Re-run with --reconfigure or pass --app-version."
+    return 1
+  fi
+
   local old_ifs="$IFS"
   local component
   IFS=','
diff --git a/scripts/offline/build_offline_package.sh b/scripts/offline/build_offline_package.sh
index ff2141c83..f69eaea80 100755
--- a/scripts/offline/build_offline_package.sh
+++ b/scripts/offline/build_offline_package.sh
@@ -4,6 +4,7 @@ set -e
 
 SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
 PROJECT_ROOT="$(cd "$SCRIPT_DIR/../.." && pwd)"
+DEPLOYMENT_COMMON="$PROJECT_ROOT/scripts/deployment/common.sh"
 
 DEFAULT_VERSION="latest"
 DEFAULT_PLATFORM="amd64"
@@ -14,6 +15,16 @@ VERSION=""
 PLATFORM=""
 OUTPUT_DIR=""
 INCLUDE_SOURCE=""
+DRY_RUN="false"
+COMMON_ARGS=()
+
+if [ -f "$DEPLOYMENT_COMMON" ]; then
+  # shellcheck source=/dev/null
+  source "$DEPLOYMENT_COMMON"
+else
+  echo "Error: shared deployment helper not found: $DEPLOYMENT_COMMON"
+  exit 1
+fi
 
 show_help() {
   echo "Usage: $0 [OPTIONS]"
@@ -29,6 +40,10 @@ show_help() {
   echo "                           Default: $DEFAULT_OUTPUT_DIR"
   echo "  --include-source BOOL   Include source code (true or false)"
   echo "                           Default: $DEFAULT_INCLUDE_SOURCE"
+  echo "  --components LIST       Deployment components for image selection"
+  echo "  --image-source SOURCE   general, mainland, or local-latest"
+  echo "  --registry-profile NAME Legacy alias for --image-source general|mainland"
+  echo "  --config FILE           Deployment config with components and image source"
   echo "  --dry-run               Show execution plan without actual operations"
   echo "  --help                  Show this help message"
   echo ""
@@ -60,7 +75,15 @@ parse_args() {
         shift 2
         ;;
       --dry-run)
-        dry_run=true
+        DRY_RUN="true"
+        shift
+        ;;
+      --components|--image-source|--registry-profile|--app-version|--monitoring-provider|--port-policy|--config|--local-config)
+        COMMON_ARGS+=("$1" "$2")
+        shift 2
+        ;;
+      --use-local-config|--reconfigure)
+        COMMON_ARGS+=("$1")
         shift
         ;;
       --help)
@@ -84,13 +107,32 @@ parse_args() {
     echo "Error: Platform must be 'amd64' or 'arm64'"
     exit 1
   fi
+}
 
-  if [[ "$dry_run" == "true" ]]; then
+prepare_deployment_image_config() {
+  # Hand the forwarded common options and the package version to the shared helper.
+  export APP_VERSION="$VERSION"
+  deployment_prepare_config "${COMMON_ARGS[@]}" --app-version "$VERSION" || exit 1
+  local profile_env_file=""
+  case "$DEPLOYMENT_REGISTRY_PROFILE" in
+    mainland) profile_env_file="$PROJECT_ROOT/docker/.env.mainland" ;;
+    general|local-latest) profile_env_file="$PROJECT_ROOT/docker/.env.general" ;;
+  esac
+  # Source the profile's env file only when it exists; other profiles load nothing.
+  if [ -n "$profile_env_file" ] && [ -f "$profile_env_file" ]; then
+    source "$profile_env_file"
+  fi
+  deployment_apply_image_source
+}
+
+show_dry_run_plan() {
     echo "=== DRY RUN MODE ==="
     echo "Version: $VERSION"
     echo "Platform: $PLATFORM"
     echo "Output directory: $OUTPUT_DIR"
     echo "Include source: $INCLUDE_SOURCE"
+    echo "Components: $DEPLOYMENT_COMPONENTS"
+    echo "Image source: $DEPLOYMENT_IMAGE_SOURCE"
     echo ""
     echo "Images to pull:"
     get_nexent_images
@@ -98,38 +140,49 @@ parse_args() {
     echo ""
     echo "No actual operations will be performed."
     exit 0
-  fi
 }
 
 get_nexent_images() {
-  local version_tag="$VERSION"
-
-  local nexent_images=(
-    "nexent/nexent:${version_tag}"
-    "nexent/nexent-web:${version_tag}"
-    "nexent/nexent-data-process:${version_tag}"
-    "nexent/nexent-mcp:${version_tag}"
-  )
-
-  for img in "${nexent_images[@]}"; do
-    echo "$img"
-  done
+  # Print one image reference per line for every selected Nexent component.
+  deployment_csv_contains "$DEPLOYMENT_COMPONENTS" "application" &&
+    printf '%s\n' "$NEXENT_IMAGE" "$NEXENT_WEB_IMAGE" "$NEXENT_MCP_DOCKER_IMAGE"
+  deployment_csv_contains "$DEPLOYMENT_COMPONENTS" "data-process" && echo "$NEXENT_DATA_PROCESS_IMAGE"
+  deployment_csv_contains "$DEPLOYMENT_COMPONENTS" "terminal" && echo "$OPENSSH_SERVER_IMAGE"
+  true  # the && lists above may end non-zero; keep the function's status 0
 }
 
 get_third_party_images() {
-  local third_party_images=(
-    "docker.elastic.co/elasticsearch/elasticsearch:8.17.4"
-    "docker.io/library/postgres:15-alpine"
-    "docker.io/library/redis:alpine"
-    "quay.io/minio/minio:RELEASE.2023-12-20T01-00-02Z"
-    "docker.io/library/kong:2.8.1"
-    "docker.io/supabase/gotrue:v2.170.0"
-    "docker.io/supabase/postgres:15.8.1.060"
-  )
-
-  for img in "${third_party_images[@]}"; do
-    echo "$img"
-  done
+  # Print one third-party image reference per line for each selected component.
+  local components="$DEPLOYMENT_COMPONENTS"
+
+  # Infrastructure component: Elasticsearch, PostgreSQL, Redis and MinIO images.
+  if deployment_csv_contains "$components" "infrastructure"; then
+    printf '%s\n' "$ELASTICSEARCH_IMAGE" "$POSTGRESQL_IMAGE" "$REDIS_IMAGE" "$MINIO_IMAGE"
+  fi
+
+  # Supabase component.
+  if deployment_csv_contains "$components" "supabase"; then
+    printf '%s\n' "$SUPABASE_KONG" "$SUPABASE_GOTRUE" "$SUPABASE_DB"
+  fi
+
+  # Monitoring component: the collector is always listed; the selected
+  # provider may add images of its own (providers without a branch add none).
+  if deployment_csv_contains "$components" "monitoring"; then
+    echo "otel/opentelemetry-collector-contrib:0.151.0"
+    case "$DEPLOYMENT_MONITORING_PROVIDER" in
+      phoenix) echo "arizephoenix/phoenix:15" ;;
+      grafana) printf '%s\n' "grafana/tempo:2.10.5" "grafana/grafana:12.4" ;;
+      zipkin) echo "openzipkin/zipkin:latest" ;;
+      langfuse)
+        printf '%s\n' \
+          "docker.io/langfuse/langfuse-worker:3" "docker.io/langfuse/langfuse:3" \
+          "docker.io/clickhouse/clickhouse-server:26.3-alpine" \
+          "docker.io/minio/minio:RELEASE.2023-12-20T01-00-02Z" \
+          "docker.io/redis:alpine" "docker.io/postgres:15-alpine"
+        ;;
+    esac
+  fi
+  true
 }
 
 pull_with_retry() {
@@ -362,6 +415,11 @@ LOADSCRIPT
 
 main() {
   parse_args "$@"
+  prepare_deployment_image_config
+
+  if [[ "$DRY_RUN" == "true" ]]; then
+    show_dry_run_plan
+  fi
 
   echo ""
   echo "========================================"
@@ -371,6 +429,8 @@ main() {
   echo "Platform: $PLATFORM"
   echo "Output directory: $OUTPUT_DIR"
   echo "Include source: $INCLUDE_SOURCE"
+  echo "Components: $DEPLOYMENT_COMPONENTS"
+  echo "Image source: $DEPLOYMENT_IMAGE_SOURCE"
   echo "========================================"
 
   rm -rf "$OUTPUT_DIR"
diff --git a/sdk/nexent/__init__.py b/sdk/nexent/__init__.py
index d0de150cb..781fcf495 100644
--- a/sdk/nexent/__init__.py
+++ b/sdk/nexent/__init__.py
@@ -3,7 +3,8 @@
 from .memory import *
 from .storage import *
 from .vector_database import *
+from .container import *
 from .skills import *
 
 
-__all__ = ["core", "memory", "storage", "vector_database", "datamate", "skills"]
+__all__ = ["core", "memory", "storage", "vector_database", "container", "datamate", "skills"]
diff --git a/sdk/nexent/container/docker_client.py b/sdk/nexent/container/docker_client.py
index 80aa6f8c3..166d27b49 100644
--- a/sdk/nexent/container/docker_client.py
+++ b/sdk/nexent/container/docker_client.py
@@ -11,34 +11,12 @@
 
 import docker
 from docker.errors import APIError, DockerException, NotFound
+from fastmcp import Client
+from fastmcp.client.transports import StreamableHttpTransport, SSETransport
 
 from .container_client_base import ContainerClient, ContainerConfig
 from .docker_config import DockerContainerConfig
 
-Client = None
-StreamableHttpTransport = None
-SSETransport = None
-
-
-def _ensure_fastmcp_imports() -> tuple[type, type, type]:
-    global Client, StreamableHttpTransport, SSETransport
-
-    if Client is None:
-        from fastmcp import Client as FastMCPClient
-
-        Client = FastMCPClient
-
-    if StreamableHttpTransport is None or SSETransport is None:
-        from fastmcp.client.transports import (
-            StreamableHttpTransport as FastMCPStreamableHttpTransport,
-            SSETransport as FastMCPSSETransport,
-        )
-
-        StreamableHttpTransport = FastMCPStreamableHttpTransport
-        SSETransport = FastMCPSSETransport
-
-    return Client, StreamableHttpTransport, SSETransport
-
 logger = logging.getLogger("nexent.container.docker")
 
 
@@ -57,7 +35,7 @@ class ContainerConnectionError(Exception):
 class DockerContainerClient(ContainerClient):
     """Docker container client implementation"""
 
-    DEFAULT_NETWORK_NAME = "nexent_network"
+    DEFAULT_NETWORK_NAME = "nexent_nexent"
 
     def __init__(self, config: DockerContainerConfig):
         """
@@ -403,8 +381,6 @@ async def _wait_for_service_ready(
         Raises:
             ContainerConnectionError: If service is not ready after max retries
         """
-        client_cls, streamable_http_transport_cls, sse_transport_cls = _ensure_fastmcp_imports()
-
         for i in range(max_retries):
             try:
                 # Select transport based on URL ending and set headers
@@ -412,23 +388,23 @@ async def _wait_for_service_ready(
                 headers = {"Authorization": authorization_token} if authorization_token else {}
 
                 if url_stripped.endswith("/sse"):
-                    transport = sse_transport_cls(
+                    transport = SSETransport(
                         url=url_stripped,
                         headers=headers
                     )
                 elif url_stripped.endswith("/mcp"):
-                    transport = streamable_http_transport_cls(
+                    transport = StreamableHttpTransport(
                         url=url_stripped,
                         headers=headers
                     )
                 else:
                     # Default to StreamableHttpTransport for unrecognized formats
-                    transport = streamable_http_transport_cls(
+                    transport = StreamableHttpTransport(
                         url=url_stripped,
                         headers=headers
                     )
 
-                client = client_cls(transport=transport)
+                client = Client(transport=transport)
                 async with client:
                     if client.is_connected():
                         logger.info(f"Service ready at {url}")
diff --git a/sdk/nexent/container/k8s_client.py b/sdk/nexent/container/k8s_client.py
index c2fb72741..c1fa4db53 100644
--- a/sdk/nexent/container/k8s_client.py
+++ b/sdk/nexent/container/k8s_client.py
@@ -8,7 +8,6 @@
 import asyncio
 import logging
 import socket
-import re
 import uuid
 
 import kubernetes
@@ -24,47 +23,6 @@
 
 logger = logging.getLogger("nexent.container.kubernetes")
 
-# Kubernetes naming constraints: lowercase alphanumeric or dash, cannot start/end with dash,
-# cannot have consecutive dashes, max 253 characters
-K8S_NAME_PATTERN = re.compile(r"[^a-z0-9-]+")
-K8S_CONSECUTIVE_DASHES = re.compile(r"-+")
-
-
-def _sanitize_k8s_name(name: str) -> str:
-    """Convert arbitrary string to valid Kubernetes resource name.
-
-    Rules:
-    - Convert to lowercase
-    - Replace invalid characters with dash
-    - Collapse consecutive dashes
-    - Remove leading/trailing dashes
-    - Must start with alphanumeric
-
-    Args:
-        name: Input string to sanitize
-
-    Returns:
-        Valid Kubernetes name (lowercase alphanumeric and dashes only)
-    """
-    if not name:
-        return "unknown"
-
-    # Lowercase and replace invalid chars with dash
-    sanitized = K8S_NAME_PATTERN.sub("-", name.lower())
-
-    # Collapse consecutive dashes
-    sanitized = K8S_CONSECUTIVE_DASHES.sub("-", sanitized)
-
-    # Remove leading/trailing dashes
-    sanitized = sanitized.strip("-")
-
-    # Ensure it starts with alphanumeric
-    if sanitized and not sanitized[0].isalnum():
-        sanitized = "x" + sanitized
-
-    # Fallback if empty
-    return sanitized if sanitized else "unknown"
-
 
 class ContainerError(Exception):
     """Raised when container operation fails"""
@@ -119,9 +77,9 @@ def __init__(self, config: KubernetesContainerConfig):
 
     def _generate_pod_name(self, service_name: str, tenant_id: str, user_id: str) -> str:
         """Generate unique pod name with service, tenant, and user segments."""
-        safe_name = _sanitize_k8s_name(service_name)
-        tenant_part = _sanitize_k8s_name(tenant_id)[:8]
-        user_part = _sanitize_k8s_name(user_id)[:8]
+        def _dns_safe(value):  # Kubernetes names allow only lowercase [a-z0-9-]; map everything else to "-"
+            return "".join(c if c.isascii() and c.isalnum() else "-" for c in (value or "").lower())
+        safe_name, tenant_part, user_part = _dns_safe(service_name), _dns_safe(tenant_id)[:8], _dns_safe(user_id)[:8]
         uuid_part = uuid.uuid4().hex[:8]
         return f"mcp-{safe_name}-{tenant_part}-{user_part}-{uuid_part}"
 
@@ -528,7 +486,7 @@ def list_containers(
 
                 # Filter by service_name if provided
                 if service_name:
-                    safe_name = _sanitize_k8s_name(service_name)
+                    safe_name = "".join(c if c.isalnum() or c == "-" else "-" for c in service_name)
                     pod_component = labels.get(self.LABEL_COMPONENT, "")
                     if safe_name not in pod_component:
                         continue
diff --git a/sdk/nexent/core/agents/agent_model.py b/sdk/nexent/core/agents/agent_model.py
index 62e75cb59..82fb81167 100644
--- a/sdk/nexent/core/agents/agent_model.py
+++ b/sdk/nexent/core/agents/agent_model.py
@@ -75,67 +75,6 @@ class ToolConfig(BaseModel):
     usage: Optional[str] = Field(description="MCP server name", default=None)
     metadata: Optional[Dict[str, Any]] = Field(description="Metadata", default=None)
 
-
-VerificationEvent = Literal[
-    "tool_precheck",
-    "tool_result",
-    "retrieval",
-    "code_execution",
-    "handoff",
-    "final_answer",
-]
-VerificationStrictness = Literal["lenient", "balanced", "strict"]
-VerificationFailPolicy = Literal["repair_then_controlled_summary", "warn"]
-
-
-class AgentVerificationConfig(BaseModel):
-    """Configuration for layered ReAct self-verification."""
-
-    enabled: bool = Field(description="Whether self-verification is enabled", default=True)
-    step_verification_enabled: bool = Field(
-        description="Whether to verify critical ReAct step events",
-        default=True,
-    )
-    final_verification_enabled: bool = Field(
-        description="Whether to verify final answer candidates before returning them",
-        default=True,
-    )
-    llm_verification_enabled: bool = Field(
-        description="Whether to use the LLM as a final-answer verifier after deterministic checks",
-        default=True,
-    )
-    max_final_rounds: int = Field(
-        description="Maximum number of final-answer verification attempts",
-        default=2,
-        ge=1,
-        le=5,
-    )
-    strictness: VerificationStrictness = Field(
-        description="Verification strictness profile",
-        default="balanced",
-    )
-    fail_policy: VerificationFailPolicy = Field(
-        description="Policy when final verification still fails after repair attempts",
-        default="repair_then_controlled_summary",
-    )
-    pass_score: float = Field(
-        description="Minimum verifier score for final answers",
-        default=0.75,
-        ge=0.0,
-        le=1.0,
-    )
-    critical_events: List[VerificationEvent] = Field(
-        description="Critical ReAct events that should be verified",
-        default_factory=lambda: [
-            "tool_precheck",
-            "tool_result",
-            "retrieval",
-            "code_execution",
-            "handoff",
-            "final_answer",
-        ],
-    )
-
 class AgentConfig(BaseModel):
     name: str = Field(description="Agent name")
     description: str = Field(description="Agent description")
@@ -161,10 +100,6 @@ class AgentConfig(BaseModel):
         description="Pre-built context components for system prompt assembly",
         default=None
     )
-    verification_config: AgentVerificationConfig = Field(
-        description="Layered ReAct self-verification configuration",
-        default_factory=AgentVerificationConfig,
-    )
 
 
 class AgentHistory(BaseModel):
diff --git a/sdk/nexent/core/agents/core_agent.py b/sdk/nexent/core/agents/core_agent.py
index 9397b2bfa..e029f012e 100644
--- a/sdk/nexent/core/agents/core_agent.py
+++ b/sdk/nexent/core/agents/core_agent.py
@@ -2,7 +2,6 @@
 import ast
 import time
 import threading
-from datetime import datetime
 from textwrap import dedent
 from typing import Any, Optional, List, Dict
 from collections.abc import Generator
@@ -28,8 +27,6 @@
     import PIL.Image
 
 from .agent_context import ContextManager
-from .agent_model import AgentVerificationConfig
-from .verification import VerificationController, VerificationResult
 from ..utils.token_estimation import msg_token_count
 
 def parse_code_blobs(text: str) -> str:
@@ -215,24 +212,9 @@ def _build_final_answer_messages(task: str, agent_prompt_templates: Dict[str, An
 
 
 class CoreAgent(CodeAgent):
-    def __init__(
-        self,
-        observer: MessageObserver,
-        prompt_templates: Dict[str, Any] | None = None,
-        verification_config: AgentVerificationConfig | None = None,
-        *args,
-        **kwargs
-    ):
+    def __init__(self, observer: MessageObserver, prompt_templates: Dict[str, Any] | None = None, *args, **kwargs):
         super().__init__(prompt_templates=prompt_templates, *args, **kwargs)
         self.observer = observer
-        self.verification_config = verification_config or AgentVerificationConfig(enabled=False)
-        self.verification_controller = VerificationController(
-            config=self.verification_config,
-            observer=observer,
-            agent_name=self.agent_name,
-            model=self.model,
-            logger=self.logger,
-        )
         self.stop_event = threading.Event()
         self._history_step_count = 0  # For ContextManager, record boundary for compression
         self.context_manager: ContextManager = None
@@ -244,78 +226,6 @@ def __init__(
         # identifiers; omitting "python" and "py" ensures ```python blocks are not extracted.
         self.code_block_tags = ["", ""]
 
-    def _verification_tool_names(self) -> List[str]:
-        names = set()
-        for container in (getattr(self, "tools", {}) or {}, getattr(self, "managed_agents", {}) or {}):
-            try:
-                names.update(str(name) for name in container.keys())
-            except AttributeError:
-                continue
-        names.add("final_answer")
-        return sorted(names)
-
-    def _append_verification_feedback(self, action_step: ActionStep, result: VerificationResult) -> None:
-        feedback = self.verification_controller.build_feedback_observation(result)
-        if action_step.observations:
-            action_step.observations += feedback
-        else:
-            action_step.observations = feedback
-
-    def _build_verification_memory_summary(
-        self,
-        current_step: ActionStep | None = None,
-        max_chars: int = 8000,
-    ) -> str:
-        summaries = []
-        steps = list(self.memory.steps[-8:])
-        if current_step is not None:
-            steps.append(current_step)
-        for step in steps:
-            if isinstance(step, TaskStep):
-                summaries.append(f"Task: {truncate_content(str(step.task), max_length=1200)}")
-            elif isinstance(step, ActionStep):
-                code = truncate_content(str(getattr(step, "code_action", "") or ""), max_length=1200)
-                observations = truncate_content(str(getattr(step, "observations", "") or ""), max_length=1800)
-                output = truncate_content(str(getattr(step, "action_output", "") or ""), max_length=1200)
-                summaries.append(
-                    f"Step {getattr(step, 'step_number', '?')}:\n"
-                    f"Code: {code}\n"
-                    f"Observation: {observations}\n"
-                    f"Output: {output}"
-                )
-        return truncate_content("\n\n".join(summaries), max_length=max_chars)
-
-    def _finalize_failed_verification_candidate(
-        self,
-        action_step: ActionStep,
-        verification_result: VerificationResult,
-        verification_round: int,
-        max_rounds: int,
-        candidate_answer: Any,
-    ) -> tuple[bool, Any]:
-        if verification_round < max_rounds:
-            verification_result.phase = "repair"
-            self.verification_controller.emit(
-                verification_result,
-                verification_round,
-            )
-            self._append_verification_feedback(action_step, verification_result)
-            action_step.is_final_answer = False
-            return False, None
-
-        verification_result.phase = "final_fail"
-        self.verification_controller.emit(
-            verification_result,
-            verification_round,
-        )
-        controlled_answer = self.verification_controller.build_controlled_failure_answer(
-            candidate_answer,
-            verification_result,
-        )
-        action_step.is_final_answer = True
-        action_step.action_output = controlled_answer
-        return True, controlled_answer
-
     def _log_model_call_parameters(self, input_messages: List[ChatMessage], stop_sequences: List[str], additional_args: Dict[str, Any]) -> None:
         """
         Log model call parameters with content truncation for readability.
@@ -438,22 +348,7 @@ def _step_stream(self, memory_step: ActionStep) -> Generator[Any]:
             # Record parsing results
             self.observer.add_message(
                 self.agent_name, ProcessType.PARSE, code_action)
-            verification_controller = getattr(self, "verification_controller", None)
-            if verification_controller:
-                precheck = verification_controller.verify_before_tool_call(
-                    code_action=code_action,
-                    step_number=memory_step.step_number,
-                    available_tool_names=self._verification_tool_names(),
-                )
-                if not precheck.passed and precheck.severity == "blocking":
-                    self._append_verification_feedback(memory_step, precheck)
-                    raise AgentExecutionError(
-                        precheck.repair_instruction or precheck.user_visible_note or "Action failed verification.",
-                        self.logger,
-                    )
 
-        except AgentExecutionError:
-            raise
         except Exception:
             self.logger.log_markdown(
                 content=model_output, title="AGENT FINAL ANSWER", level=LogLevel.INFO)
@@ -519,7 +414,7 @@ def _step_stream(self, memory_step: ActionStep) -> Generator[Any]:
             error_msg = str(e)
             self.logger.log(
                 f"[Code Execution] step={memory_step.step_number} failed after {exec_duration_ms:.1f}ms: {error_msg}",
-                level=LogLevel.ERROR,
+                level=LogLevel.WARNING,
             )
             raise AgentExecutionError(error_msg, self.logger)
 
@@ -535,23 +430,6 @@ def _step_stream(self, memory_step: ActionStep) -> Generator[Any]:
             observation += "Last output from code snippet:\n" + truncated_output
         memory_step.observations = observation
 
-        verification_controller = getattr(self, "verification_controller", None)
-        if verification_controller:
-            postcheck = verification_controller.verify_after_tool_call(
-                code_action=code_action,
-                observation=memory_step.observations,
-                step_number=memory_step.step_number,
-                is_final_answer=bool(code_output.is_final_answer),
-            )
-            if not postcheck.passed and postcheck.severity == "blocking":
-                self._append_verification_feedback(memory_step, postcheck)
-                raise AgentExecutionError(
-                    postcheck.repair_instruction or postcheck.user_visible_note or "Action result failed verification.",
-                    self.logger,
-                )
-            if postcheck.severity == "warning":
-                self._append_verification_feedback(memory_step, postcheck)
-
         # Pre-truncate observations when ContextManager is enabled. Keeps the
         # head + tail of long outputs around a truncation marker so downstream
         # compression sees bounded-length step records and the model can still
@@ -600,11 +478,7 @@ def run(self, task: str, stream: bool = False, reset: bool = True, images: Optio
         ```
         """
         max_steps = max_steps or self.max_steps
-        # Prepend current time to the user task instead of baking it into the
-        # system prompt. This keeps the system prefix stable so prompt/KV caches
-        # can hit across requests; only the trailing user message varies.
-        time_str = datetime.now().strftime("%Y-%m-%d %H:%M:%S")
-        self.task = f"[Current time: {time_str}]\n\n{task}"
+        self.task = task
         if additional_args is not None:
             self.state.update(additional_args)
             self.task += f"""
@@ -723,17 +597,6 @@ def _run_stream(
         action_step = None
         self.step_number = 1
         returned_final_answer = False
-        final_verification_round = 0
-        verification_config = getattr(
-            self,
-            "verification_config",
-            AgentVerificationConfig(enabled=False),
-        )
-        max_final_verification_rounds = (
-            verification_config.max_final_rounds
-            if verification_config and verification_config.enabled
-            else 1
-        )
         while not returned_final_answer and self.step_number <= max_steps and not self.stop_event.is_set():
             step_start_time = time.time()
 
@@ -745,73 +608,24 @@ def _run_stream(
                     yield output
 
                 if isinstance(output, ActionOutput) and output.is_final_answer:
-                    candidate_answer = output.output
+                    final_answer = output.output
                     self.logger.log(
-                        Text(f"Final answer: {candidate_answer}", style=f"bold {YELLOW_HEX}"),
+                        Text(f"Final answer: {final_answer}", style=f"bold {YELLOW_HEX}"),
                         level=LogLevel.INFO,
                     )
 
-                    if verification_config.enabled and verification_config.final_verification_enabled:
-                        final_verification_round += 1
-                        verification_result = self.verification_controller.verify_final_answer(
-                            task=task,
-                            candidate=candidate_answer,
-                            memory_summary=self._build_verification_memory_summary(action_step),
-                            round_number=final_verification_round,
-                        )
-                        if verification_result.passed:
-                            final_answer = candidate_answer
-                            if self.final_answer_checks:
-                                self._validate_final_answer(final_answer)
-                            returned_final_answer = True
-                            action_step.is_final_answer = True
-                        else:
-                            returned_final_answer, final_answer = self._finalize_failed_verification_candidate(
-                                action_step=action_step,
-                                verification_result=verification_result,
-                                verification_round=final_verification_round,
-                                max_rounds=max_final_verification_rounds,
-                                candidate_answer=candidate_answer,
-                            )
-                    else:
-                        final_answer = candidate_answer
-                        if self.final_answer_checks:
-                            self._validate_final_answer(final_answer)
-                        returned_final_answer = True
-                        action_step.is_final_answer = True
+                    if self.final_answer_checks:
+                        self._validate_final_answer(final_answer)
+                    returned_final_answer = True
+                    action_step.is_final_answer = True
 
             except FinalAnswerError:
                 # When the model does not output code, directly treat the large model content as the final answer
-                candidate_answer = action_step.model_output
-                if isinstance(candidate_answer, str):
-                    candidate_answer = convert_code_format(candidate_answer)
-
-                if verification_config.enabled and verification_config.final_verification_enabled:
-                    final_verification_round += 1
-                    verification_result = self.verification_controller.verify_final_answer(
-                        task=task,
-                        candidate=candidate_answer,
-                        memory_summary=self._build_verification_memory_summary(action_step),
-                        round_number=final_verification_round,
-                    )
-                    if verification_result.passed:
-                        final_answer = candidate_answer
-                        if self.final_answer_checks:
-                            self._validate_final_answer(final_answer)
-                        returned_final_answer = True
-                        action_step.is_final_answer = True
-                    else:
-                        returned_final_answer, final_answer = self._finalize_failed_verification_candidate(
-                            action_step=action_step,
-                            verification_result=verification_result,
-                            verification_round=final_verification_round,
-                            max_rounds=max_final_verification_rounds,
-                            candidate_answer=candidate_answer,
-                        )
-                else:
-                    final_answer = candidate_answer
-                    returned_final_answer = True
-                    action_step.is_final_answer = True
+                final_answer = action_step.model_output
+                if isinstance(final_answer, str):
+                    final_answer = convert_code_format(final_answer)
+                returned_final_answer = True
+                action_step.is_final_answer = True
 
             except AgentError as e:
                 action_step.error = e
@@ -838,19 +652,6 @@ def _run_stream(
             # _handle_max_steps_reached already yields the final step internally
             # and sets action_step.error, so don't yield again to avoid duplicate error
             final_answer = self._handle_max_steps_reached(task)
-            if verification_config.enabled and verification_config.final_verification_enabled:
-                final_verification_round += 1
-                verification_result = self.verification_controller.verify_final_answer(
-                    task=task,
-                    candidate=final_answer,
-                    memory_summary=self._build_verification_memory_summary(),
-                    round_number=final_verification_round,
-                )
-                if not verification_result.passed:
-                    final_answer = self.verification_controller.build_controlled_failure_answer(
-                        final_answer,
-                        verification_result,
-                    )
         yield FinalAnswerStep(handle_agent_output_types(final_answer))
 
 
@@ -995,7 +796,7 @@ def _handle_max_steps_reached(self, task: str) -> Any:
         except Exception as e:
             # Fallback to error message if streaming fails
             model_output = f"Error in generating final LLM output: {e}"
-            self.logger.log(f"Error in final answer generation: {e}", level=LogLevel.ERROR)
+            self.logger.log(f"Error in final answer generation: {e}", level=LogLevel.WARNING)
 
         # Finalize the memory step
         final_memory_step.timing.end_time = time.time()
diff --git a/sdk/nexent/core/agents/nexent_agent.py b/sdk/nexent/core/agents/nexent_agent.py
index ed43b6691..a5efcbe82 100644
--- a/sdk/nexent/core/agents/nexent_agent.py
+++ b/sdk/nexent/core/agents/nexent_agent.py
@@ -46,8 +46,10 @@ def _tool_name(tool_obj: Any) -> str:
 
 def _is_retriever_tool(tool_obj: Any) -> bool:
     """Classify tools that should use RETRIEVER rather than TOOL semantics."""
-    name = type(tool_obj).__name__
-    return name in ("KnowledgeBaseSearchTool", "SearchMemoryTool")
+    if type(tool_obj).__name__ == "KnowledgeBaseSearchTool":
+        return True
+    # Otherwise classify by the name that _tool_name() reports for the object.
+    return _tool_name(tool_obj) == "knowledge_base_search"
 
 
 def _build_tool_input(callable_obj: Callable, args: tuple, kwargs: Dict[str, Any]) -> Dict[str, Any]:
@@ -198,16 +200,11 @@ def create_local_tool(self, tool_config: ToolConfig):
             raise ValueError(f"{class_name} not found in local")
         else:
             if class_name == "KnowledgeBaseSearchTool":
-                # Filter out conflicting parameters from params to avoid conflicts.
-                # Parameters declared with exclude=True cannot be passed to __init__
-                # due to smolagents.tools.Tool wrapper restrictions; they are set as
-                # attributes on the instance after construction, sourced from metadata.
-                # `document_paths` is intentionally hidden from the LLM and only
-                # populated via tool_params from the northbound interface.
+                # Filter out conflicting parameters from params to avoid conflicts
+                # These parameters have exclude=True and cannot be passed to __init__
+                # due to smolagents.tools.Tool wrapper restrictions
                 filtered_params = {k: v for k, v in params.items()
-                                   if k not in ["vdb_core", "embedding_model", "observer",
-                                                 "rerank_model", "display_name_to_index_map",
-                                                 "document_paths"]}
+                                   if k not in ["vdb_core", "embedding_model", "observer", "rerank_model", "display_name_to_index_map"]}
                 # Create instance with only non-excluded parameters
                 tools_obj = tool_class(**filtered_params)
                 # Set excluded parameters directly as attributes after instantiation
@@ -221,13 +218,6 @@ def create_local_tool(self, tool_config: ToolConfig):
                     "rerank_model", None) if tool_config.metadata else None
                 tools_obj.display_name_to_index_map = tool_config.metadata.get(
                     "display_name_to_index_map", {}) if tool_config.metadata else {}
-                # Internal access control: restrict results to documents whose
-                # path_or_url is in the allow list. Only the northbound interface
-                # may populate this; never the LLM.
-                tools_obj.set_document_paths(
-                    tool_config.metadata.get(
-                        "document_paths") if tool_config.metadata else None
-                )
             elif class_name in ["DifySearchTool", "DataMateSearchTool"]:
                 # These parameters have exclude=True and cannot be passed to __init__
                 filtered_params = {k: v for k, v in params.items()
@@ -263,19 +253,6 @@ def create_local_tool(self, tool_config: ToolConfig):
                                        storage_client=tool_config.metadata.get("storage_client", []),
                                        validate_url_access=validate_url_access,
                                        **params)
-            elif class_name in ["StoreMemoryTool", "SearchMemoryTool"]:
-                tools_obj = tool_class()
-                tools_obj.observer = self.observer
-                tools_obj.memory_config = tool_config.metadata.get(
-                    "memory_config", {}) if tool_config.metadata else {}
-                tools_obj.tenant_id = tool_config.metadata.get(
-                    "tenant_id", "") if tool_config.metadata else ""
-                tools_obj.user_id = tool_config.metadata.get(
-                    "user_id", "") if tool_config.metadata else ""
-                tools_obj.agent_id = tool_config.metadata.get(
-                    "agent_id", "") if tool_config.metadata else ""
-                tools_obj.memory_user_config = tool_config.metadata.get(
-                    "memory_user_config", None) if tool_config.metadata else None
             else:
                 tools_obj = tool_class(**params)
                 if hasattr(tools_obj, 'observer'):
@@ -434,7 +411,6 @@ def create_single_agent(self, agent_config: AgentConfig):
                 description=agent_config.description,
                 max_steps=agent_config.max_steps,
                 prompt_templates=prompt_templates,
-                verification_config=agent_config.verification_config,
                 provide_run_summary=agent_config.provide_run_summary,
                 managed_agents=managed_agents_list,
                 additional_authorized_imports=SAFE_PYTHON_INTERPRETER_IMPORTS,
diff --git a/sdk/nexent/core/agents/verification.py b/sdk/nexent/core/agents/verification.py
deleted file mode 100644
index e75f41c42..000000000
--- a/sdk/nexent/core/agents/verification.py
+++ /dev/null
@@ -1,732 +0,0 @@
-from __future__ import annotations
-
-import ast
-import json
-import re
-from dataclasses import dataclass, field
-from typing import Any, Dict, List, Optional
-
-from smolagents.models import ChatMessage, MessageRole
-from smolagents.utils import truncate_content
-
-from ...monitor import get_monitoring_manager
-from ..utils.observer import MessageObserver, ProcessType
-from .agent_model import AgentVerificationConfig
-
-
-@dataclass
-class VerificationCheck:
-    name: str
-    passed: bool
-    reason: str = ""
-    fix_hint: str = ""
-
-
-@dataclass
-class VerificationResult:
-    passed: bool
-    severity: str
-    event: str
-    score: float = 1.0
-    phase: str = "pass"
-    failed_criteria: List[str] = field(default_factory=list)
-    repair_instruction: str = ""
-    user_visible_note: str = ""
-    checks: List[VerificationCheck] = field(default_factory=list)
-
-    def to_payload(self, round_number: int = 0, message: Optional[str] = None) -> Dict[str, Any]:
-        return {
-            "phase": self.phase,
-            "event": self.event,
-            "round": round_number,
-            "severity": self.severity,
-            "score": round(float(self.score), 3),
-            "failed_criteria": self.failed_criteria,
-            "repair_instruction": self.repair_instruction,
-            "user_visible_note": self.user_visible_note,
-            "message": message or self.user_visible_note or self.repair_instruction,
-            "passed": self.passed,
-        }
-
-
-class _SilentObserver:
-    """Observer shim used to prevent verifier LLM tokens from appearing in chat UI."""
-
-    current_mode = ProcessType.MODEL_OUTPUT_THINKING
-
-    def add_model_new_token(self, _new_token):
-        return None
-
-    def add_model_reasoning_content(self, _reasoning_content):
-        return None
-
-    def flush_remaining_tokens(self):
-        return None
-
-
-class VerificationController:
-    """Layered verification for critical ReAct events and final answers."""
-
-    _ERROR_RE = re.compile(
-        r"(traceback|exception|error:|failed|timeout|unauthorized|permission denied)",
-        re.IGNORECASE,
-    )
-    _EMPTY_RE = re.compile(r"^\s*(execution logs:\s*)?(last output from code snippet:\s*)?\s*$", re.IGNORECASE)
-    _RAW_TAG_RE = re.compile(r"</?(code|RUN)>|<DISPLAY:[^>]+>|</DISPLAY>", re.IGNORECASE)
-    _CITATION_RE = re.compile(r"\[\[[a-e]\d+\]\]")
-    _LIGHTWEIGHT_CONVERSATION_RE = re.compile(
-        r"^\s*(你好|您好|嗨|哈喽|hello|hi|hey|早上好|上午好|中午好|下午好|晚上好|"
-        r"在吗|你是谁|你会干什么|介绍一下你自己|谢谢|好的|好|可以|没事|再见|"
-        r"thanks|thank you|ok|bye)\s*[。！？!?.]*\s*$",
-        re.IGNORECASE,
-    )
-    _EVIDENCE_DEMAND_RE = re.compile(
-        r"(搜索|检索|查询|查找|分析|调研|根据|基于|引用|证据|来源|文档|文件|代码|项目|数据库|"
-        r"最新|今天|昨天|现在|当前|执行|运行|部署|修复|报错|日志|search|retrieve|cite|source|"
-        r"evidence|file|code|database|latest|today|run|execute|deploy|error|log)",
-        re.IGNORECASE,
-    )
-
-    def __init__(
-        self,
-        config: AgentVerificationConfig,
-        observer: MessageObserver,
-        agent_name: str,
-        model: Any,
-        logger: Any = None,
-    ) -> None:
-        self.config = config
-        self.observer = observer
-        self.agent_name = agent_name
-        self.model = model
-        self.logger = logger
-
-    def is_enabled(self) -> bool:
-        return bool(self.config and self.config.enabled)
-
-    def emit(self, result: VerificationResult, round_number: int = 0, message: Optional[str] = None) -> None:
-        if not self.is_enabled():
-            return
-        try:
-            display_message = message or self._build_display_message(result)
-            self.observer.add_message(
-                self.agent_name,
-                ProcessType.VERIFICATION,
-                json.dumps(result.to_payload(round_number, display_message), ensure_ascii=False),
-            )
-        except Exception:
-            if self.logger:
-                self.logger.log("Failed to emit verification event")
-
-    def _build_display_message(self, result: VerificationResult) -> str:
-        if result.passed and result.phase in {"pass", "final_pass"}:
-            prefix = "最终自检通过" if result.phase == "final_pass" else "基础自检通过"
-            summary = self._build_pass_summary(result)
-            return f"{prefix}：{summary}" if summary else prefix
-
-        if result.phase in {"warning", "blocked", "repair", "final_fail"}:
-            note = result.user_visible_note or result.repair_instruction
-            if note:
-                prefix = {
-                    "warning": "自检发现需关注项",
-                    "blocked": "自检已阻断",
-                    "repair": "自检未通过，正在修正",
-                    "final_fail": "最终自检未通过",
-                }.get(result.phase, "自检提示")
-                return f"{prefix}：{note}"
-
-        return result.user_visible_note or result.repair_instruction or ""
-
-    def _build_pass_summary(self, result: VerificationResult) -> str:
-        if result.event == "tool_precheck":
-            return "动作非空、语法正常，未发现越权风险"
-        if result.event == "retrieval":
-            return "检索返回可用内容，未发现错误信号"
-        if result.event == "handoff":
-            return "子任务返回可用结论，未发现错误信号"
-        if result.event in {"tool_result", "code_execution"}:
-            return "执行结果非空，未发现错误信号"
-
-        if result.event == "final_answer":
-            if "Lightweight conversational task" in (result.user_visible_note or ""):
-                return "轻量对话无需外部证据，答案非空且格式正常"
-
-            labels = self._passed_check_labels(result.checks)
-            if labels:
-                return "、".join(labels[:3])
-            if result.user_visible_note:
-                return result.user_visible_note
-            return "答案满足当前任务要求，未发现阻断问题"
-
-        labels = self._passed_check_labels(result.checks)
-        return "、".join(labels[:3])
-
-    def _passed_check_labels(self, checks: List[VerificationCheck]) -> List[str]:
-        label_map = {
-            "non_empty_code": "动作非空",
-            "python_syntax": "语法正常",
-            "action_scope": "未发现越权风险",
-            "tool_relevance_signal": "动作与任务相关",
-            "observation_present": "结果非空",
-            "tool_error_handled": "未发现未处理错误",
-            "retrieval_has_evidence": "检索证据可用",
-            "handoff_has_substance": "子任务结论可用",
-            "final_answer_non_empty": "答案非空",
-            "no_unresolved_raw_tags": "无内部标记",
-            "no_unresolved_placeholders": "无占位符",
-            "previous_errors_acknowledged": "未发现未处理错误",
-            "intent_coverage": "覆盖用户目标",
-            "evidence_grounding": "证据支撑充分",
-            "citation_integrity": "引用格式正常",
-            "format_safety": "格式安全",
-            "tool_error_handling": "工具错误已处理",
-        }
-        ordered_names = [
-            "intent_coverage",
-            "evidence_grounding",
-            "tool_error_handling",
-            "citation_integrity",
-            "format_safety",
-            "final_answer_non_empty",
-            "no_unresolved_raw_tags",
-            "no_unresolved_placeholders",
-            "previous_errors_acknowledged",
-            "observation_present",
-            "tool_error_handled",
-            "retrieval_has_evidence",
-            "handoff_has_substance",
-            "non_empty_code",
-            "python_syntax",
-            "action_scope",
-            "tool_relevance_signal",
-        ]
-        passed_names = {check.name for check in checks if check.passed}
-        return [label_map[name] for name in ordered_names if name in passed_names and name in label_map]
-
-    def verify_before_tool_call(
-        self,
-        code_action: str,
-        step_number: int,
-        available_tool_names: Optional[List[str]] = None,
-    ) -> VerificationResult:
-        if not self._should_verify_step("tool_precheck"):
-            return self._pass("tool_precheck")
-
-        checks: List[VerificationCheck] = []
-        code_text = code_action or ""
-
-        checks.append(VerificationCheck(
-            name="non_empty_code",
-            passed=bool(code_text.strip()),
-            reason="" if code_text.strip() else "The generated action code is empty.",
-            fix_hint="Generate a concrete tool call or a final answer.",
-        ))
-
-        syntax_ok = True
-        try:
-            ast.parse(code_text)
-        except SyntaxError as exc:
-            syntax_ok = False
-            checks.append(VerificationCheck(
-                name="python_syntax",
-                passed=False,
-                reason=f"Python syntax error: {exc}",
-                fix_hint="Rewrite the action as valid Python inside <code>...</code>.",
-            ))
-        if syntax_ok:
-            checks.append(VerificationCheck(name="python_syntax", passed=True))
-
-        dangerous_terms = [
-            "__import__",
-            "eval(",
-            "exec(",
-            "subprocess",
-            "os.system",
-            "shutil.rmtree",
-            "socket.",
-        ]
-        dangerous_hits = [term for term in dangerous_terms if term in code_text]
-        checks.append(VerificationCheck(
-            name="action_scope",
-            passed=not dangerous_hits,
-            reason=f"Potentially unsafe code terms: {', '.join(dangerous_hits)}" if dangerous_hits else "",
-            fix_hint="Use the platform-provided tools instead of direct system or network operations.",
-        ))
-
-        if "final_answer(" not in code_text and available_tool_names:
-            used_tools = [name for name in available_tool_names if re.search(rf"\b{re.escape(name)}\s*\(", code_text)]
-            checks.append(VerificationCheck(
-                name="tool_relevance_signal",
-                passed=bool(used_tools) or "print(" in code_text,
-                reason="" if used_tools or "print(" in code_text else "No known tool call or printed observation was detected.",
-                fix_hint="Call a relevant tool with keyword arguments, or print the evidence needed for the next step.",
-            ))
-
-        return self._result_from_checks(
-            event="tool_precheck",
-            checks=checks,
-            blocking_names={"non_empty_code", "python_syntax", "action_scope"},
-            step_number=step_number,
-        )
-
-    def verify_after_tool_call(
-        self,
-        code_action: str,
-        observation: str,
-        step_number: int,
-        is_final_answer: bool = False,
-    ) -> VerificationResult:
-        event = self._classify_step_event(code_action, is_final_answer)
-        if not self._should_verify_step(event):
-            return self._pass(event)
-
-        observation_text = observation or ""
-        checks = [
-            VerificationCheck(
-                name="observation_present",
-                passed=not self._EMPTY_RE.match(observation_text),
-                reason="" if observation_text.strip() else "The action produced no visible observation.",
-                fix_hint="Retry with better parameters, inspect tool errors, or explain that evidence is unavailable.",
-            ),
-            VerificationCheck(
-                name="tool_error_handled",
-                passed=not self._ERROR_RE.search(observation_text),
-                reason="The observation contains an error signal." if self._ERROR_RE.search(observation_text) else "",
-                fix_hint="Do not ignore this tool error. Diagnose it, retry safely, or state the limitation.",
-            ),
-        ]
-
-        if event == "retrieval":
-            checks.append(VerificationCheck(
-                name="retrieval_has_evidence",
-                passed=not self._looks_empty_retrieval(observation_text),
-                reason="Retrieval appears empty or has no usable evidence." if self._looks_empty_retrieval(observation_text) else "",
-                fix_hint="Search again with refined terms or say that supporting evidence was not found.",
-            ))
-
-        if event == "handoff":
-            checks.append(VerificationCheck(
-                name="handoff_has_substance",
-                passed=not self._looks_empty_handoff(observation_text),
-                reason="The delegated agent returned no useful result." if self._looks_empty_handoff(observation_text) else "",
-                fix_hint="Reassign a narrower task or proceed with clearly stated limitations.",
-            ))
-
-        return self._result_from_checks(
-            event=event,
-            checks=checks,
-            blocking_names=set(),
-            step_number=step_number,
-        )
-
-    def verify_before_final_answer(
-        self,
-        candidate: Any,
-        observation: str,
-        step_number: int,
-    ) -> VerificationResult:
-        if not self.is_enabled() or not self.config.final_verification_enabled:
-            return self._pass("final_answer")
-
-        answer = "" if candidate is None else str(candidate)
-        observation_text = observation or ""
-        recent_error_signal = self._has_recent_error_signal(observation_text)
-        checks = [
-            VerificationCheck(
-                name="final_answer_non_empty",
-                passed=bool(answer.strip()),
-                reason="" if answer.strip() else "The final answer candidate is empty.",
-                fix_hint="Produce a concise answer or an explicit inability summary.",
-            ),
-            VerificationCheck(
-                name="no_unresolved_raw_tags",
-                passed=not self._RAW_TAG_RE.search(answer),
-                reason="The final answer still contains internal execution/display tags." if self._RAW_TAG_RE.search(answer) else "",
-                fix_hint="Convert internal tags to user-facing Markdown before answering.",
-            ),
-            VerificationCheck(
-                name="no_unresolved_placeholders",
-                passed=not any(marker in answer for marker in ["{{", "}}", "<TODO>", "TODO:"]),
-                reason="The final answer contains unresolved placeholders." if any(marker in answer for marker in ["{{", "}}", "<TODO>", "TODO:"]) else "",
-                fix_hint="Replace placeholders with real content or remove them.",
-            ),
-            VerificationCheck(
-                name="previous_errors_acknowledged",
-                passed=not recent_error_signal or self._mentions_limitation(answer),
-                reason="A recent error signal is not acknowledged in the final answer." if recent_error_signal and not self._mentions_limitation(answer) else "",
-                fix_hint="Acknowledge the failed operation, retry, or state what could not be verified.",
-            ),
-        ]
-
-        return self._result_from_checks(
-            event="final_answer",
-            checks=checks,
-            blocking_names={"final_answer_non_empty", "no_unresolved_raw_tags", "no_unresolved_placeholders"},
-            step_number=step_number,
-        )
-
-    def verify_final_answer(
-        self,
-        task: str,
-        candidate: Any,
-        memory_summary: str,
-        round_number: int,
-    ) -> VerificationResult:
-        if not self.is_enabled() or not self.config.final_verification_enabled:
-            return self._pass("final_answer", phase="final_pass")
-
-        start = self._pass("final_answer", phase="start")
-        self.emit(start, round_number, "正在自检最终答案：检查答案完整性、格式和错误处理")
-
-        deterministic = self.verify_before_final_answer(
-            candidate=candidate,
-            observation=memory_summary,
-            step_number=round_number,
-        )
-        if not deterministic.passed:
-            deterministic.phase = "final_fail"
-            self.emit(deterministic, round_number)
-            return deterministic
-
-        if not self.config.llm_verification_enabled:
-            deterministic.phase = "final_pass"
-            self.emit(deterministic, round_number)
-            return deterministic
-
-        policy = self._build_final_verification_policy(task, memory_summary)
-        if policy["task_profile"] == "lightweight_conversation":
-            deterministic.phase = "final_pass"
-            deterministic.user_visible_note = "Lightweight conversational task; deterministic checks passed."
-            self.emit(deterministic, round_number)
-            return deterministic
-
-        llm_result = self._run_llm_verifier(task, candidate, memory_summary, round_number, policy)
-        self.emit(llm_result, round_number)
-        return llm_result
-
-    def build_feedback_observation(self, result: VerificationResult) -> str:
-        failed = ", ".join(result.failed_criteria) if result.failed_criteria else "verification"
-        instruction = result.repair_instruction or "Revise the next action based on the failed verification checks."
-        return (
-            "\nVerification feedback:\n"
-            f"- Event: {result.event}\n"
-            f"- Severity: {result.severity}\n"
-            f"- Failed criteria: {failed}\n"
-            f"- Repair instruction: {instruction}\n"
-        )
-
-    def build_controlled_failure_answer(self, candidate: Any, result: VerificationResult) -> str:
-        note = result.user_visible_note or "最终答案未能通过自验证。"
-        failed = "、".join(result.failed_criteria) if result.failed_criteria else "verification"
-        instruction = result.repair_instruction or "请补充更多信息或放宽任务约束后重试。"
-        if self.config.fail_policy == "warn" and candidate:
-            return f"{candidate}\n\n> 自验证提示：{note}"
-        return (
-            "我无法在当前步骤内给出已通过自验证的确定答案。\n\n"
-            f"- 未通过项：{failed}\n"
-            f"- 原因：{note}\n"
-            f"- 建议：{instruction}"
-        )
-
-    def _should_verify_step(self, event: str) -> bool:
-        return (
-            self.is_enabled()
-            and self.config.step_verification_enabled
-            and event in set(self.config.critical_events)
-        )
-
-    def _run_llm_verifier(
-        self,
-        task: str,
-        candidate: Any,
-        memory_summary: str,
-        round_number: int,
-        policy: Optional[Dict[str, Any]] = None,
-    ) -> VerificationResult:
-        policy = policy or self._build_final_verification_policy(task, memory_summary)
-        monitoring_manager = get_monitoring_manager()
-        attrs = {
-            "agent.verification.event": "final_answer",
-            "agent.verification.round": round_number,
-            "agent.verification.strictness": self.config.strictness,
-            "agent.verification.fail_policy": self.config.fail_policy,
-            "agent.verification.task_profile": policy["task_profile"],
-            "agent.verification.evidence_required": policy["evidence_required"],
-            "agent.verification.tool_error_check_required": policy["tool_error_check_required"],
-        }
-        with monitoring_manager.trace_agent_step(
-            "agent.verify.final_answer",
-            step_type="verification",
-            **attrs,
-        ):
-            messages = self._build_verifier_messages(task, candidate, memory_summary, policy)
-            saved_observer = getattr(self.model, "observer", None)
-            if saved_observer is not None:
-                try:
-                    self.model.observer = _SilentObserver()
-                except Exception:
-                    pass
-            try:
-                chat_message: ChatMessage = self.model(messages)
-                content = chat_message.content or ""
-                result = self._parse_llm_verifier_result(content, policy)
-                monitoring_manager.add_span_event(
-                    "agent.verification.result",
-                    {
-                        "agent.verification.status": result.phase,
-                        "agent.verification.score": result.score,
-                        "agent.verification.failed_criteria": json.dumps(result.failed_criteria, ensure_ascii=False),
-                    },
-                )
-                return result
-            except Exception as exc:
-                if self.logger:
-                    self.logger.log(f"LLM verifier unavailable: {exc}")
-                result = VerificationResult(
-                    passed=True,
-                    severity="warning",
-                    event="final_answer",
-                    phase="final_pass",
-                    score=0.75,
-                    failed_criteria=["verifier_unavailable"],
-                    user_visible_note="Verifier was unavailable; deterministic checks passed.",
-                )
-                monitoring_manager.add_span_event(
-                    "agent.verification.unavailable",
-                    {"error.type": type(exc).__name__, "error.message": str(exc)},
-                )
-                return result
-            finally:
-                if saved_observer is not None:
-                    try:
-                        self.model.observer = saved_observer
-                    except Exception:
-                        pass
-
-    def _build_verifier_messages(
-        self,
-        task: str,
-        candidate: Any,
-        memory_summary: str,
-        policy: Optional[Dict[str, Any]] = None,
-    ) -> List[ChatMessage]:
-        policy = policy or self._build_final_verification_policy(task, memory_summary)
-        clean_memory_summary = self._strip_internal_verification_feedback(memory_summary or "")
-        system_prompt = (
-            "You are a strict answer verifier for a ReAct agent. "
-            "Check only the evidence shown to you. Do not reveal chain-of-thought. "
-            "Return JSON only with keys: passed, score, status, failed_criteria, checks, "
-            "revision_instruction, user_visible_note. "
-            "Criteria: intent_coverage, evidence_grounding, tool_error_handling, citation_integrity, format_safety. "
-            "Apply criteria conditionally: for lightweight conversational tasks such as greetings or capability chat, "
-            "do not require external observations, citations, tool calls, or retrieval evidence. "
-            "Only fail evidence_grounding when evidence_required is true. "
-            "Only fail tool_error_handling when tool_error_check_required is true and the answer ignores an actual "
-            "tool/code execution error in the evidence summary."
-        )
-        user_prompt = json.dumps(
-            {
-                "task": truncate_content(str(task), max_length=4000),
-                "candidate_answer": truncate_content(str(candidate), max_length=4000),
-                "react_evidence_summary": truncate_content(clean_memory_summary, max_length=6000),
-                "task_profile": policy["task_profile"],
-                "evidence_required": policy["evidence_required"],
-                "tool_error_check_required": policy["tool_error_check_required"],
-                "pass_score": self.config.pass_score,
-                "strictness": self.config.strictness,
-            },
-            ensure_ascii=False,
-        )
-        return [
-            ChatMessage(role=MessageRole.SYSTEM, content=[{"type": "text", "text": system_prompt}]),
-            ChatMessage(role=MessageRole.USER, content=[{"type": "text", "text": user_prompt}]),
-        ]
-
-    def _parse_llm_verifier_result(
-        self,
-        content: str,
-        policy: Optional[Dict[str, Any]] = None,
-    ) -> VerificationResult:
-        policy = policy or {
-            "task_profile": "unknown",
-            "evidence_required": True,
-            "tool_error_check_required": True,
-        }
-        data = self._extract_json(content)
-        passed = bool(data.get("passed"))
-        score = float(data.get("score", 0.0))
-        status = str(data.get("status") or ("pass" if passed else "revise"))
-        failed_criteria = data.get("failed_criteria") or []
-        if not isinstance(failed_criteria, list):
-            failed_criteria = [str(failed_criteria)]
-        failed_criteria = [str(item) for item in failed_criteria]
-        ignored_criteria = set()
-        if not policy.get("evidence_required", True):
-            ignored_criteria.add("evidence_grounding")
-        if not policy.get("tool_error_check_required", True):
-            ignored_criteria.add("tool_error_handling")
-        effective_failed_criteria = [
-            criterion for criterion in failed_criteria if criterion not in ignored_criteria
-        ]
-
-        checks = []
-        for item in data.get("checks") or []:
-            if isinstance(item, dict):
-                name = str(item.get("name", "unknown"))
-                check_passed = bool(item.get("passed"))
-                if name in ignored_criteria:
-                    check_passed = True
-                checks.append(VerificationCheck(
-                    name=name,
-                    passed=check_passed,
-                    reason=str(item.get("reason", "")),
-                    fix_hint=str(item.get("fix_hint", "")),
-                ))
-
-        threshold_passed = score >= self.config.pass_score
-        if failed_criteria and not effective_failed_criteria:
-            passed = True
-            score = max(score, self.config.pass_score)
-            threshold_passed = True
-            status = "pass"
-        effective_passed = passed and threshold_passed
-        severity = "info" if effective_passed else "blocking"
-        return VerificationResult(
-            passed=effective_passed,
-            severity=severity,
-            event="final_answer",
-            phase="final_pass" if effective_passed else "final_fail",
-            score=score,
-            failed_criteria=effective_failed_criteria if effective_failed_criteria else ([] if effective_passed else ["llm_verifier"]),
-            repair_instruction=str(data.get("revision_instruction") or data.get("repair_instruction") or ""),
-            user_visible_note=str(data.get("user_visible_note") or ""),
-            checks=checks,
-        )
-
-    def _extract_json(self, content: str) -> Dict[str, Any]:
-        text = (content or "").strip()
-        if text.startswith("```"):
-            text = re.sub(r"^```(?:json)?\s*", "", text)
-            text = re.sub(r"\s*```$", "", text)
-        try:
-            return json.loads(text)
-        except json.JSONDecodeError:
-            start = text.find("{")
-            end = text.rfind("}")
-            if start >= 0 and end > start:
-                return json.loads(text[start:end + 1])
-            raise
-
-    def _result_from_checks(
-        self,
-        event: str,
-        checks: List[VerificationCheck],
-        blocking_names: set[str],
-        step_number: int,
-    ) -> VerificationResult:
-        failed = [check for check in checks if not check.passed]
-        blocking_failed = [check for check in failed if check.name in blocking_names]
-        should_block = bool(blocking_failed) or (self.config.strictness == "strict" and bool(failed))
-        passed = not should_block
-        severity = "info" if not failed else ("blocking" if should_block else "warning")
-        phase = "pass" if not failed else ("blocked" if should_block else "warning")
-        score = max(0.0, 1.0 - 0.15 * len(failed) - 0.35 * len(blocking_failed))
-        failed_names = [check.name for check in failed]
-        repair_instruction = " ".join(check.fix_hint for check in failed if check.fix_hint).strip()
-        user_visible_note = "；".join(check.reason for check in failed if check.reason).strip()
-        result = VerificationResult(
-            passed=passed,
-            severity=severity,
-            event=event,
-            score=score,
-            phase=phase,
-            failed_criteria=failed_names,
-            repair_instruction=repair_instruction,
-            user_visible_note=user_visible_note,
-            checks=checks,
-        )
-        monitoring_manager = get_monitoring_manager()
-        with monitoring_manager.trace_agent_step(
-            "agent.verify.step",
-            step_type="verification",
-            **{
-                "agent.verification.event": event,
-                "agent.verification.step_number": step_number,
-                "agent.verification.status": phase,
-                "agent.verification.severity": severity,
-                "agent.verification.score": score,
-                "agent.verification.failed_criteria": json.dumps(failed_names, ensure_ascii=False),
-            },
-        ):
-            monitoring_manager.add_span_event(
-                "agent.verification.result",
-                {
-                    "agent.verification.passed": passed,
-                    "agent.verification.failed_criteria": json.dumps(failed_names, ensure_ascii=False),
-                },
-            )
-        self.emit(result, step_number)
-        return result
-
-    def _build_final_verification_policy(self, task: str, memory_summary: str) -> Dict[str, Any]:
-        clean_memory_summary = self._strip_internal_verification_feedback(memory_summary or "")
-        lightweight = self._is_lightweight_conversation_task(task)
-        evidence_required = (not lightweight) and bool(self._EVIDENCE_DEMAND_RE.search(task or ""))
-        return {
-            "task_profile": "lightweight_conversation" if lightweight else "task_oriented",
-            "evidence_required": evidence_required,
-            "tool_error_check_required": self._has_recent_error_signal(clean_memory_summary),
-        }
-
-    def _is_lightweight_conversation_task(self, task: str) -> bool:
-        text = (task or "").strip()
-        if not text:
-            return False
-        if self._LIGHTWEIGHT_CONVERSATION_RE.match(text):
-            return True
-        return False
-
-    def _strip_internal_verification_feedback(self, text: str) -> str:
-        lines = (text or "").splitlines()
-        cleaned: List[str] = []
-        skipping = False
-        for line in lines:
-            if line.strip() == "Verification feedback:":
-                skipping = True
-                continue
-            if skipping:
-                if not line.strip() or line.lstrip().startswith("- "):
-                    continue
-                skipping = False
-            cleaned.append(line)
-        return "\n".join(cleaned)
-
-    def _has_recent_error_signal(self, text: str) -> bool:
-        clean_text = self._strip_internal_verification_feedback(text or "")
-        return bool(self._ERROR_RE.search(clean_text))
-
-    def _classify_step_event(self, code_action: str, is_final_answer: bool) -> str:
-        if is_final_answer:
-            return "final_answer"
-        code = code_action or ""
-        lowered = code.lower()
-        if "knowledge_base_search" in lowered or "search(" in lowered or "_search" in lowered:
-            return "retrieval"
-        if "task=" in code and re.search(r"\w+\s*\(\s*task\s*=", code):
-            return "handoff"
-        return "code_execution"
-
-    def _pass(self, event: str, phase: str = "pass") -> VerificationResult:
-        return VerificationResult(passed=True, severity="info", event=event, phase=phase)
-
-    def _looks_empty_retrieval(self, text: str) -> bool:
-        lowered = (text or "").lower()
-        return any(marker in lowered for marker in ["no result", "no results", "[]", "未找到", "无结果", "没有找到"])
-
-    def _looks_empty_handoff(self, text: str) -> bool:
-        lowered = (text or "").lower()
-        return any(marker in lowered for marker in ["cannot help", "unable", "no answer", "无法", "不能", "空"])
-
-    def _mentions_limitation(self, answer: str) -> bool:
-        lowered = (answer or "").lower()
-        return any(marker in lowered for marker in ["无法", "失败", "错误", "未能", "cannot", "unable", "failed", "error", "limitation"])
diff --git a/sdk/nexent/core/tools/__init__.py b/sdk/nexent/core/tools/__init__.py
index c35991f6e..a640cb5ff 100644
--- a/sdk/nexent/core/tools/__init__.py
+++ b/sdk/nexent/core/tools/__init__.py
@@ -24,8 +24,6 @@
 from .run_skill_script_tool import run_skill_script
 from .read_skill_md_tool import read_skill_md
 from .read_skill_config_tool import read_skill_config
-from .store_memory_tool import StoreMemoryTool
-from .search_memory_tool import SearchMemoryTool
 
 __all__ = [
     "MySqlTool",
@@ -55,7 +53,5 @@
     "AnalyzeVideoTool",
     "run_skill_script",
     "read_skill_md",
-    "read_skill_config",
-    "StoreMemoryTool",
-    "SearchMemoryTool",
+    "read_skill_config"
 ]
diff --git a/sdk/nexent/core/tools/knowledge_base_search_tool.py b/sdk/nexent/core/tools/knowledge_base_search_tool.py
index c0115a0ab..3405be833 100644
--- a/sdk/nexent/core/tools/knowledge_base_search_tool.py
+++ b/sdk/nexent/core/tools/knowledge_base_search_tool.py
@@ -21,21 +21,6 @@
 logger = logging.getLogger("knowledge_base_search_tool")
 
 
-def _unwrap_field_info(value):
-    """Resolve a value that may be wrapped in a Pydantic FieldInfo.
-
-    Parameters declared with `Field(...)` and `exclude=True` are not expanded by
-    smolagents' Tool wrapper, so they arrive at `__init__` as raw FieldInfo
-    instances instead of their declared defaults. This helper extracts the
-    concrete value so callers can safely treat the result as plain data.
-    """
-    if isinstance(value, FieldInfo):
-        if value.default_factory is not None:
-            return value.default_factory()
-        return value.default
-    return value
-
-
 class KnowledgeBaseSearchTool(Tool):
     """Knowledge base search tool"""
 
@@ -63,10 +48,6 @@ class KnowledgeBaseSearchTool(Tool):
         },
     }
 
-    # Internal parameter: restricts search results to specified document paths only.
-    # Not exposed to LLM, only settable via tool_params from /chat/run.
-    _internal_document_paths: Optional[List[str]] = None
-
     init_param_descriptions = {
         "top_k": {
             "description": "Maximum number of search results",
@@ -115,10 +96,6 @@ def __init__(
         display_name_to_index_map: dict = Field(
             description="Mapping from display_name (knowledge_name) to index_name",
             default_factory=dict, exclude=True),
-        # Internal parameter: not exposed to LLM, only settable via tool_params from /chat/run.
-        document_paths: Optional[List[str]] = Field(
-            description="Internal: restrict results to documents with these path_or_urls", default=None, exclude=True
-        ),
     ):
         """Initialize the KBSearchTool.
 
@@ -144,26 +121,11 @@ def __init__(
         self.rerank_model = rerank_model
         self.data_process_service = os.getenv("DATA_PROCESS_SERVICE")
         self.display_name_to_index_map = display_name_to_index_map
-        # `document_paths` is declared with `exclude=True` so smolagents passes the
-        # raw FieldInfo default when no value is supplied. Unwrap it here so the
-        # internal filter is always a concrete list (or None), never a FieldInfo.
-        self._internal_document_paths = _unwrap_field_info(document_paths)
 
         self.record_ops = 1
         self.running_prompt_zh = "知识库检索中..."
         self.running_prompt_en = "Searching the knowledge base..."
 
-    def set_document_paths(self, document_paths: Optional[List[str]]) -> None:
-        """Set the internal document_paths filter for access control.
-
-        This method is intended for internal use only, called via tool_params
-        from the /chat/run endpoint. It is NOT exposed to the LLM.
-
-        Args:
-            document_paths: List of allowed document path_or_urls. If None, no filtering is applied.
-        """
-        self._internal_document_paths = _unwrap_field_info(document_paths)
-
     def _convert_to_index_names(self, names: List[str]) -> List[str]:
         """Convert display names (knowledge_name) to index names if necessary.
 
@@ -193,36 +155,6 @@ def _convert_to_index_names(self, names: List[str]) -> List[str]:
                 converted_names.append(name)
         return converted_names
 
-    def _filter_by_document_paths(self, results: List[dict]) -> List[dict]:
-        """Filter search results by allowed document paths for access control.
-
-        If _internal_document_paths is set, only results whose path_or_url is in the
-        allowed list are returned. Results with no path_or_url field are discarded
-        when the filter is active.
-
-        Args:
-            results: List of search result dicts from VDB search
-
-        Returns:
-            Filtered list containing only results with allowed document paths
-        """
-        allowed_paths = _unwrap_field_info(self._internal_document_paths)
-        if not allowed_paths:
-            return results
-
-        filtered = [
-            result for result in results
-            if result.get("path_or_url") in allowed_paths
-        ]
-
-        if filtered:
-            logger.info(
-                "Document paths filter applied: %d/%d results match allowed paths",
-                len(filtered),
-                len(results),
-            )
-        return filtered
-
     def forward(self, query: str, index_names: Optional[List[str]] = None) -> str:
         # Parse index_names from string (always required)
         search_index_names = index_names if index_names is not None else self.index_names
@@ -271,9 +203,6 @@ def forward(self, query: str, index_names: Optional[List[str]] = None) -> str:
         )
         kb_search_results = kb_search_data["results"]
 
-        # Apply document_paths access control: filter out results not in allowed list
-        kb_search_results = self._filter_by_document_paths(kb_search_results)
-
         if not kb_search_results:
             raise Exception("No results found! Try a less restrictive/shorter query.")
 
diff --git a/sdk/nexent/core/tools/search_memory_tool.py b/sdk/nexent/core/tools/search_memory_tool.py
deleted file mode 100644
index 4819a7625..000000000
--- a/sdk/nexent/core/tools/search_memory_tool.py
+++ /dev/null
@@ -1,109 +0,0 @@
-import asyncio
-import logging
-from typing import Any
-
-from smolagents.tools import Tool
-from pydantic import Field
-
-from ..utils.observer import MessageObserver, ProcessType
-from ..utils.tools_common_message import ToolSign, ToolCategory
-
-logger = logging.getLogger("search_memory_tool")
-
-
-class SearchMemoryTool(Tool):
-    name = "search_memory"
-    description = (
-        "Search long-term memory for relevant information from previous interactions. "
-        "Use this when you need context about the user's preferences, past decisions, "
-        "or previously discussed topics that aren't in the current conversation. "
-        "The system already provides some memory context automatically -- use this tool "
-        "when you need to search for specific information not already available."
-    )
-    description_zh = (
-        "搜索长期记忆中来自之前交互的相关信息。"
-        "当你需要了解用户的偏好、过去的决策或当前对话中未提及的之前讨论过的话题时使用此工具。"
-        "系统已自动提供一些记忆上下文 -- 仅在需要搜索尚未提供的特定信息时使用此工具。"
-    )
-
-    inputs = {
-        "query": {
-            "type": "string",
-            "description": "Natural language query describing what to search for",
-            "description_zh": "描述要搜索内容的自然语言查询"
-        },
-        "top_k": {
-            "type": "integer",
-            "description": "Maximum number of results to return",
-            "description_zh": "返回结果的最大数量",
-            "default": 5,
-            "nullable": True
-        }
-    }
-    output_type = "string"
-    category = ToolCategory.SEARCH.value
-    tool_sign = ToolSign.MEMORY_OPERATION.value
-
-    def __init__(
-        self,
-        memory_config: dict = Field(description="Mem0 configuration", exclude=True),
-        tenant_id: str = Field(description="Tenant ID", default="", exclude=True),
-        user_id: str = Field(description="User ID", default="", exclude=True),
-        agent_id: str = Field(description="Agent ID", default="", exclude=True),
-        memory_user_config: Any = Field(description="User memory preferences", default=None, exclude=True),
-        observer: MessageObserver = Field(description="Message observer", default=None, exclude=True),
-    ):
-        super().__init__()
-        self.memory_config = memory_config
-        self.tenant_id = tenant_id
-        self.user_id = user_id
-        self.agent_id = agent_id
-        self.memory_user_config = memory_user_config
-        self.observer = observer
-        self.running_prompt_en = "Searching memory..."
-        self.running_prompt_zh = "搜索记忆中..."
-
-    def forward(self, query: str, top_k: int = 5) -> str:
-        logger.info(f"[ACTIVE MEMORY] SearchMemoryTool invoked: query={query[:200]}, top_k={top_k}, user_id={self.user_id}, agent_id={self.agent_id}")
-        if self.observer:
-            running_prompt = self.running_prompt_zh if self.observer.lang == "zh" else self.running_prompt_en
-            self.observer.add_message("", ProcessType.TOOL, running_prompt)
-
-        memory_levels = ["tenant", "user", "agent", "user_agent"]
-        if self.memory_user_config.agent_share_option == "never":
-            memory_levels.remove("agent")
-        if self.agent_id in getattr(self.memory_user_config, "disable_agent_ids", []):
-            if "agent" in memory_levels:
-                memory_levels.remove("agent")
-        if self.agent_id in getattr(self.memory_user_config, "disable_user_agent_ids", []):
-            if "user_agent" in memory_levels:
-                memory_levels.remove("user_agent")
-
-        try:
-            from ...memory.memory_service import search_memory_in_levels
-            result = asyncio.run(search_memory_in_levels(
-                query_text=query,
-                memory_config=self.memory_config,
-                tenant_id=self.tenant_id,
-                user_id=self.user_id,
-                agent_id=self.agent_id,
-                top_k=top_k,
-                memory_levels=memory_levels,
-            ))
-
-            items = result.get("results", [])
-            logger.info(f"[ACTIVE MEMORY] SearchMemoryTool completed: found {len(items)} memories, levels={[item.get('memory_level', 'unknown') for item in items]}")
-            if not items:
-                return "No relevant memories found."
-
-            lines = [f"Found {len(items)} relevant memories:"]
-            for i, item in enumerate(items):
-                content = item.get("memory", "") or item.get("content", "")
-                score = item.get("score", 0.0)
-                level = item.get("memory_level", "unknown")
-                lines.append(f"[{i+1}] (score: {score:.2f}, level: {level}) {content}")
-            return "\n".join(lines)
-
-        except Exception as e:
-            logger.error(f"search_memory failed: {e}")
-            return f"Memory search failed: {str(e)}. Continuing without memory results."
diff --git a/sdk/nexent/core/tools/store_memory_tool.py b/sdk/nexent/core/tools/store_memory_tool.py
deleted file mode 100644
index 29dbc4a8f..000000000
--- a/sdk/nexent/core/tools/store_memory_tool.py
+++ /dev/null
@@ -1,110 +0,0 @@
-import asyncio
-import logging
-from typing import Any
-
-from smolagents.tools import Tool
-from pydantic import Field
-
-from ..utils.observer import MessageObserver, ProcessType
-from ..utils.tools_common_message import ToolSign, ToolCategory
-
-logger = logging.getLogger("store_memory_tool")
-
-
-class StoreMemoryTool(Tool):
-    name = "store_memory"
-    description = (
-        "Save important information to long-term memory for future recall. "
-        "Use this when the user shares personal preferences, facts about themselves, "
-        "project context, or instructions that should persist across conversations. "
-        "Do NOT store transient information like temporary calculations, information "
-        "already in the knowledge base, or data the user explicitly says to forget."
-    )
-    description_zh = (
-        "将重要信息保存到长期记忆中以便未来回忆。"
-        "当用户分享个人偏好、关于自己的事实、项目上下文或应跨对话保留的指令时使用此工具。"
-        "不要存储临时信息，如临时计算结果、知识库中已有的信息或用户明确要求遗忘的数据。"
-    )
-
-    inputs = {
-        "content": {
-            "type": "string",
-            "description": "The information to remember",
-            "description_zh": "需要记住的信息"
-        }
-    }
-    output_type = "string"
-    category = ToolCategory.DATABASE.value
-    tool_sign = ToolSign.MEMORY_OPERATION.value
-
-    def __init__(
-        self,
-        memory_config: dict = Field(description="Mem0 configuration", exclude=True),
-        tenant_id: str = Field(description="Tenant ID", default="", exclude=True),
-        user_id: str = Field(description="User ID", default="", exclude=True),
-        agent_id: str = Field(description="Agent ID", default="", exclude=True),
-        memory_user_config: Any = Field(description="User memory preferences", default=None, exclude=True),
-        observer: MessageObserver = Field(description="Message observer", default=None, exclude=True),
-    ):
-        super().__init__()
-        self.memory_config = memory_config
-        self.tenant_id = tenant_id
-        self.user_id = user_id
-        self.agent_id = agent_id
-        self.memory_user_config = memory_user_config
-        self.observer = observer
-        self.store_count = 0
-        self.max_stores_per_run = 3
-        self.running_prompt_en = "Saving to memory..."
-        self.running_prompt_zh = "保存到记忆中..."
-
-    def forward(self, content: str) -> str:
-        logger.info(f"[ACTIVE MEMORY] StoreMemoryTool invoked: content={content[:200]}, user_id={self.user_id}, agent_id={self.agent_id}, store_count={self.store_count}/{self.max_stores_per_run}")
-        if self.observer:
-            running_prompt = self.running_prompt_zh if self.observer.lang == "zh" else self.running_prompt_en
-            self.observer.add_message("", ProcessType.TOOL, running_prompt)
-
-        if self.store_count >= self.max_stores_per_run:
-            return "Memory storage limit reached for this conversation. Information will be saved automatically at the end."
-
-        levels = ["user_agent", "agent"]
-        if self.memory_user_config.agent_share_option == "never":
-            levels.remove("agent")
-        if self.agent_id in getattr(self.memory_user_config, "disable_user_agent_ids", []):
-            levels = [l for l in levels if l != "user_agent"]
-        if self.agent_id in getattr(self.memory_user_config, "disable_agent_ids", []):
-            levels = [l for l in levels if l != "agent"]
-        if not levels:
-            return "No memory levels available (all disabled by user preferences)."
-
-        try:
-            from ...memory.memory_service import add_memory_in_levels
-            result = asyncio.run(add_memory_in_levels(
-                messages=[{"role": "user", "content": content}],
-                memory_config=self.memory_config,
-                tenant_id=self.tenant_id,
-                user_id=self.user_id,
-                agent_id=self.agent_id,
-                memory_levels=levels,
-            ))
-            self.store_count += 1
-
-            items = result.get("results", [])
-            logger.info(f"[ACTIVE MEMORY] StoreMemoryTool completed: {len(items)} items processed, events={[item.get('event', 'NONE') for item in items]}")
-            if not items:
-                return "No new facts were extracted from the content."
-
-            stored_facts = []
-            for item in items:
-                event = item.get("event", "NONE")
-                text = item.get("memory", "")
-                if event in ("ADD", "UPDATE"):
-                    stored_facts.append(f"[{event}] {text}")
-
-            if not stored_facts:
-                return "The information was already present in memory (no changes needed)."
-            return "Stored successfully:\n" + "\n".join(stored_facts)
-
-        except Exception as e:
-            logger.error(f"store_memory failed: {e}")
-            return f"Failed to store memory: {str(e)}. Continuing without saving."
diff --git a/sdk/nexent/core/utils/observer.py b/sdk/nexent/core/utils/observer.py
index fc45b30aa..c123b5157 100644
--- a/sdk/nexent/core/utils/observer.py
+++ b/sdk/nexent/core/utils/observer.py
@@ -27,7 +27,6 @@ class ProcessType(Enum):
     TOOL = "tool"  # tool name
     MEMORY_SEARCH = "memory_search"  # memory search status
     MAX_STEPS_REACHED = "max_steps_reached"  # agent reached maximum steps limit
-    VERIFICATION = "verification"  # layered ReAct self-verification status
 
 
 # message transformer base class
@@ -160,8 +159,7 @@ def _init_message_transformers(self):
             ProcessType.CARD: default_transformer,
             ProcessType.TOOL: default_transformer,
             ProcessType.MEMORY_SEARCH: default_transformer,
-            ProcessType.MAX_STEPS_REACHED: default_transformer,
-            ProcessType.VERIFICATION: default_transformer
+            ProcessType.MAX_STEPS_REACHED: default_transformer
         }
 
     def add_model_new_token(self, new_token):
diff --git a/sdk/nexent/core/utils/tools_common_message.py b/sdk/nexent/core/utils/tools_common_message.py
index 6b5f2e056..1d27f6b6d 100644
--- a/sdk/nexent/core/utils/tools_common_message.py
+++ b/sdk/nexent/core/utils/tools_common_message.py
@@ -17,7 +17,6 @@ class ToolSign(Enum):
     TERMINAL_OPERATION = "t"  # Terminal operation tool identifier
     MULTIMODAL_OPERATION = "m"  # Multimodal operation tool identifier
     DATABASE_OPERATION = "z"  # Database operation tool identifier
-    MEMORY_OPERATION = "n"      # Memory operation tool identifier
 
 
 # Tool sign mapping for backward compatibility
@@ -34,7 +33,6 @@ class ToolSign(Enum):
     "terminal_operation": ToolSign.TERMINAL_OPERATION.value,
     "multimodal_operation": ToolSign.MULTIMODAL_OPERATION.value,
     "database_operation": ToolSign.DATABASE_OPERATION.value,
-    "memory_operation": ToolSign.MEMORY_OPERATION.value,
 }
 
 # Reverse mapping for lookup
diff --git a/sdk/nexent/memory/memory_core.py b/sdk/nexent/memory/memory_core.py
index c5004c00e..434bf2cb0 100644
--- a/sdk/nexent/memory/memory_core.py
+++ b/sdk/nexent/memory/memory_core.py
@@ -102,9 +102,7 @@ async def get_memory_instance(memory_config: Dict[str, Any]) -> AsyncMemory:
     # Validate *before* computing hash so we fail fast with human-readable error
     _validate_config(memory_config)
 
-    config_hash = _hash_config(memory_config)
-    loop = asyncio.get_event_loop()
-    cache_key = f"{config_hash}:{id(loop)}"
+    cache_key = _hash_config(memory_config)
 
     async with _get_cache_lock():
         if cache_key in _MEMORY_CACHE:
diff --git a/sdk/nexent/skills/skill_manager.py b/sdk/nexent/skills/skill_manager.py
index c2e50c790..4c05b3c06 100644
--- a/sdk/nexent/skills/skill_manager.py
+++ b/sdk/nexent/skills/skill_manager.py
@@ -7,7 +7,6 @@
 import shlex
 import shutil
 import subprocess
-import sys
 import tempfile
 import zipfile
 from typing import Any, Dict, List, Optional, Union
@@ -787,13 +786,9 @@ def _run_python_script(self, script_path: str, params: Optional[str]) -> str:
         """
         cmd_parts = shlex.split(params) if params else []
 
-        # Use sys.executable to ensure the script runs in the same Python environment
-        # as the current process, so all installed packages (e.g., python-docx) are available
-        python_executable = sys.executable
-
         try:
             result = subprocess.run(
-                [python_executable, script_path] + cmd_parts,
+                ["python", script_path] + cmd_parts,
                 capture_output=True,
                 text=True,
                 timeout=300,
diff --git a/sdk/pyproject.toml b/sdk/pyproject.toml
index e39bbbf5e..cdb5459b9 100644
--- a/sdk/pyproject.toml
+++ b/sdk/pyproject.toml
@@ -9,12 +9,12 @@ description = "Nexent Agent Framework"
 authors = [
     { name = "Nexent Dev Team" }
 ]
-requires-python = ">=3.11,<3.12"
+requires-python = ">=3.10"
 keywords = ["agent", "ai", "framework"]
 classifiers = [
     "Intended Audience :: Developers",
     "Programming Language :: Python :: 3",
-    "Programming Language :: Python :: 3.11",
+    "Programming Language :: Python :: 3.10",
 ]
 dependencies = [
     "aiofiles>=24.1.0",
@@ -38,8 +38,8 @@ dependencies = [
     "botocore>=1.37.34",
     "python-multipart>=0.0.20",
     "mcpadapt>=0.1.13",
-    "mcp>=1.24.0,<1.30",
-    "fastmcp>=2.14.2,<3.0",
+    "mcp>=1.19.0,<1.23",
+    "fastmcp==2.12.0",
     "docker>=7.0.0",
     "kubernetes>=29.0.0",
     "tiktoken>=0.5.0",
diff --git a/sonar-project.properties b/sonar-project.properties
deleted file mode 100644
index 7da5cc4c8..000000000
--- a/sonar-project.properties
+++ /dev/null
@@ -1,5 +0,0 @@
-sonar.projectKey=ModelEngine-Group_nexent
-sonar.organization=modelengine-group
-
-sonar.exclusions=**/init.sql
-sonar.cpd.exclusions=**/init.sql
\ No newline at end of file
diff --git a/test/backend/agents/test_create_agent_info.py b/test/backend/agents/test_create_agent_info.py
index 083886c1a..f650de5d7 100644
--- a/test/backend/agents/test_create_agent_info.py
+++ b/test/backend/agents/test_create_agent_info.py
@@ -47,21 +47,6 @@ class ToolExecutionException(Exception):
 
 consts_model_module = types.ModuleType("consts.model")
 consts_model_module.HistoryItem = HistoryItem
-
-
-class MockAgentToolParamsRequest(BaseModel):
-    """Mock for AgentToolParamsRequest."""
-    tools: Dict[str, Dict[str, Any]] = {}
-
-
-class MockToolParamsRequest(BaseModel):
-    """Mock for ToolParamsRequest."""
-    agents: Dict[str, MockAgentToolParamsRequest] = {}
-
-
-consts_model_module.HistoryItem = HistoryItem
-consts_model_module.AgentToolParamsRequest = MockAgentToolParamsRequest
-consts_model_module.ToolParamsRequest = MockToolParamsRequest
 sys.modules["consts.model"] = consts_model_module
 
 # Mock consts.exceptions module with ValidationError
@@ -78,7 +63,7 @@ class MockToolParamsRequest(BaseModel):
     setattr(consts_module, "model", consts_model_module)
     setattr(consts_module, "exceptions", consts_exceptions_module)
 
-# Also add model to consts module attributes (with AgentToolParamsRequest and ToolParamsRequest)
+# Also add model to consts module attributes
 consts_module = sys.modules.get("consts")
 if consts_module:
     setattr(consts_module, "model", consts_model_module)
@@ -165,11 +150,6 @@ def __init__(self, **kwargs):
 
 # Mock external dependencies before imports
 mock_message_observer = MagicMock()
-class MockAgentVerificationConfig:
-    @classmethod
-    def model_validate(cls, value):
-        return value or {}
-
 sys.modules['nexent.core.utils.observer'] = MagicMock(MessageObserver=mock_message_observer)
 sys.modules['nexent.core.agents.agent_model'] = _create_stub_module(
     "nexent.core.agents.agent_model",
@@ -179,7 +159,6 @@ def model_validate(cls, value):
     ToolConfig=MagicMock(),
     ExternalA2AAgentConfig=MagicMock(),
     AgentRunInfo=MagicMock(),
-    AgentVerificationConfig=MockAgentVerificationConfig,
     MessageObserver=MagicMock(),
     ContextComponent=_create_stub_component_class("ContextComponent"),
     ToolsComponent=_create_stub_component_class("ToolsComponent"),
@@ -260,7 +239,6 @@ def model_validate(cls, value):
 sys.modules['nexent.core.agents.agent_model'].ModelConfig = mock_model_config
 sys.modules['nexent.core.agents.agent_model'].ToolConfig = mock_tool_config
 sys.modules['nexent.core.agents.agent_model'].AgentRunInfo = mock_agent_run_info
-sys.modules['nexent.core.agents.agent_model'].AgentVerificationConfig = MockAgentVerificationConfig
 sys.modules['nexent.core.utils.observer'].MessageObserver = mock_message_observer
 
 # Mock BASE_BUILTIN_MODULES
@@ -315,9 +293,6 @@ def model_validate(cls, value):
     _build_internal_s3_url,
     _format_minio_files_for_content,
     _convert_history_with_minio_files,
-    _normalize_tool_params_request,
-    _get_agent_tool_overrides,
-    _merge_tool_params,
 )
 
 # Import HistoryItem for testing (from mocked consts.model)
@@ -326,9 +301,6 @@ def model_validate(cls, value):
 # Import ValidationError for testing (from mocked consts.exceptions)
 ValidationError = sys.modules["consts.exceptions"].ValidationError
 
-# Import ToolParamsRequest for testing
-ToolParamsRequest = sys.modules["consts.model"].ToolParamsRequest
-
 # Import constants for testing
 from consts.const import MODEL_CONFIG_MAPPING
 
@@ -764,11 +736,6 @@ async def test_create_tool_config_list_knowledge_base_multimodal(self):
         """Ensure multimodal param is forwarded to embedding model selection."""
         mock_tool_instance = MagicMock()
         mock_tool_instance.class_name = "KnowledgeBaseSearchTool"
-        mock_tool_instance.params = {
-            "index_names": ["idx1", "idx2"],
-            "multimodal": True,
-            "rerank": False,
-        }
 
         with patch('backend.agents.create_agent_info.discover_langchain_tools', return_value=[]), \
                 patch('backend.agents.create_agent_info.search_tools_for_sub_agent') as mock_search_tools, \
@@ -777,7 +744,7 @@ async def test_create_tool_config_list_knowledge_base_multimodal(self):
                 patch('backend.agents.create_agent_info.get_rerank_model') as mock_rerank, \
                 patch('backend.agents.create_agent_info.get_knowledge_name_map_by_index_names') as mock_get_knowledge_map, \
                 patch('backend.agents.create_agent_info.ToolConfig') as mock_tool_config:
-
+            
             mock_tool_config.return_value = mock_tool_instance
 
             mock_search_tools.return_value = [
@@ -788,7 +755,7 @@ async def test_create_tool_config_list_knowledge_base_multimodal(self):
                     "inputs": "string",
                     "output_type": "string",
                     "params": [
-                        {"name": "index_names", "default": ["idx1", "idx2"]},
+                        {"name": "index_names", "default": ["idx1", "idx2"]},  # add this entry
                         {"name": "multimodal", "default": True},
                         {"name": "rerank", "default": False},
                     ],
@@ -806,6 +773,9 @@ async def test_create_tool_config_list_knowledge_base_multimodal(self):
             assert len(result) == 1
             # Verify get_embedding_model_by_index_name was called with tenant_id and first index_name
             mock_embedding_by_index.assert_called_once_with("tenant_1", "idx1")
+            
+            # Verify that multimodal parameter was removed from params (popped)
+            assert "multimodal" not in result[0].params
 
     @pytest.mark.asyncio
     async def test_create_tool_config_list_with_analyze_image_tool(self):
@@ -927,16 +897,11 @@ async def test_create_tool_config_list_with_analyze_text_file_tool(self):
     @pytest.mark.asyncio
     async def test_create_tool_config_list_with_knowledge_base_tool_metadata(self):
         """
-        Test that KnowledgeBaseSearchTool metadata contains vdb_core, embedding_model,
+        Test that KnowledgeBaseSearchTool metadata contains vdb_core, embedding_model, 
         rerank_model, display_name_to_index_map, and index_name_to_display_map.
         """
         mock_tool_instance = MagicMock()
         mock_tool_instance.class_name = "KnowledgeBaseSearchTool"
-        mock_tool_instance.params = {
-            "index_names": ["idx_a"],
-            "rerank": True,
-            "rerank_model_name": "gte-rerank-v2",
-        }
 
         with patch('backend.agents.create_agent_info.discover_langchain_tools', return_value=[]), \
                 patch('backend.agents.create_agent_info.search_tools_for_sub_agent') as mock_search_tools, \
@@ -979,7 +944,7 @@ async def test_create_tool_config_list_with_knowledge_base_tool_metadata(self):
 
             # Verify correct functions were called with correct parameters
             mock_get_vector_db_core.assert_called_once()
-            # Verify that call uses tenant_id and first index_name
+            # Updated: verify the call uses tenant_id and index_name
             mock_embedding.assert_called_once_with("tenant_1", "idx_a")
             mock_rerank.assert_called_once_with(tenant_id="tenant_1", model_name="gte-rerank-v2")
             mock_get_knowledge_map.assert_called_once_with(["idx_a"])
@@ -1264,156 +1229,11 @@ async def test_create_tool_config_list_multiple_tools_same_type(self):
             assert mock_tool_1.metadata["display_name_to_index_map"] == {}
             assert mock_tool_2.metadata["display_name_to_index_map"] == {}
 
-    @pytest.mark.asyncio
-    async def test_create_tool_config_list_applies_request_overrides_for_multiple_tools(self):
-        """Request tool_params should override DB params for multiple tools in one agent."""
-        kb_tool = MagicMock()
-        kb_tool.class_name = "KnowledgeBaseSearchTool"
-        kb_tool.params = {
-            "index_names": ["idx_override"],
-            "rerank": True,
-            "rerank_model_name": "gte-rerank-v2",
-            "top_k": 10,
-        }
-        analyze_tool = MagicMock()
-        analyze_tool.class_name = "AnalyzeTextFileTool"
-        analyze_tool.params = {
-            "prompt": "override prompt",
-        }
-
-        with patch('backend.agents.create_agent_info.ToolConfig') as mock_tool_config, \
-                patch('backend.agents.create_agent_info.discover_langchain_tools', return_value=[]), \
-                patch('backend.agents.create_agent_info.search_tools_for_sub_agent') as mock_search_tools, \
-                patch('backend.agents.create_agent_info.get_vector_db_core') as mock_get_vector_db_core, \
-                patch('backend.agents.create_agent_info.get_embedding_model_by_index_name') as mock_embedding, \
-                patch('backend.agents.create_agent_info.get_rerank_model') as mock_rerank, \
-                patch('backend.agents.create_agent_info.get_knowledge_name_map_by_index_names', return_value={"idx_override": "Override KB"}), \
-                patch('backend.agents.create_agent_info.get_llm_model', return_value='llm-model'):
-            mock_tool_config.side_effect = [kb_tool, analyze_tool]
-            mock_get_vector_db_core.return_value = 'vdb-core'
-            mock_embedding.return_value = ('embedding-model', 1, {'status': 'ok'})
-            mock_rerank.return_value = 'rerank-model'
-            mock_search_tools.return_value = [
-                {
-                    'class_name': 'KnowledgeBaseSearchTool',
-                    'name': 'knowledge_base_search',
-                    'description': 'kb',
-                    'inputs': '{}',
-                    'output_type': 'string',
-                    'params': [
-                        {'name': 'index_names', 'default': ['idx_default']},
-                        {'name': 'rerank', 'default': False},
-                        {'name': 'rerank_model_name', 'default': ''},
-                        {'name': 'top_k', 'default': 5},
-                    ],
-                    'source': 'local',
-                    'usage': None,
-                },
-                {
-                    'class_name': 'AnalyzeTextFileTool',
-                    'name': 'analyze_text_file',
-                    'description': 'text',
-                    'inputs': '{}',
-                    'output_type': 'string',
-                    'params': [
-                        {'name': 'prompt', 'default': 'default prompt'},
-                    ],
-                    'source': 'local',
-                    'usage': None,
-                },
-            ]
-
-            result = await create_tool_config_list(
-                'agent_1',
-                'tenant_1',
-                'user_1',
-                tool_params={
-                    'agents': {
-                        'test_agent': {
-                            'tools': {
-                                'knowledge_base_search': {
-                                    'top_k': 10,
-                                    'rerank': True,
-                                    'rerank_model_name': 'gte-rerank-v2',
-                                    'index_names': ['idx_override'],
-                                },
-                                'analyze_text_file': {
-                                    'prompt': 'override prompt',
-                                },
-                            }
-                        }
-                    }
-                },
-            )
-
-        assert len(result) == 2
-        assert kb_tool.params['top_k'] == 10
-        assert kb_tool.params['rerank'] is True
-        assert kb_tool.params['rerank_model_name'] == 'gte-rerank-v2'
-        assert kb_tool.params['index_names'] == ['idx_override']
-        assert analyze_tool.params['prompt'] == 'override prompt'
-        mock_rerank.assert_called_once_with(tenant_id='tenant_1', model_name='gte-rerank-v2')
-        mock_embedding.assert_called_once_with('tenant_1', 'idx_override')
-
-    @pytest.mark.asyncio
-    async def test_create_tool_config_list_with_tool_params(self):
-        """Test create_tool_config_list with valid tool_params."""
-        mock_tool_instance = MagicMock()
-        mock_tool_instance.class_name = "AnalyzeTextFileTool"
-        mock_tool_instance.params = {
-            "prompt": "override prompt",
-        }
-
-        with patch('backend.agents.create_agent_info.ToolConfig') as mock_tool_config, \
-                patch('backend.agents.create_agent_info.discover_langchain_tools', return_value=[]), \
-                patch('backend.agents.create_agent_info.search_tools_for_sub_agent') as mock_search_tools, \
-                patch('backend.agents.create_agent_info.get_llm_model', return_value='llm-model'):
-            mock_tool_config.return_value = mock_tool_instance
-
-            mock_search_tools.return_value = [
-                {
-                    'class_name': 'AnalyzeTextFileTool',
-                    'name': 'analyze_text_file',
-                    'description': 'text',
-                    'inputs': '{}',
-                    'output_type': 'string',
-                    'params': [
-                        {'name': 'prompt', 'default': 'default prompt'},
-                    ],
-                    'source': 'local',
-                    'usage': None,
-                }
-            ]
-
-            result = await create_tool_config_list(
-                'agent_1',
-                'tenant_1',
-                'user_1',
-                tool_params={
-                    'agents': {
-                        'test_agent': {
-                            'tools': {
-                                'analyze_text_file': {
-                                    'prompt': 'override prompt',
-                                }
-                            }
-                        }
-                    }
-                },
-            )
-
-            assert len(result) == 1
-            assert result[0] is mock_tool_instance
-
     @pytest.mark.asyncio
     async def test_create_tool_config_list_with_dify_tool(self):
         """Test that DifySearchTool gets correct metadata including rerank model."""
         mock_tool_instance = MagicMock()
         mock_tool_instance.class_name = "DifySearchTool"
-        mock_tool_instance.params = {
-            "rerank": True,
-            "rerank_model_name": "gte-rerank-v2",
-        }
 
         with patch('backend.agents.create_agent_info.ToolConfig') as mock_tool_config, \
                 patch('backend.agents.create_agent_info.discover_langchain_tools', return_value=[]), \
@@ -1439,6 +1259,7 @@ async def test_create_tool_config_list_with_dify_tool(self):
                 }
             ]
 
+            from backend.agents.create_agent_info import create_tool_config_list
             result = await create_tool_config_list("agent_1", "tenant_1", "user_1")
 
             # Verify rerank model was fetched
@@ -1455,10 +1276,6 @@ async def test_create_tool_config_list_with_dify_tool_no_rerank(self):
         """Test that DifySearchTool without rerank gets None metadata."""
         mock_tool_instance = MagicMock()
         mock_tool_instance.class_name = "DifySearchTool"
-        mock_tool_instance.params = {
-            "rerank": False,
-            "rerank_model_name": "",
-        }
 
         with patch('backend.agents.create_agent_info.ToolConfig') as mock_tool_config, \
                 patch('backend.agents.create_agent_info.discover_langchain_tools', return_value=[]), \
@@ -1483,6 +1300,7 @@ async def test_create_tool_config_list_with_dify_tool_no_rerank(self):
                 }
             ]
 
+            from backend.agents.create_agent_info import create_tool_config_list
             result = await create_tool_config_list("agent_1", "tenant_1", "user_1")
 
             # Verify rerank model was NOT fetched
@@ -1492,15 +1310,53 @@ async def test_create_tool_config_list_with_dify_tool_no_rerank(self):
             assert len(result) == 1
             assert result[0] is mock_tool_instance
 
+    @pytest.mark.asyncio
+    async def test_create_tool_config_list_with_datamate_tool(self):
+        """Test that DataMateSearchTool gets correct metadata including rerank model."""
+        mock_tool_instance = MagicMock()
+        mock_tool_instance.class_name = "DataMateSearchTool"
+
+        with patch('backend.agents.create_agent_info.ToolConfig') as mock_tool_config, \
+                patch('backend.agents.create_agent_info.discover_langchain_tools', return_value=[]), \
+                patch('backend.agents.create_agent_info.search_tools_for_sub_agent') as mock_search_tools, \
+                patch('backend.agents.create_agent_info.get_rerank_model') as mock_rerank:
+
+            mock_tool_config.return_value = mock_tool_instance
+            mock_rerank.return_value = "mock_datamate_rerank_model"
+
+            mock_search_tools.return_value = [
+                {
+                    "class_name": "DataMateSearchTool",
+                    "name": "datamate_search",
+                    "description": "DataMate knowledge search",
+                    "inputs": "string",
+                    "output_type": "string",
+                    "params": [
+                        {"name": "rerank", "default": True},
+                        {"name": "rerank_model_name", "default": "jina-rerank-v2"},
+                    ],
+                    "source": "local",
+                    "usage": None
+                }
+            ]
+
+            from backend.agents.create_agent_info import create_tool_config_list
+            result = await create_tool_config_list("agent_1", "tenant_1", "user_1")
+
+            # Verify rerank model was fetched
+            mock_rerank.assert_called_once_with(
+                tenant_id="tenant_1", model_name="jina-rerank-v2"
+            )
+
+            # Verify the single configured tool instance is returned
+            assert len(result) == 1
+            assert result[0] is mock_tool_instance
+
     @pytest.mark.asyncio
     async def test_create_tool_config_list_with_datamate_tool_no_rerank(self):
         """Test that DataMateSearchTool without rerank gets None metadata."""
         mock_tool_instance = MagicMock()
         mock_tool_instance.class_name = "DataMateSearchTool"
-        mock_tool_instance.params = {
-            "rerank": False,
-            "rerank_model_name": "",
-        }
 
         with patch('backend.agents.create_agent_info.ToolConfig') as mock_tool_config, \
                 patch('backend.agents.create_agent_info.discover_langchain_tools', return_value=[]), \
@@ -1525,12 +1381,13 @@ async def test_create_tool_config_list_with_datamate_tool_no_rerank(self):
                 }
             ]
 
+            from backend.agents.create_agent_info import create_tool_config_list
             result = await create_tool_config_list("agent_1", "tenant_1", "user_1")
 
             # Verify rerank model was NOT fetched
             mock_rerank.assert_not_called()
 
-            # Verify result
+            # Verify the single configured tool instance is returned
             assert len(result) == 1
             assert result[0] is mock_tool_instance
 
@@ -1630,7 +1487,7 @@ class TestCreateAgentConfig:
     async def test_create_agent_config_basic(self):
         """Test case for basic agent configuration creation"""
         with patch('backend.agents.create_agent_info.search_agent_info_by_agent_id') as mock_search_agent, \
-                patch('backend.agents.create_agent_info.query_sub_agent_relations') as mock_query_sub, \
+                patch('backend.agents.create_agent_info.query_sub_agents_id_list') as mock_query_sub, \
                 patch('backend.agents.create_agent_info.create_tool_config_list') as mock_create_tools, \
                 patch('backend.agents.create_agent_info.get_agent_prompt_template') as mock_get_template, \
                 patch('backend.agents.create_agent_info.tenant_config_manager') as mock_tenant_config, \
@@ -1681,15 +1538,14 @@ async def test_create_agent_config_basic(self):
                 managed_agents=[],
                 external_a2a_agents=[],
                 context_manager_config=ANY,
-                context_components=ANY,
-                verification_config=ANY
+                context_components=ANY
             )
 
     @pytest.mark.asyncio
     async def test_create_agent_config_with_sub_agents(self):
         """Test case for creating agent configuration with sub-agents"""
         with patch('backend.agents.create_agent_info.search_agent_info_by_agent_id') as mock_search_agent, \
-                patch('backend.agents.create_agent_info.query_sub_agent_relations') as mock_query_sub, \
+                patch('backend.agents.create_agent_info.query_sub_agents_id_list') as mock_query_sub, \
                 patch('backend.agents.create_agent_info.create_tool_config_list') as mock_create_tools, \
                 patch('backend.agents.create_agent_info.get_agent_prompt_template') as mock_get_template, \
                 patch('backend.agents.create_agent_info.tenant_config_manager') as mock_tenant_config, \
@@ -1710,9 +1566,7 @@ async def test_create_agent_config_with_sub_agents(self):
                 "model_id": 123,
                 "provide_run_summary": True
             }
-            mock_query_sub.return_value = [
-                {"selected_agent_id": "sub_agent_1", "selected_agent_version_no": None}
-            ]
+            mock_query_sub.return_value = ["sub_agent_1"]
             mock_create_tools.return_value = []
             mock_get_template.return_value = {
                 "system_prompt": "{{duty}} {{constraint}} {{few_shots}}"}
@@ -1753,74 +1607,14 @@ async def test_create_agent_config_with_sub_agents(self):
                     managed_agents=[mock_sub_agent_config],
                     external_a2a_agents=[],
                     context_manager_config=ANY,
-                    context_components=ANY,
-                    verification_config=ANY
+                    context_components=ANY
                 )
 
-    @pytest.mark.asyncio
-    async def test_create_agent_config_with_pinned_sub_agent_version(self):
-        """Test sub-agent config uses pinned selected_agent_version_no from relation"""
-        with patch('backend.agents.create_agent_info.search_agent_info_by_agent_id') as mock_search_agent, \
-                patch('backend.agents.create_agent_info.query_sub_agent_relations') as mock_query_sub, \
-                patch('backend.agents.create_agent_info.resolve_sub_agent_version_no', return_value=3) as mock_resolve, \
-                patch('backend.agents.create_agent_info.create_tool_config_list', new_callable=AsyncMock) as mock_create_tools, \
-                patch('backend.agents.create_agent_info.get_agent_prompt_template') as mock_get_template, \
-                patch('backend.agents.create_agent_info.tenant_config_manager') as mock_tenant_config, \
-                patch('backend.agents.create_agent_info.build_memory_context') as mock_build_memory, \
-                patch('backend.agents.create_agent_info.AgentConfig') as mock_agent_config, \
-                patch('backend.agents.create_agent_info.prepare_prompt_templates') as mock_prepare_templates, \
-                patch('backend.agents.create_agent_info.get_model_by_model_id') as mock_get_model_by_id:
-
-            mock_search_agent.return_value = {
-                "name": "test_agent",
-                "description": "test description",
-                "duty_prompt": "test duty",
-                "constraint_prompt": "test constraint",
-                "few_shots_prompt": "test few shots",
-                "max_steps": 5,
-                "model_id": 123,
-                "provide_run_summary": True,
-            }
-            mock_query_sub.return_value = [
-                {"selected_agent_id": 42, "selected_agent_version_no": 3}
-            ]
-            mock_create_tools.return_value = []
-            mock_get_template.return_value = {"system_prompt": "{{duty}}"}
-            mock_tenant_config.get_app_config.side_effect = ["TestApp", "Test Description"]
-            mock_build_memory.return_value = Mock(
-                user_config=Mock(memory_switch=False),
-                memory_config={},
-                tenant_id="tenant_1",
-                user_id="user_1",
-                agent_id="agent_1",
-            )
-            mock_prepare_templates.return_value = {"system_prompt": "populated_system_prompt"}
-            mock_get_model_by_id.return_value = {"display_name": "test_model"}
-
-            mock_sub_agent_config = Mock()
-            mock_sub_agent_config.name = "sub_agent"
-
-            with patch(
-                'backend.agents.create_agent_info.create_agent_config',
-                new_callable=AsyncMock,
-                return_value=mock_sub_agent_config,
-            ) as mock_recursive_create:
-                mock_agent_config.reset_mock()
-                await create_agent_config("agent_1", "tenant_1", "user_1", "zh", "test query", version_no=2)
-
-                mock_resolve.assert_called_once_with(
-                    selected_agent_id=42,
-                    selected_agent_version_no=3,
-                    tenant_id="tenant_1",
-                )
-                mock_recursive_create.assert_called_once()
-                assert mock_recursive_create.call_args.kwargs["version_no"] == 3
-
     @pytest.mark.asyncio
     async def test_create_agent_config_with_memory(self):
         """Test case for creating agent configuration with memory"""
         with patch('backend.agents.create_agent_info.search_agent_info_by_agent_id') as mock_search_agent, \
-                patch('backend.agents.create_agent_info.query_sub_agent_relations') as mock_query_sub, \
+                patch('backend.agents.create_agent_info.query_sub_agents_id_list') as mock_query_sub, \
                 patch('backend.agents.create_agent_info.create_tool_config_list') as mock_create_tools, \
                 patch('backend.agents.create_agent_info.get_agent_prompt_template') as mock_get_template, \
                 patch('backend.agents.create_agent_info.tenant_config_manager') as mock_tenant_config, \
@@ -1884,7 +1678,7 @@ async def test_create_agent_config_memory_disabled_no_search(self):
             "backend.agents.create_agent_info.search_agent_info_by_agent_id"
         ) as mock_search_agent, \
             patch(
-                "backend.agents.create_agent_info.query_sub_agent_relations"
+                "backend.agents.create_agent_info.query_sub_agents_id_list"
             ) as mock_query_sub, \
             patch(
                 "backend.agents.create_agent_info.create_tool_config_list"
@@ -1962,7 +1756,7 @@ async def test_create_agent_config_memory_disabled_no_search(self):
     async def test_create_agent_config_model_id_none(self):
         """Test case for creating agent configuration when model_id is None"""
         with patch('backend.agents.create_agent_info.search_agent_info_by_agent_id') as mock_search_agent, \
-                patch('backend.agents.create_agent_info.query_sub_agent_relations') as mock_query_sub, \
+                patch('backend.agents.create_agent_info.query_sub_agents_id_list') as mock_query_sub, \
                 patch('backend.agents.create_agent_info.create_tool_config_list') as mock_create_tools, \
                 patch('backend.agents.create_agent_info.get_agent_prompt_template') as mock_get_template, \
                 patch('backend.agents.create_agent_info.tenant_config_manager') as mock_tenant_config, \
@@ -2012,8 +1806,7 @@ async def test_create_agent_config_model_id_none(self):
                 managed_agents=[],
                 external_a2a_agents=[],
                 context_manager_config=ANY,
-                context_components=ANY,
-                verification_config=ANY
+                context_components=ANY
             )
 
     @pytest.mark.asyncio
@@ -2024,7 +1817,7 @@ async def test_create_agent_config_memory_exception(self):
                 "backend.agents.create_agent_info.search_agent_info_by_agent_id"
             ) as mock_search_agent,
             patch(
-                "backend.agents.create_agent_info.query_sub_agent_relations"
+                "backend.agents.create_agent_info.query_sub_agents_id_list"
             ) as mock_query_sub,
             patch(
                 "backend.agents.create_agent_info.create_tool_config_list"
@@ -2104,7 +1897,7 @@ async def test_create_agent_config_memory_levels_agent_share_never(self):
                 "backend.agents.create_agent_info.search_agent_info_by_agent_id"
             ) as mock_search_agent,
             patch(
-                "backend.agents.create_agent_info.query_sub_agent_relations"
+                "backend.agents.create_agent_info.query_sub_agents_id_list"
             ) as mock_query_sub,
             patch(
                 "backend.agents.create_agent_info.create_tool_config_list"
@@ -2199,7 +1992,7 @@ async def test_create_agent_config_memory_levels_disable_agent(self):
                 "backend.agents.create_agent_info.search_agent_info_by_agent_id"
             ) as mock_search_agent,
             patch(
-                "backend.agents.create_agent_info.query_sub_agent_relations"
+                "backend.agents.create_agent_info.query_sub_agents_id_list"
             ) as mock_query_sub,
             patch(
                 "backend.agents.create_agent_info.create_tool_config_list"
@@ -2294,7 +2087,7 @@ async def test_create_agent_config_memory_levels_disable_user_agent(self):
                 "backend.agents.create_agent_info.search_agent_info_by_agent_id"
             ) as mock_search_agent,
             patch(
-                "backend.agents.create_agent_info.query_sub_agent_relations"
+                "backend.agents.create_agent_info.query_sub_agents_id_list"
             ) as mock_query_sub,
             patch(
                 "backend.agents.create_agent_info.create_tool_config_list"
@@ -2388,7 +2181,7 @@ async def test_create_agent_config_with_knowledge_base_summary_filtering(self):
                 "backend.agents.create_agent_info.search_agent_info_by_agent_id"
             ) as mock_search_agent,
             patch(
-                "backend.agents.create_agent_info.query_sub_agent_relations"
+                "backend.agents.create_agent_info.query_sub_agents_id_list"
             ) as mock_query_sub,
             patch(
                 "backend.agents.create_agent_info.create_tool_config_list"
@@ -2509,7 +2302,7 @@ async def test_create_agent_config_uses_metadata_index_name_to_display_map(self)
                 "backend.agents.create_agent_info.search_agent_info_by_agent_id"
             ) as mock_search_agent,
             patch(
-                "backend.agents.create_agent_info.query_sub_agent_relations"
+                "backend.agents.create_agent_info.query_sub_agents_id_list"
             ) as mock_query_sub,
             patch(
                 "backend.agents.create_agent_info.create_tool_config_list"
@@ -2620,7 +2413,7 @@ async def test_create_agent_config_metadata_without_index_name_to_display_map(se
                 "backend.agents.create_agent_info.search_agent_info_by_agent_id"
             ) as mock_search_agent,
             patch(
-                "backend.agents.create_agent_info.query_sub_agent_relations"
+                "backend.agents.create_agent_info.query_sub_agents_id_list"
             ) as mock_query_sub,
             patch(
                 "backend.agents.create_agent_info.create_tool_config_list"
@@ -2720,7 +2513,7 @@ async def test_create_agent_config_knowledge_base_summary_no_indexes_message(
                 "backend.agents.create_agent_info.search_agent_info_by_agent_id"
             ) as mock_search_agent,
             patch(
-                "backend.agents.create_agent_info.query_sub_agent_relations"
+                "backend.agents.create_agent_info.query_sub_agents_id_list"
             ) as mock_query_sub,
             patch(
                 "backend.agents.create_agent_info.create_tool_config_list"
@@ -2785,7 +2578,7 @@ async def test_create_agent_config_knowledge_base_summary_no_indexes_message(
     async def test_create_agent_config_knowledge_base_summary_error(self):
         """Test case for error handling during knowledge base summary build"""
         with patch('backend.agents.create_agent_info.search_agent_info_by_agent_id') as mock_search_agent, \
-                patch('backend.agents.create_agent_info.query_sub_agent_relations') as mock_query_sub, \
+                patch('backend.agents.create_agent_info.query_sub_agents_id_list') as mock_query_sub, \
                 patch('backend.agents.create_agent_info.create_tool_config_list') as mock_create_tools, \
                 patch('backend.agents.create_agent_info.get_agent_prompt_template') as mock_get_template, \
                 patch('backend.agents.create_agent_info.tenant_config_manager') as mock_tenant_config, \
@@ -3159,7 +2952,6 @@ async def test_create_agent_run_info_success(self):
                 last_user_query="processed_query",
                 allow_memory_search=True,
                 version_no=1,
-                tool_params=None,
             )
             mock_get_mcp.assert_called_once_with(tenant_id="tenant_1", is_need_auth=True)
             mock_filter.assert_called_once_with("agent_config", {
@@ -3696,7 +3488,6 @@ async def test_create_agent_run_info_forwards_allow_memory_false(self):
                 last_user_query="processed_query",
                 allow_memory_search=False,
                 version_no=1,
-                tool_params=None,
             )
 
     @pytest.mark.asyncio
@@ -3743,7 +3534,6 @@ async def test_create_agent_run_info_is_debug_true(self):
                 last_user_query="processed_query",
                 allow_memory_search=True,
                 version_no=0,  # Debug mode uses draft version 0
-                tool_params=None,
             )
 
     @pytest.mark.asyncio
@@ -3796,7 +3586,6 @@ async def test_create_agent_run_info_no_published_version_fallback(self):
                 last_user_query="processed_query",
                 allow_memory_search=True,
                 version_no=0,  # Fallback to draft version 0
-                tool_params=None,
             )
             # Verify that get_remote_mcp_server_list was called with is_need_auth=True
             mock_get_mcp.assert_called_once_with(tenant_id="tenant_1", is_need_auth=True)
@@ -4461,10 +4250,6 @@ async def test_knowledge_base_with_display_name_to_index_map(self):
         """Test that KnowledgeBaseSearchTool gets correct display_name_to_index_map from index_names"""
         mock_tool_instance = MagicMock()
         mock_tool_instance.class_name = "KnowledgeBaseSearchTool"
-        mock_tool_instance.params = {
-            "index_names": ["idx1", "idx2"],
-            "rerank": False,
-        }
 
         with patch('backend.agents.create_agent_info.ToolConfig') as mock_tool_config, \
                 patch('backend.agents.create_agent_info.discover_langchain_tools', return_value=[]), \
@@ -4726,16 +4511,11 @@ async def test_knowledge_base_empty_index_names_raises_validation_error(self):
         """Test that ValidationError is raised when index_names is empty for KnowledgeBaseSearchTool."""
         mock_tool_instance = MagicMock()
         mock_tool_instance.class_name = "KnowledgeBaseSearchTool"
-        mock_tool_instance.params = {
-            "index_names": [],
-            "rerank": False,
-        }
 
         with patch('backend.agents.create_agent_info.ToolConfig') as mock_tool_config, \
                 patch('backend.agents.create_agent_info.discover_langchain_tools', return_value=[]), \
                 patch('backend.agents.create_agent_info.search_tools_for_sub_agent') as mock_search_tools, \
                 patch('backend.agents.create_agent_info.get_vector_db_core') as mock_get_vector_db_core, \
-                patch('backend.agents.create_agent_info.get_embedding_model_by_index_name') as mock_get_emb, \
                 patch('backend.agents.create_agent_info.get_rerank_model') as mock_rerank, \
                 patch('backend.agents.create_agent_info.get_knowledge_name_map_by_index_names') as mock_get_knowledge_map:
 
@@ -4758,7 +4538,6 @@ async def test_knowledge_base_empty_index_names_raises_validation_error(self):
                 }
             ]
             mock_get_vector_db_core.return_value = "vdb_core_instance"
-            mock_get_emb.return_value = None  # Will trigger ValidationError
             mock_rerank.return_value = None
             mock_get_knowledge_map.return_value = {}
 
@@ -4767,17 +4546,13 @@ async def test_knowledge_base_empty_index_names_raises_validation_error(self):
                 await create_tool_config_list("agent_1", "tenant_1", "user_1")
 
             # Verify error message
-            assert "index_names" in str(exc_info.value) and "not configured" in str(exc_info.value)
+            assert "Embedding model is required for knowledge_base_search but index_names is empty" in str(exc_info.value)
 
     @pytest.mark.asyncio
     async def test_knowledge_base_no_embedding_model_raises_validation_error(self):
         """Test that ValidationError is raised when get_embedding_model_by_index_name returns None."""
         mock_tool_instance = MagicMock()
         mock_tool_instance.class_name = "KnowledgeBaseSearchTool"
-        mock_tool_instance.params = {
-            "index_names": ["idx1"],
-            "rerank": False,
-        }
 
         with patch('backend.agents.create_agent_info.ToolConfig') as mock_tool_config, \
                 patch('backend.agents.create_agent_info.discover_langchain_tools', return_value=[]), \
@@ -4815,7 +4590,8 @@ async def test_knowledge_base_no_embedding_model_raises_validation_error(self):
             with pytest.raises(ValidationError) as exc_info:
                 await create_tool_config_list("agent_1", "tenant_1", "user_1")
 
-            # Verify error message contains guidance about configuring embedding model
+            # Verify error message contains index name and guidance
+            assert "No embedding model found for index 'idx1'" in str(exc_info.value)
             assert "Please configure an embedding model for this knowledge base" in str(exc_info.value)
 
     @pytest.mark.asyncio
@@ -4823,11 +4599,6 @@ async def test_knowledge_base_with_valid_embedding_model(self):
         """Test that KnowledgeBaseSearchTool correctly sets embedding_model when get_embedding_model_by_index_name succeeds."""
         mock_tool_instance = MagicMock()
         mock_tool_instance.class_name = "KnowledgeBaseSearchTool"
-        mock_tool_instance.params = {
-            "index_names": ["idx1", "idx2"],
-            "rerank": True,
-            "rerank_model_name": "gte-rerank-v2",
-        }
 
         with patch('backend.agents.create_agent_info.ToolConfig') as mock_tool_config, \
                 patch('backend.agents.create_agent_info.discover_langchain_tools', return_value=[]), \
@@ -4871,19 +4642,19 @@ async def test_knowledge_base_with_valid_embedding_model(self):
 
             # Verify the tool was created successfully
             assert len(result) == 1
-
+            
             # Verify get_embedding_model_by_index_name was called with correct parameters
             mock_get_emb_by_index.assert_called_once_with("tenant_1", "idx1")
-
+            
             # Verify metadata contains the embedding_model
             assert result[0].metadata["embedding_model"] == mock_embedding_model
-
+            
             # Verify metadata also contains other expected fields
             assert "vdb_core" in result[0].metadata
             assert "rerank_model" in result[0].metadata
             assert "display_name_to_index_map" in result[0].metadata
             assert "index_name_to_display_map" in result[0].metadata
-
+            
             # Verify mappings are correct
             assert result[0].metadata["display_name_to_index_map"] == {
                 "Knowledge Base 1": "idx1",
@@ -4899,10 +4670,6 @@ async def test_knowledge_base_with_single_index_and_embedding_model(self):
         """Test KnowledgeBaseSearchTool with single index_name and valid embedding model."""
         mock_tool_instance = MagicMock()
         mock_tool_instance.class_name = "KnowledgeBaseSearchTool"
-        mock_tool_instance.params = {
-            "index_names": ["single_index"],
-            "rerank": False,
-        }
 
         with patch('backend.agents.create_agent_info.ToolConfig') as mock_tool_config, \
                 patch('backend.agents.create_agent_info.discover_langchain_tools', return_value=[]), \
@@ -4943,13 +4710,13 @@ async def test_knowledge_base_with_single_index_and_embedding_model(self):
 
             # Verify the tool was created successfully
             assert len(result) == 1
-
+            
             # Verify get_embedding_model_by_index_name was called
             mock_get_emb_by_index.assert_called_once_with("tenant_1", "single_index")
-
+            
             # Verify embedding_model is set correctly
             assert result[0].metadata["embedding_model"] == mock_embedding_model
-
+            
             # Verify mappings for single index
             assert result[0].metadata["display_name_to_index_map"] == {
                 "My Knowledge Base": "single_index"
@@ -4992,12 +4759,12 @@ async def test_knowledge_base_embedding_model_error_metadata(self):
             mock_get_vector_db_core.return_value = "vdb_core"
             mock_rerank.return_value = None
             mock_get_knowledge_map.return_value = {"test_idx": "Test KB"}
-
+            
             # Return valid embedding model with error metadata
             mock_embedding_model = MagicMock()
             mock_get_emb_by_index.return_value = (
-                mock_embedding_model,
-                789,
+                mock_embedding_model, 
+                789, 
                 {"status": "error", "message": "Some error but model exists"}
             )
 
@@ -5422,157 +5189,3 @@ def test_convert_history_with_minio_files_all_items_have_minio_files(self):
 
 if __name__ == "__main__":
     pytest.main([__file__])
-
-
-# ============================================================================
-# Additional tests for improved coverage
-# ============================================================================
-
-
-class TestNormalizeToolParamsRequest:
-    """Tests for _normalize_tool_params_request function."""
-
-    def test_normalize_with_none(self):
-        """Test that None returns empty ToolParamsRequest."""
-        result = _normalize_tool_params_request(None)
-        assert isinstance(result, ToolParamsRequest)
-        assert result.agents == {}
-
-    def test_normalize_with_tool_params_request(self):
-        """Test that ToolParamsRequest is returned as-is."""
-        req = ToolParamsRequest(agents={"agent1": MockAgentToolParamsRequest(tools={"tool1": {"param1": "value1"}})})
-        result = _normalize_tool_params_request(req)
-        assert result is req
-
-    def test_normalize_with_valid_dict(self):
-        """Test that valid dict is validated into ToolParamsRequest."""
-        input_dict = {"agents": {"agent1": {"tools": {"tool1": {"param1": "value1"}}}}}
-        result = _normalize_tool_params_request(input_dict)
-        assert isinstance(result, ToolParamsRequest)
-        assert "agent1" in result.agents
-
-    def test_normalize_with_invalid_type_raises_validation_error(self):
-        """Test that non-dict, non-ToolParamsRequest raises ValidationError."""
-        with pytest.raises(ValidationError, match="tool_params must be an object"):
-            _normalize_tool_params_request("invalid_string")
-
-    def test_normalize_with_invalid_dict_returns_empty(self):
-        """Test that invalid dict returns empty ToolParamsRequest (mock behavior)."""
-        # The mock ToolParamsRequest doesn't validate, so it just returns empty
-        result = _normalize_tool_params_request({"invalid_key": 123})
-        assert isinstance(result, ToolParamsRequest)
-
-
-class TestGetAgentToolOverrides:
-    """Tests for _get_agent_tool_overrides function."""
-
-    def test_get_overrides_with_none_tool_params(self):
-        """Test that None tool_params returns empty dict."""
-        result = _get_agent_tool_overrides(None, "agent1")
-        assert result == {}
-
-    def test_get_overrides_with_none_agent_name(self):
-        """Test that None agent_name returns empty dict."""
-        tool_params = ToolParamsRequest(agents={"agent1": MockAgentToolParamsRequest(tools={"tool1": {"param1": "value1"}})})
-        result = _get_agent_tool_overrides(tool_params, None)
-        assert result == {}
-
-    def test_get_overrides_with_empty_agent_name(self):
-        """Test that empty agent_name returns empty dict."""
-        tool_params = ToolParamsRequest(agents={"agent1": MockAgentToolParamsRequest(tools={"tool1": {"param1": "value1"}})})
-        result = _get_agent_tool_overrides(tool_params, "")
-        assert result == {}
-
-    def test_get_overrides_with_unknown_agent(self):
-        """Test that unknown agent returns empty dict."""
-        tool_params = ToolParamsRequest(agents={"agent1": MockAgentToolParamsRequest(tools={"tool1": {"param1": "value1"}})})
-        result = _get_agent_tool_overrides(tool_params, "unknown_agent")
-        assert result == {}
-
-    def test_get_overrides_with_existing_agent(self):
-        """Test that existing agent returns its tool overrides."""
-        tool_params = ToolParamsRequest(agents={"agent1": MockAgentToolParamsRequest(tools={"tool1": {"param1": "value1"}, "tool2": {"param2": "value2"}})})
-        result = _get_agent_tool_overrides(tool_params, "agent1")
-        assert result == {"tool1": {"param1": "value1"}, "tool2": {"param2": "value2"}}
-
-
-class TestBuildInternalS3Url:
-    """Tests for _build_internal_s3_url function."""
-
-    def test_build_with_non_dict(self):
-        """Test that non-dict input returns empty string."""
-        assert _build_internal_s3_url("not a dict") == ""
-        assert _build_internal_s3_url(None) == ""
-        assert _build_internal_s3_url(123) == ""
-
-    def test_build_with_empty_dict(self):
-        """Test that empty dict returns empty string."""
-        assert _build_internal_s3_url({}) == ""
-
-    def test_build_with_object_name(self):
-        """Test URL building with object_name."""
-        result = _build_internal_s3_url({"object_name": "path/to/file.txt"})
-        # Bucket name depends on test environment mock (MINIO_DEFAULT_BUCKET = "test-bucket")
-        assert result.startswith("s3://")
-        assert "path/to/file.txt" in result
-
-    def test_build_with_object_name_leading_slash(self):
-        """Test URL building with leading slash in object_name."""
-        result = _build_internal_s3_url({"object_name": "/path/to/file.txt"})
-        # Bucket name depends on test environment mock
-        assert result.startswith("s3://")
-        assert "path/to/file.txt" in result
-
-    def test_build_with_s3_url_input(self):
-        """Test that s3:// URL is returned as-is."""
-        result = _build_internal_s3_url({"url": "s3://bucket/path/file.txt"})
-        assert result == "s3://bucket/path/file.txt"
-
-    def test_build_with_s3_single_slash(self):
-        """Test URL building with s3:/ prefix."""
-        result = _build_internal_s3_url({"url": "s3:/bucket/file.txt"})
-        assert result == "s3://bucket/file.txt"
-
-    def test_build_with_blob_url(self):
-        """Test that blob: URL returns empty string."""
-        assert _build_internal_s3_url({"url": "blob:http://example.com/file"}) == ""
-
-    def test_build_with_s3_blob_url(self):
-        """Test that s3:/blob: URL returns empty string."""
-        assert _build_internal_s3_url({"url": "s3:/blob:http://example.com/file"}) == ""
-
-    def test_build_with_http_url(self):
-        """Test that non-s3 URL returns s3:/ prefixed version."""
-        result = _build_internal_s3_url({"url": "https://example.com/file.txt"})
-        assert result == "s3:/https://example.com/file.txt"
-
-
-class TestMergeToolParams:
-    """Tests for _merge_tool_params function."""
-
-    def test_merge_with_override_params(self):
-        """Test that override params update merged params."""
-        tool_record = {"params": [{"name": "param1", "default": "default1"}, {"name": "param2", "default": "default2"}]}
-        override_params = {"param1": "override1"}
-        result = _merge_tool_params(tool_record, override_params)
-        assert result == {"param1": "override1", "param2": "default2"}
-
-    def test_merge_with_extra_params(self):
-        """Test that extra params take precedence."""
-        tool_record = {"params": [{"name": "param1", "default": "default1"}]}
-        override_params = {"param1": "override1"}
-        extra_params = {"param1": "extra1", "internal_param": "secret"}
-        result = _merge_tool_params(tool_record, override_params, extra_params)
-        assert result == {"param1": "extra1", "internal_param": "secret"}
-
-    def test_merge_with_no_params_in_tool_record(self):
-        """Test merge when tool_record has no params."""
-        tool_record = {}
-        result = _merge_tool_params(tool_record, {"override": "value"})
-        assert result == {"override": "value"}
-
-    def test_merge_with_empty_override_params(self):
-        """Test merge with empty override params."""
-        tool_record = {"params": [{"name": "param1", "default": "default1"}]}
-        result = _merge_tool_params(tool_record, {})
-        assert result == {"param1": "default1"}
diff --git a/test/backend/app/test_agent_app.py b/test/backend/app/test_agent_app.py
index f65083217..f1f0ca6a4 100644
--- a/test/backend/app/test_agent_app.py
+++ b/test/backend/app/test_agent_app.py
@@ -720,7 +720,7 @@ def test_export_agent_api_success(mocker, mock_auth_header):
     """Test export_agent_api success case returning JSON."""
     mock_export_agent = mocker.patch(
         "apps.agent_app.export_agent_with_skills_impl", new_callable=AsyncMock)
-    mock_export_agent.return_value = {"agent_id": 123, "name": "Test Agent"}
+    mock_export_agent.return_value = '{"agent_id": 123, "name": "Test Agent"}'
 
     response = config_client.post(
         "/agent/export",
diff --git a/test/backend/app/test_agent_repository_app.py b/test/backend/app/test_agent_repository_app.py
deleted file mode 100644
index b9b0d573a..000000000
--- a/test/backend/app/test_agent_repository_app.py
+++ /dev/null
@@ -1,161 +0,0 @@
-"""Unit tests for backend.apps.agent_repository_app module."""
-
-import os
-import sys
-from unittest.mock import AsyncMock, MagicMock
-
-import pytest
-from fastapi import FastAPI
-from fastapi.testclient import TestClient
-
-current_dir = os.path.dirname(os.path.abspath(__file__))
-backend_dir = os.path.abspath(os.path.join(current_dir, "../../../backend"))
-sys.path.insert(0, backend_dir)
-
-sys.modules.setdefault("services.agent_repository_service", MagicMock())
-sys.modules.setdefault("utils.auth_utils", MagicMock())
-
-from apps.agent_repository_app import agent_repository_router
-
-app = FastAPI()
-app.include_router(agent_repository_router)
-client = TestClient(app)
-
-
-@pytest.fixture
-def mock_auth_header():
-    return {"Authorization": "Bearer test_token"}
-
-
-def test_create_agent_repository_listing_api_success(mocker, mock_auth_header):
-    """Test create_agent_repository_listing_api success case."""
-    mock_get_user_id = mocker.patch(
-        "apps.agent_repository_app.get_current_user_id"
-    )
-    mock_create_listing = mocker.patch(
-        "apps.agent_repository_app.create_agent_repository_listing_impl",
-        new_callable=AsyncMock,
-    )
-
-    mock_get_user_id.return_value = ("test_user_id", "test_tenant_id")
-    mock_create_listing.return_value = {
-        "agent_repository_id": 42,
-        "agent_id": 123,
-        "source_version_no": 1,
-        "is_updated": False,
-    }
-
-    response = client.post(
-        "/repository/agent/123/versions/1",
-        headers=mock_auth_header,
-    )
-
-    assert response.status_code == 200
-    mock_get_user_id.assert_called_once_with(mock_auth_header["Authorization"])
-    mock_create_listing.assert_awaited_once_with(
-        agent_id=123,
-        tenant_id="test_tenant_id",
-        user_id="test_user_id",
-        version_no=1,
-    )
-    assert response.json()["agent_repository_id"] == 42
-    assert response.json()["is_updated"] is False
-
-
-def test_create_agent_repository_listing_api_draft_version(mocker, mock_auth_header):
-    """Test create_agent_repository_listing_api with draft version (version_no=0)."""
-    mock_get_user_id = mocker.patch(
-        "apps.agent_repository_app.get_current_user_id"
-    )
-    mock_create_listing = mocker.patch(
-        "apps.agent_repository_app.create_agent_repository_listing_impl",
-        new_callable=AsyncMock,
-    )
-
-    mock_get_user_id.return_value = ("test_user_id", "test_tenant_id")
-    mock_create_listing.return_value = {
-        "agent_repository_id": 42,
-        "agent_id": 123,
-        "source_version_no": 0,
-        "is_updated": True,
-    }
-
-    response = client.post(
-        "/repository/agent/123/versions/0",
-        headers=mock_auth_header,
-    )
-
-    assert response.status_code == 200
-    mock_create_listing.assert_awaited_once_with(
-        agent_id=123,
-        tenant_id="test_tenant_id",
-        user_id="test_user_id",
-        version_no=0,
-    )
-    assert response.json()["source_version_no"] == 0
-
-
-def test_create_agent_repository_listing_api_bad_request(mocker, mock_auth_header):
-    """Test create_agent_repository_listing_api with ValueError."""
-    mock_get_user_id = mocker.patch(
-        "apps.agent_repository_app.get_current_user_id"
-    )
-    mock_create_listing = mocker.patch(
-        "apps.agent_repository_app.create_agent_repository_listing_impl",
-        new_callable=AsyncMock,
-    )
-
-    mock_get_user_id.return_value = ("test_user_id", "test_tenant_id")
-    mock_create_listing.side_effect = ValueError("version_no must be >= 0")
-
-    response = client.post(
-        "/repository/agent/123/versions/-1",
-        headers=mock_auth_header,
-    )
-
-    assert response.status_code == 400
-    assert response.json()["detail"] == "version_no must be >= 0"
-
-
-def test_create_agent_repository_listing_api_rejects_asset_owner(mocker, mock_auth_header):
-    """Test create_agent_repository_listing_api rejects ASSET_OWNER agents with 400."""
-    mock_get_user_id = mocker.patch(
-        "apps.agent_repository_app.get_current_user_id"
-    )
-    mock_create_listing = mocker.patch(
-        "apps.agent_repository_app.create_agent_repository_listing_impl",
-        new_callable=AsyncMock,
-    )
-
-    mock_get_user_id.return_value = ("test_user_id", "test_tenant_id")
-    mock_create_listing.side_effect = ValueError("租户管理员智能体无法共享")
-
-    response = client.post(
-        "/repository/agent/123/versions/1",
-        headers=mock_auth_header,
-    )
-
-    assert response.status_code == 400
-    assert response.json()["detail"] == "租户管理员智能体无法共享"
-
-
-def test_create_agent_repository_listing_api_exception(mocker, mock_auth_header):
-    """Test create_agent_repository_listing_api with general exception."""
-    mock_get_user_id = mocker.patch(
-        "apps.agent_repository_app.get_current_user_id"
-    )
-    mock_create_listing = mocker.patch(
-        "apps.agent_repository_app.create_agent_repository_listing_impl",
-        new_callable=AsyncMock,
-    )
-
-    mock_get_user_id.return_value = ("test_user_id", "test_tenant_id")
-    mock_create_listing.side_effect = Exception("Database error")
-
-    response = client.post(
-        "/repository/agent/123/versions/1",
-        headers=mock_auth_header,
-    )
-
-    assert response.status_code == 500
-    assert "Create agent repository listing error." in response.json()["detail"]
diff --git a/test/backend/app/test_cas_app.py b/test/backend/app/test_cas_app.py
deleted file mode 100644
index 97536c2db..000000000
--- a/test/backend/app/test_cas_app.py
+++ /dev/null
@@ -1,184 +0,0 @@
-import os
-import sys
-import unittest
-from http import HTTPStatus
-from unittest.mock import AsyncMock, MagicMock
-
-from fastapi import FastAPI
-from fastapi.testclient import TestClient
-
-test_dir = os.path.dirname(__file__)
-backend_dir = os.path.abspath(os.path.join(test_dir, "../../../backend"))
-sys.path.insert(0, backend_dir)
-
-
-class _CasAuthenticationError(Exception):
-    pass
-
-
-_MODULES_TO_RESTORE = ["services.cas_service"]
-_ORIGINAL_MODULES = {name: sys.modules.get(name) for name in _MODULES_TO_RESTORE}
-
-cas_service_mock = MagicMock()
-cas_service_mock.CAS_SERVER_URL = "https://cas.example.com"
-cas_service_mock.CasAuthenticationError = _CasAuthenticationError
-cas_service_mock.get_cas_config = MagicMock(
-    return_value={
-        "enabled": True,
-        "login_mode": "button",
-        "renew_before_seconds": 300,
-        "renew_timeout_seconds": 10,
-        "display_name": "CAS",
-    }
-)
-cas_service_mock.build_login_url = MagicMock(return_value="https://cas.example.com/login?service=x")
-cas_service_mock.build_renew_url = MagicMock(return_value="https://cas.example.com/login?gateway=true")
-cas_service_mock.login_with_ticket = AsyncMock(
-    return_value={
-        "user": {"id": "user-1", "email": "u@example.com", "role": "USER"},
-        "session": {"access_token": "jwt", "expires_at": 1779780000, "expires_in_seconds": 3600},
-        "redirect_url": "/chat",
-    }
-)
-cas_service_mock.renew_with_ticket = AsyncMock(
-    return_value={
-        "user": {"id": "user-1", "email": "u@example.com", "role": "USER"},
-        "session": {"access_token": "jwt2", "expires_at": 1779780300, "expires_in_seconds": 3600},
-        "redirect_url": "/",
-        "renew": True,
-    }
-)
-cas_service_mock.revoke_from_logout_request = MagicMock(
-    return_value={"revoked": 1, "cas_user_id": "cas-user-1", "session_index": "ST-1"}
-)
-sys.modules["services.cas_service"] = cas_service_mock
-
-from apps.cas_app import router  # noqa: E402
-
-for _name, _module in _ORIGINAL_MODULES.items():
-    if _module is None:
-        sys.modules.pop(_name, None)
-    else:
-        sys.modules[_name] = _module
-
-app = FastAPI()
-app.include_router(router)
-client = TestClient(app)
-
-
-class TestCasApp(unittest.TestCase):
-    def tearDown(self):
-        cas_service_mock.build_login_url.side_effect = None
-        cas_service_mock.build_login_url.return_value = "https://cas.example.com/login?service=x"
-        cas_service_mock.build_renew_url.side_effect = None
-        cas_service_mock.build_renew_url.return_value = "https://cas.example.com/login?gateway=true"
-        cas_service_mock.login_with_ticket.side_effect = None
-        cas_service_mock.revoke_from_logout_request.reset_mock()
-
-    def test_config_returns_public_cas_settings(self):
-        response = client.get("/user/cas/config")
-
-        self.assertEqual(response.status_code, HTTPStatus.OK)
-        data = response.json()
-        self.assertEqual(data["message"], "success")
-        self.assertTrue(data["data"]["enabled"])
-        self.assertEqual(data["data"]["login_mode"], "button")
-
-    def test_login_redirects_to_cas_server(self):
-        response = client.get("/user/cas/login?redirect=/chat", follow_redirects=False)
-
-        self.assertEqual(response.status_code, HTTPStatus.FOUND)
-        self.assertEqual(response.headers["location"], "https://cas.example.com/login?service=x")
-        cas_service_mock.build_login_url.assert_called_with("/chat")
-
-    def test_login_returns_400_when_cas_not_configured(self):
-        cas_service_mock.build_login_url.side_effect = _CasAuthenticationError("CAS is not configured")
-
-        response = client.get("/user/cas/login")
-
-        self.assertEqual(response.status_code, HTTPStatus.BAD_REQUEST)
-        self.assertEqual(response.json()["detail"], "CAS login is not available")
-        self.assertNotIn("CAS is not configured", response.text)
-
-    def test_login_rejects_redirect_url_outside_configured_cas_server(self):
-        cas_service_mock.build_login_url.return_value = "https://evil.example.com/login?service=x"
-
-        response = client.get("/user/cas/login?redirect=/chat", follow_redirects=False)
-
-        self.assertEqual(response.status_code, HTTPStatus.BAD_REQUEST)
-        self.assertEqual(response.json()["detail"], "CAS login is not available")
-
-    def test_callback_returns_session_payload(self):
-        response = client.get("/user/cas/callback?ticket=ST-1&redirect=/chat")
-
-        self.assertEqual(response.status_code, HTTPStatus.OK)
-        data = response.json()
-        self.assertEqual(data["message"], "CAS login successful")
-        self.assertEqual(data["data"]["session"]["access_token"], "jwt")
-        cas_service_mock.login_with_ticket.assert_awaited()
-
-    def test_callback_returns_401_for_invalid_ticket(self):
-        cas_service_mock.login_with_ticket.side_effect = _CasAuthenticationError("bad ticket")
-
-        response = client.get("/user/cas/callback?ticket=bad")
-
-        self.assertEqual(response.status_code, HTTPStatus.UNAUTHORIZED)
-        self.assertEqual(response.json()["detail"], "CAS authentication failed")
-        self.assertNotIn("bad ticket", response.text)
-
-    def test_renew_does_not_expose_cas_configuration_exception(self):
-        cas_service_mock.build_renew_url.side_effect = _CasAuthenticationError("internal CAS config path")
-
-        response = client.get("/user/cas/renew")
-
-        self.assertEqual(response.status_code, HTTPStatus.OK)
-        self.assertIn("cas-renew-failed", response.text)
-        self.assertIn("CAS renew failed", response.text)
-        self.assertNotIn("internal CAS config path", response.text)
-
-    def test_renew_callback_without_ticket_posts_failure_to_iframe_parent(self):
-        response = client.get("/user/cas/renew_callback")
-
-        self.assertEqual(response.status_code, HTTPStatus.OK)
-        self.assertIn("text/html", response.headers["content-type"])
-        self.assertIn("cas-renew-failed", response.text)
-
-    def test_logout_callback_accepts_cas_form_body(self):
-        xml = """
-        <samlp:LogoutRequest xmlns:samlp="urn:oasis:names:tc:SAML:2.0:protocol"
-          xmlns:saml="urn:oasis:names:tc:SAML:2.0:assertion">
-          <saml:NameID>cas-user-1</saml:NameID>
-          <samlp:SessionIndex>ST-1</samlp:SessionIndex>
-        </samlp:LogoutRequest>
-        """
-
-        response = client.post(
-            "/user/cas/logout_callback",
-            data={"logoutRequest": xml},
-        )
-
-        self.assertEqual(response.status_code, HTTPStatus.OK)
-        self.assertEqual(response.json()["data"]["revoked"], 1)
-        cas_service_mock.revoke_from_logout_request.assert_called_once_with(xml)
-
-    def test_callback_post_accepts_cas_single_logout_request(self):
-        xml = """
-        <samlp:LogoutRequest xmlns:samlp="urn:oasis:names:tc:SAML:2.0:protocol"
-          xmlns:saml="urn:oasis:names:tc:SAML:2.0:assertion">
-          <saml:NameID>cas-user-1</saml:NameID>
-          <samlp:SessionIndex>ST-1</samlp:SessionIndex>
-        </samlp:LogoutRequest>
-        """
-
-        response = client.post(
-            "/user/cas/callback",
-            data={"logoutRequest": xml},
-        )
-
-        self.assertEqual(response.status_code, HTTPStatus.OK)
-        self.assertEqual(response.json()["data"]["revoked"], 1)
-        cas_service_mock.revoke_from_logout_request.assert_called_once_with(xml)
-
-
-if __name__ == "__main__":
-    unittest.main()
diff --git a/test/backend/app/test_idata_app.py b/test/backend/app/test_idata_app.py
index 4f7774ccd..66b213f96 100644
--- a/test/backend/app/test_idata_app.py
+++ b/test/backend/app/test_idata_app.py
@@ -5,7 +5,6 @@
 """
 import sys
 import os
-import types
 from unittest.mock import patch, MagicMock
 
 import pytest
@@ -20,57 +19,6 @@
 if backend_dir not in sys.path:
     sys.path.insert(0, backend_dir)
 
-# Stub the SDK modules used during import so tests do not load nexent.__init__ and
-# its optional runtime dependencies.
-nexent_module = types.ModuleType("nexent")
-nexent_module.__path__ = []
-nexent_storage_module = types.ModuleType("nexent.storage")
-nexent_storage_module.__path__ = []
-nexent_storage_factory_module = types.ModuleType("nexent.storage.storage_client_factory")
-nexent_minio_config_module = types.ModuleType("nexent.storage.minio_config")
-nexent_utils_module = types.ModuleType("nexent.utils")
-nexent_utils_module.__path__ = []
-nexent_http_client_manager_module = types.ModuleType("nexent.utils.http_client_manager")
-
-
-class MockMinIOStorageConfig:
-    def __init__(self, *args, **kwargs):
-        self.default_bucket = kwargs.get("default_bucket")
-
-    def validate(self):
-        return None
-
-
-nexent_storage_factory_module.create_storage_client_from_config = MagicMock()
-nexent_storage_factory_module.MinIOStorageConfig = MockMinIOStorageConfig
-nexent_minio_config_module.MinIOStorageConfig = MockMinIOStorageConfig
-nexent_http_client_manager_module.http_client_manager = MagicMock()
-nexent_module.storage = nexent_storage_module
-nexent_module.utils = nexent_utils_module
-nexent_storage_module.storage_client_factory = nexent_storage_factory_module
-nexent_storage_module.minio_config = nexent_minio_config_module
-nexent_utils_module.http_client_manager = nexent_http_client_manager_module
-
-sys.modules["nexent"] = nexent_module
-sys.modules["nexent.storage"] = nexent_storage_module
-sys.modules["nexent.storage.storage_client_factory"] = nexent_storage_factory_module
-sys.modules["nexent.storage.minio_config"] = nexent_minio_config_module
-sys.modules["nexent.utils"] = nexent_utils_module
-sys.modules["nexent.utils.http_client_manager"] = nexent_http_client_manager_module
-
-backend_module = sys.modules.get("backend") or types.ModuleType("backend")
-backend_module.__path__ = [backend_dir]
-backend_database_module = types.ModuleType("backend.database")
-backend_database_module.__path__ = [os.path.join(backend_dir, "database")]
-backend_database_client_module = types.ModuleType("backend.database.client")
-backend_database_client_module.MinioClient = MagicMock()
-backend_module.database = backend_database_module
-backend_database_module.client = backend_database_client_module
-
-sys.modules["backend"] = backend_module
-sys.modules["backend.database"] = backend_database_module
-sys.modules["backend.database.client"] = backend_database_client_module
-
 # Mock the storage client factory BEFORE importing any backend modules that depend on it.
 # This prevents MinIO connection attempts during module import.
 
@@ -569,17 +517,29 @@ def test_router_prefix(self):
     def test_routes_registered(self):
         """Test that all routes are registered."""
         app = _build_app()
-        paths = app.openapi()["paths"]
+        routes = [getattr(route, "path", None) for route in app.routes]
 
-        assert "/idata/knowledge-space" in paths
-        assert "/idata/datasets" in paths
+        assert "/idata/knowledge-space" in routes
+        assert "/idata/datasets" in routes
 
     def test_router_methods(self):
         """Test that routes have correct HTTP methods."""
         app = _build_app()
-        paths = app.openapi()["paths"]
 
-        assert "/idata/knowledge-space" in paths
-        assert "/idata/datasets" in paths
-        assert "get" in paths["/idata/knowledge-space"]
-        assert "get" in paths["/idata/datasets"]
+        # Locate the two iData routes by their registered path
+        knowledge_space_route = None
+        datasets_route = None
+
+        for route in app.routes:
+            if hasattr(route, 'path'):
+                if route.path == "/idata/knowledge-space":
+                    knowledge_space_route = route
+                elif route.path == "/idata/datasets":
+                    datasets_route = route
+
+        assert knowledge_space_route is not None
+        assert datasets_route is not None
+
+        # Both endpoints must accept GET
+        assert "GET" in knowledge_space_route.methods
+        assert "GET" in datasets_route.methods
diff --git a/test/backend/app/test_knowledge_summary_app.py b/test/backend/app/test_knowledge_summary_app.py
index fcbad52db..6201cf381 100644
--- a/test/backend/app/test_knowledge_summary_app.py
+++ b/test/backend/app/test_knowledge_summary_app.py
@@ -12,7 +12,6 @@
 from unittest.mock import patch, MagicMock, AsyncMock
 
 import pytest
-from pydantic import BaseModel
 
 # Apply patches that need to be active before imports
 from unittest.mock import patch as mock_patch
@@ -40,16 +39,7 @@ class MockToolConfig:
     pass
 
 
-class MockAgentVerificationConfig:
-    @classmethod
-    def model_validate(cls, value):
-        mock_config = MagicMock()
-        mock_config.model_dump.return_value = value
-        return mock_config
-
-
 nexent_core_agents_agent_model.ToolConfig = MockToolConfig
-nexent_core_agents_agent_model.AgentVerificationConfig = MockAgentVerificationConfig
 sys.modules['nexent.core.agents.agent_model'] = nexent_core_agents_agent_model
 nexent_nexent_vector_database = types.ModuleType('nexent.vector_database')
 sys.modules['nexent.vector_database'] = nexent_nexent_vector_database
@@ -83,18 +73,6 @@ def mock_get_vector_db_core():
 sys.modules['services.redis_service'] = types.ModuleType('services.redis_service')
 sys.modules['services.group_service'] = types.ModuleType('services.group_service')
 
-# knowledge_summary_app only needs this request model from consts.model. Keeping
-# it local avoids importing unrelated EmailStr models and optional validators.
-consts_model_mock = types.ModuleType('consts.model')
-
-
-class ChangeSummaryRequest(BaseModel):
-    summary_result: str
-
-
-consts_model_mock.ChangeSummaryRequest = ChangeSummaryRequest
-sys.modules['consts.model'] = consts_model_mock
-
 # Mock utils modules used by knowledge_summary_app to avoid deep DB/storage import chains
 utils_auth_utils_mock = types.ModuleType('utils.auth_utils')
 utils_auth_utils_mock.get_current_user_id = MagicMock(return_value=("test_user_id", "test_tenant_id"))
@@ -112,6 +90,7 @@ class ChangeSummaryRequest(BaseModel):
 # Import the modules we need
 from fastapi.testclient import TestClient
 from fastapi import FastAPI
+from pydantic import BaseModel
 from apps.knowledge_summary_app import router
 
 # Create a test app and client
diff --git a/test/backend/app/test_northbound_app.py b/test/backend/app/test_northbound_app.py
index 827e04e4d..2bfb25a76 100644
--- a/test/backend/app/test_northbound_app.py
+++ b/test/backend/app/test_northbound_app.py
@@ -1,22 +1,53 @@
-"""Unit tests for backend.apps.northbound_app module."""
-import sys
 import os
-
-# The conftest.py sets up all mocks
-
-from unittest.mock import AsyncMock, MagicMock, patch
+import sys
+from unittest.mock import MagicMock, AsyncMock
 import pytest
-from fastapi import FastAPI
+from fastapi import FastAPI, HTTPException
+from fastapi.responses import StreamingResponse
 from fastapi.testclient import TestClient
-from io import BytesIO
-
-# Import from conftest (which sets up mocks automatically)
+import types
+import sys as _sys
+
+# Put the backend directory first on sys.path so `apps.*` is imported from this repository
+current_dir = os.path.dirname(os.path.abspath(__file__))
+backend_dir = os.path.abspath(os.path.join(current_dir, "../../../backend"))
+sys.path.insert(0, backend_dir)
+
+
+# Pre-mock heavy dependencies before importing router
+sys.modules['consts.model'] = MagicMock()
+consts_exceptions_mod = types.ModuleType("consts.exceptions")
+
+
+class LimitExceededError(Exception):
+    pass
+
+
+class UnauthorizedError(Exception):
+    pass
+
+
+class SignatureValidationError(Exception):
+    pass
+
+
+consts_exceptions_mod.LimitExceededError = LimitExceededError
+consts_exceptions_mod.UnauthorizedError = UnauthorizedError
+consts_exceptions_mod.SignatureValidationError = SignatureValidationError
+
+# The parent 'consts' must be a real module (not a MagicMock) exposing the stubbed exceptions
+consts_root = types.ModuleType("consts")
+consts_root.__path__ = []
+consts_root.exceptions = consts_exceptions_mod
+_sys.modules['consts'] = consts_root
+_sys.modules['consts.exceptions'] = consts_exceptions_mod
+sys.modules['services'] = MagicMock()
+sys.modules['services.northbound_service'] = MagicMock()
+sys.modules['utils'] = MagicMock()
+sys.modules['utils.auth_utils'] = MagicMock()
+
+# Import router after setting mocks
 from apps.northbound_app import router
-from consts.exceptions import (
-    LimitExceededError,
-    UnauthorizedError,
-    SignatureValidationError,
-)
 
 
 app = FastAPI()
@@ -25,7 +56,6 @@
 
 
 def _build_headers(auth="Bearer test_jwt", request_id="req-123", aksk=True):
-    """Build request headers for testing."""
     headers = {
         "Authorization": auth,
         "X-Request-Id": request_id,
@@ -39,12 +69,8 @@ def _build_headers(auth="Bearer test_jwt", request_id="req-123", aksk=True):
     return headers
 
 
-# =============================================================================
-# Health Check Tests
-# =============================================================================
-
-def test_health_check():
-    """Test health check endpoint returns healthy status."""
+@pytest.mark.asyncio
+async def test_health_check():
     resp = client.get("/nb/v1/health")
     assert resp.status_code == 200
     data = resp.json()
@@ -52,783 +78,544 @@ def test_health_check():
     assert data["service"] == "northbound-api"
 
 
-# =============================================================================
-# Upload Chat Attachments Tests
-# =============================================================================
-
-def test_upload_chat_attachments_success():
-    """Test successful chat attachment upload."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.upload_files_for_northbound', new_callable=AsyncMock) as mock_upload:
+def test_run_chat_calls_service(monkeypatch):
+    # Mock Bearer token validation to return valid token
+    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
+    # Mock user/tenant lookup to return user and tenant
+    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
+        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
+    })
+    async def _gen():
+        yield b"data: hello\n\n"
+    start_mock = AsyncMock(return_value=StreamingResponse(_gen(), media_type="text/event-stream"))
+    monkeypatch.setattr("apps.northbound_app.start_streaming_chat", start_mock)
 
-        mock_ctx.return_value = MagicMock()
-        mock_upload.return_value = {
-            "message": "Processed 1 files",
-            "requestId": "req-123",
-            "results": [{"filename": "test.pdf", "status": "success"}],
-        }
+    # Use integer conversation_id as the endpoint expects Optional[int]
+    payload = {"conversation_id": 1, "agent_name": "agent-a", "query": "hi"}
+    headers = {**_build_headers(), "Idempotency-Key": "idem-1"}
+    resp = client.post("/nb/v1/chat/run", json=payload, headers=headers)
 
-        # Create a fake file upload
-        file_content = b"test file content"
-        files = {"files": ("test.pdf", BytesIO(file_content), "application/pdf")}
-
-        resp = client.post(
-            "/nb/v1/chat/attachments/upload",
-            files=files,
-            headers=_build_headers(),
-        )
-
-        assert resp.status_code == 200
-        data = resp.json()
-        assert data["message"] == "Processed 1 files"
-
-
-def test_upload_chat_attachments_limit_exceeded():
-    """Test upload returns 429 when limit exceeded."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.upload_files_for_northbound', new_callable=AsyncMock) as mock_upload:
-
-        mock_ctx.return_value = MagicMock()
-        mock_upload.side_effect = LimitExceededError("Upload limit exceeded")
-
-        file_content = b"test file content"
-        files = {"files": ("test.pdf", BytesIO(file_content), "application/pdf")}
-
-        resp = client.post(
-            "/nb/v1/chat/attachments/upload",
-            files=files,
-            headers=_build_headers(),
-        )
+    assert resp.status_code == 200
+    assert "text/event-stream" in resp.headers["content-type"]
+    # Validate call into service
+    assert start_mock.await_count == 1
+    args, kwargs = start_mock.call_args
+    assert kwargs["conversation_id"] == 1
+    assert kwargs["agent_name"] == "agent-a"
+    assert kwargs["query"] == "hi"
+    assert kwargs["idempotency_key"] == "idem-1"
+
+
+def test_stop_chat_calls_service(monkeypatch):
+    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
+    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
+        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
+    })
+    stop_mock = AsyncMock(return_value={"message": "success"})
+    monkeypatch.setattr("apps.northbound_app.stop_chat", stop_mock)
+
+    # Use integer conversation_id in URL path
+    resp = client.get("/nb/v1/chat/stop/123", headers=_build_headers())
+    assert resp.status_code == 200
+    assert stop_mock.await_count == 1
 
-        assert resp.status_code == 429
 
+def test_get_history_calls_service(monkeypatch):
+    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
+    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
+        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
+    })
+    hist_mock = AsyncMock(return_value={"message": "success"})
+    monkeypatch.setattr("apps.northbound_app.get_conversation_history", hist_mock)
 
-def test_upload_chat_attachments_internal_error():
-    """Test upload returns 500 when internal error occurs."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.upload_files_for_northbound', new_callable=AsyncMock) as mock_upload:
+    # Use integer conversation_id in URL path
+    resp = client.get("/nb/v1/conversations/123", headers=_build_headers())
+    assert resp.status_code == 200
+    assert hist_mock.await_count == 1
 
-        mock_ctx.return_value = MagicMock()
-        mock_upload.side_effect = Exception("Unknown error")
 
-        file_content = b"test file content"
-        files = {"files": ("test.pdf", BytesIO(file_content), "application/pdf")}
+def test_list_agents_calls_service(monkeypatch):
+    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
+    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
+        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
+    })
+    agents_mock = AsyncMock(return_value={"message": "success", "data": []})
+    monkeypatch.setattr("apps.northbound_app.get_agent_info_list", agents_mock)
 
-        resp = client.post(
-            "/nb/v1/chat/attachments/upload",
-            files=files,
-            headers=_build_headers(),
-        )
+    resp = client.get("/nb/v1/agents", headers=_build_headers())
+    assert resp.status_code == 200
+    assert agents_mock.await_count == 1
 
-        assert resp.status_code == 500
 
+def test_list_conversations_calls_service(monkeypatch):
+    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
+    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
+        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
+    })
+    list_mock = AsyncMock(return_value={"message": "success", "data": []})
+    monkeypatch.setattr("apps.northbound_app.list_conversations", list_mock)
 
-# =============================================================================
-# Run Chat Tests
-# =============================================================================
+    resp = client.get("/nb/v1/conversations", headers=_build_headers())
+    assert resp.status_code == 200
+    assert list_mock.await_count == 1
+
+
+def test_update_title_sets_headers(monkeypatch):
+    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
+    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
+        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
+    })
+    # Ensure NorthboundContext yields plain string fields (avoid MagicMock in headers)
+    class _NCtx:
+        def __init__(self, request_id: str, tenant_id: str, user_id: str, authorization: str, token_id: int = 0):
+            self.request_id = request_id
+            self.tenant_id = tenant_id
+            self.user_id = user_id
+            self.authorization = authorization
+            self.token_id = token_id
+    monkeypatch.setattr("apps.northbound_app.NorthboundContext", _NCtx)
+    update_mock = AsyncMock(return_value={"message": "success", "data": "nb-4", "idempotency_key": "ide-xyz"})
+    monkeypatch.setattr("apps.northbound_app.update_conversation_title", update_mock)
+
+    headers = {**_build_headers(request_id="req-999"), "Idempotency-Key": "ide-xyz"}
+    resp = client.put("/nb/v1/conversations/123/title", params={"title": "New Title"}, headers=headers)
+    assert resp.status_code == 200
+    # Router wraps JSONResponse and should echo idempotency and request id
+    assert resp.headers.get("Idempotency-Key") == "ide-xyz"
+    assert resp.headers.get("X-Request-Id") == "req-999"
+    assert update_mock.await_count == 1
 
-def test_run_chat_success():
-    """Test successful chat run initiation."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.start_streaming_chat', new_callable=AsyncMock) as mock_run:
 
-        mock_ctx.return_value = MagicMock()
-        mock_run.return_value = {
-            "message": "Chat run initiated",
-            "request_id": "req-789",
-            "status": "initiated",
-        }
+def _std_headers(auth="Bearer test_jwt"):
+    return {
+        **_build_headers(auth=auth),
+        "Idempotency-Key": "idem-xyz",
+    }
 
-        resp = client.post(
-            "/nb/v1/chat/run",
-            json={
-                "agent_name": "general-assistant",
-                "query": "Hello, agent",
-            },
-            headers=_build_headers(),
-        )
 
-        assert resp.status_code == 200
+@pytest.mark.parametrize("exc_cls, status", [
+    (UnauthorizedError, 401),
+    (LimitExceededError, 429),
+    (SignatureValidationError, 401),
+])
+def test_run_chat_auth_exceptions_are_mapped(monkeypatch, exc_cls, status):
+    # Force Bearer token validation to raise domain exceptions
+    def _raise(*_, **__):
+        raise exc_cls("boom")
+
+    monkeypatch.setattr(
+        "apps.northbound_app.validate_bearer_token", _raise)
+    # Even if provided, auth should not be parsed because token validation fails first
+    resp = client.post(
+        "/nb/v1/chat/run",
+        json={"conversation_id": 1, "agent_name": "a", "query": "hi"},
+        headers=_std_headers(),
+    )
+    assert resp.status_code == status
+
+
+def test_run_chat_missing_authorization_header_returns_401(monkeypatch):
+    # When no Authorization header, validate_bearer_token returns (False, None)
+    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (False, None))
+    # No Authorization header
+    headers = {k: v for k, v in _std_headers().items() if k.lower()
+               != "authorization"}
+    resp = client.post(
+        "/nb/v1/chat/run",
+        json={"conversation_id": 1, "agent_name": "a", "query": "hi"},
+        headers=headers,
+    )
+    assert resp.status_code == 401
+    assert "bearer token" in resp.json()["detail"].lower()
 
 
-def test_run_chat_limit_exceeded():
-    """Test run chat returns 429 when limit exceeded."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.start_streaming_chat', new_callable=AsyncMock) as mock_run:
-
-        mock_ctx.return_value = MagicMock()
-        mock_run.side_effect = LimitExceededError("Rate limit exceeded")
-
-        resp = client.post(
-            "/nb/v1/chat/run",
-            json={
-                "agent_name": "general-assistant",
-                "query": "Hello",
-            },
-            headers=_build_headers(),
-        )
+def test_run_chat_jwt_parse_exception_returns_401(monkeypatch):
+    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
 
-        assert resp.status_code == 429
+    def _raise_user_lookup(_access_key):
+        raise Exception("user lookup error")
+    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", _raise_user_lookup)
 
+    resp = client.post(
+        "/nb/v1/chat/run",
+        json={"conversation_id": 1, "agent_name": "a", "query": "hi"},
+        headers=_std_headers(),
+    )
+    # When user lookup fails due to an invalid API key, return 401
+    assert resp.status_code == 401
+    assert "invalid api key" in resp.json()["detail"].lower()
 
-def test_run_chat_unauthorized():
-    """Test run chat returns 500 on unauthorized (broad exception handling)."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx:
-        mock_ctx.side_effect = UnauthorizedError("Invalid token")
 
-        resp = client.post(
-            "/nb/v1/chat/run",
-            json={
-                "agent_name": "general-assistant",
-                "query": "Hello",
-            },
-            headers=_build_headers(),
-        )
-
-        # The run_chat endpoint has broad exception handling, so unauthorized returns 500
-        assert resp.status_code == 500
-
-
-# =============================================================================
-# Stop Chat Tests
-# =============================================================================
-
-def test_stop_chat_success():
-    """Test successful chat stop."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.stop_chat', new_callable=AsyncMock) as mock_stop:
-
-        mock_ctx.return_value = MagicMock()
-        mock_stop.return_value = True
-
-        resp = client.get(
-            "/nb/v1/chat/stop/123",
-            headers=_build_headers(),
-        )
-
-        assert resp.status_code == 200
-
-
-# =============================================================================
-# Get Conversation Tests
-# =============================================================================
-
-def test_get_conversation_success():
-    """Test successful retrieval of conversation."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.get_conversation_history', new_callable=AsyncMock) as mock_get:
-
-        mock_ctx.return_value = MagicMock()
-        mock_get.return_value = {
-            "conversation_id": 123,
-            "history": [
-                {"role": "user", "content": "Hello"},
-                {"role": "assistant", "content": "Hi there!"},
-            ]
-        }
-
-        resp = client.get(
-            "/nb/v1/conversations/123",
-            headers=_build_headers(),
-        )
-
-        assert resp.status_code == 200
-        data = resp.json()
-        assert data["conversation_id"] == 123
-        assert len(data["history"]) == 2
-
-
-# =============================================================================
-# List Agents Tests
-# =============================================================================
-
-def test_list_agents_success():
-    """Test successful retrieval of agent list."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.get_agent_info_list', new_callable=AsyncMock) as mock_get:
-
-        mock_ctx.return_value = MagicMock()
-        mock_get.return_value = {
-            "agents": [
-                {"name": "agent1", "description": "First agent"},
-                {"name": "agent2", "description": "Second agent"},
-            ]
-        }
-
-        resp = client.get(
-            "/nb/v1/agents",
-            headers=_build_headers(),
-        )
-
-        assert resp.status_code == 200
-        data = resp.json()
-        assert len(data["agents"]) == 2
+def test_run_chat_jwt_missing_user_id_returns_400(monkeypatch):
+    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
+    monkeypatch.setattr(
+        "apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
+            "user_id": None, "tenant_id": "t1", "token_id": "t1"
+        })
 
+    resp = client.post(
+        "/nb/v1/chat/run",
+        json={"conversation_id": 1, "agent_name": "a", "query": "hi"},
+        headers=_std_headers(),
+    )
+    assert resp.status_code == 400
+    assert "user" in resp.json()["detail"].lower()
 
-# =============================================================================
-# List Conversations Tests
-# =============================================================================
 
-def test_list_conversations_success():
-    """Test successful retrieval of conversation list."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.list_conversations', new_callable=AsyncMock) as mock_list:
-
-        mock_ctx.return_value = MagicMock()
-        mock_list.return_value = {
-            "conversations": [
-                {"id": 1, "title": "Conversation 1"},
-                {"id": 2, "title": "Conversation 2"},
-            ]
-        }
+def test_run_chat_jwt_missing_tenant_id_returns_400(monkeypatch):
+    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
+    monkeypatch.setattr(
+        "apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
+            "user_id": "u1", "tenant_id": None, "token_id": "t1"
+        })
 
-        resp = client.get(
-            "/nb/v1/conversations",
-            headers=_build_headers(),
-        )
+    resp = client.post(
+        "/nb/v1/chat/run",
+        json={"conversation_id": 1, "agent_name": "a", "query": "hi"},
+        headers=_std_headers(),
+    )
+    assert resp.status_code == 400
+    assert "tenant" in resp.json()["detail"].lower()
 
-        assert resp.status_code == 200
-        data = resp.json()
-        assert len(data["conversations"]) == 2
-
-
-# =============================================================================
-# Update Conversation Title Tests
-# =============================================================================
-
-def test_update_conversation_title_success():
-    """Test successful update of conversation title."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.update_conversation_title', new_callable=AsyncMock) as mock_update:
 
-        mock_ctx.return_value = MagicMock()
-        mock_ctx.return_value.request_id = "req-123"
-        mock_update.return_value = {"idempotency_key": "idem-key", "conversation_id": 123, "title": "New Title"}
+def test_run_chat_internal_error_when_parsing_context_returns_401(monkeypatch):
+    def _raise(*_, **__):
+        raise Exception("unexpected")
+    monkeypatch.setattr(
+        "apps.northbound_app.validate_bearer_token", _raise)
 
-        resp = client.put(
-            "/nb/v1/conversations/123/title?title=New%20Title",
-            headers=_build_headers(),
-        )
-
-        assert resp.status_code == 200
-
-
-# =============================================================================
-# File Fetch Tests
-# =============================================================================
-
-def test_file_fetch_missing_url():
-    """Test file fetch returns 422 when URL is missing."""
-    resp = client.get(
-        "/nb/v1/file/fetch",
+    resp = client.post(
+        "/nb/v1/chat/run",
+        json={"conversation_id": 1, "agent_name": "a", "query": "hi"},
+        headers=_std_headers(),
+    )
+    # Any exception during validation returns 401
+    assert resp.status_code == 401
+
+
+def test_run_chat_unexpected_service_error_maps_500(monkeypatch):
+    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
+    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
+        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
+    })
+    start_mock = AsyncMock(side_effect=Exception("boom"))
+    monkeypatch.setattr("apps.northbound_app.start_streaming_chat", start_mock)
+
+    resp = client.post(
+        "/nb/v1/chat/run",
+        json={"conversation_id": 1, "agent_name": "a", "query": "hi"},
+        headers=_std_headers(),
+    )
+    assert resp.status_code == 500
+
+
+@pytest.mark.parametrize("path", [
+    "/nb/v1/chat/stop/123",
+    "/nb/v1/conversations/123",
+    "/nb/v1/agents",
+    "/nb/v1/conversations",
+])
+@pytest.mark.parametrize("exc_cls, status", [
+    (UnauthorizedError, 401),
+    (LimitExceededError, 429),
+    (SignatureValidationError, 401),
+])
+def test_other_endpoints_auth_exceptions_are_mapped(monkeypatch, path, exc_cls, status):
+    def _raise(*_, **__):
+        raise exc_cls("boom")
+    monkeypatch.setattr(
+        "apps.northbound_app.validate_bearer_token", _raise)
+
+    resp = client.get(path, headers=_build_headers())
+    assert resp.status_code == status
+
+
+@pytest.mark.parametrize(
+    "path, target",
+    [
+        ("/nb/v1/chat/stop/123", "apps.northbound_app.stop_chat"),
+        ("/nb/v1/conversations/123", "apps.northbound_app.get_conversation_history"),
+        ("/nb/v1/agents", "apps.northbound_app.get_agent_info_list"),
+        ("/nb/v1/conversations", "apps.northbound_app.list_conversations"),
+    ],
+)
+def test_other_endpoints_unexpected_service_error_maps_500(monkeypatch, path, target):
+    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
+    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
+        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
+    })
+    monkeypatch.setattr(target, AsyncMock(side_effect=Exception("boom")))
+
+    resp = client.get(path, headers=_build_headers())
+    assert resp.status_code == 500
+
+
+def test_update_title_unexpected_service_error_maps_500(monkeypatch):
+    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
+    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
+        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
+    })
+    monkeypatch.setattr("apps.northbound_app.update_conversation_title", AsyncMock(
+        side_effect=Exception("boom")))
+
+    resp = client.put(
+        "/nb/v1/conversations/123/title",
+        params={"title": "x"},
         headers=_build_headers(),
     )
+    assert resp.status_code == 500
+
+
+def test_run_chat_sets_headers_from_service_response(monkeypatch):
+    # Mock Bearer token and user lookup
+    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
+    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
+        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
+    })
+
+    # Ensure NorthboundContext yields plain string fields (avoid MagicMock in headers)
+    class _NCtx:
+        def __init__(self, request_id: str, tenant_id: str, user_id: str, authorization: str, token_id: int = 0):
+            self.request_id = request_id
+            self.tenant_id = tenant_id
+            self.user_id = user_id
+            self.authorization = authorization
+            self.token_id = token_id
+
+    monkeypatch.setattr("apps.northbound_app.NorthboundContext", _NCtx)
+
+    async def _gen():
+        yield b"data: ok\n\n"
+
+    async def _start(ctx, conversation_id, agent_name, query, meta_data=None, idempotency_key=None):
+        resp = StreamingResponse(_gen(), media_type="text/event-stream")
+        # Service attaches headers in latest logic; emulate here
+        resp.headers["X-Request-Id"] = ctx.request_id
+        resp.headers["conversation_id"] = str(conversation_id)
+        return resp
+
+    monkeypatch.setattr("apps.northbound_app.start_streaming_chat", _start)
+
+    headers = {**_std_headers(), "X-Request-Id": "rid-123"}
+    resp = client.post(
+        "/nb/v1/chat/run",
+        json={"conversation_id": 1,
+              "agent_name": "agent-a", "query": "hello"},
+        headers=headers,
+    )
 
-    # Missing required parameter returns 422
-    assert resp.status_code == 422
-
-
-# =============================================================================
-# Error Handling Tests
-# =============================================================================
-
-def test_invalid_request_body():
-    """Test that invalid request body returns 422."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx:
-        mock_ctx.return_value = MagicMock()
-
-        resp = client.post(
-            "/nb/v1/chat/run",
-            json={},  # Missing required fields
-            headers=_build_headers(),
-        )
-
-        # FastAPI returns 422 for validation errors
-        assert resp.status_code == 422
-
-
-def test_run_chat_with_conversation_id():
-    """Test run chat with existing conversation ID."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.start_streaming_chat', new_callable=AsyncMock) as mock_run:
-
-        mock_ctx.return_value = MagicMock()
-        mock_run.return_value = {
-            "message": "Chat run continued",
-            "request_id": "req-456",
-            "status": "continued",
-        }
-
-        resp = client.post(
-            "/nb/v1/chat/run",
-            json={
-                "agent_name": "general-assistant",
-                "query": "Hello again",
-                "conversation_id": 123,
-            },
-            headers=_build_headers(),
-        )
-
-        assert resp.status_code == 200
-
-
-def test_run_chat_with_attachments():
-    """Test run chat with file attachments."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.start_streaming_chat', new_callable=AsyncMock) as mock_run:
-
-        mock_ctx.return_value = MagicMock()
-        mock_run.return_value = {
-            "message": "Chat run with attachments",
-            "request_id": "req-789",
-            "status": "initiated",
-        }
-
-        resp = client.post(
-            "/nb/v1/chat/run",
-            json={
-                "agent_name": "general-assistant",
-                "query": "Summarize the attached report",
-                "attachments": ["s3://nexent/attachments/file.pdf"],
-            },
-            headers=_build_headers(),
-        )
-
-        assert resp.status_code == 200
-
-
-def test_run_chat_with_tool_params():
-    """Test run chat with tool parameter overrides."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.start_streaming_chat', new_callable=AsyncMock) as mock_run:
-
-        mock_ctx.return_value = MagicMock()
-        mock_run.return_value = {
-            "message": "Chat run with tool params",
-            "request_id": "req-101",
-            "status": "initiated",
-        }
-
-        resp = client.post(
-            "/nb/v1/chat/run",
-            json={
-                "agent_name": "general-assistant",
-                "query": "Search the knowledge base",
-                "tool_params": {
-                    "agents": {
-                        "general-assistant": {
-                            "tools": {
-                                "knowledge_base_search": {
-                                    "top_k": 5,
-                                }
-                            }
-                        }
-                    }
-                },
-            },
-            headers=_build_headers(),
-        )
-
-        assert resp.status_code == 200
-
-
-def test_run_chat_permission_error():
-    """Test run chat returns 403 when permission denied."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.start_streaming_chat', new_callable=AsyncMock) as mock_run:
-
-        mock_ctx.return_value = MagicMock()
-        mock_run.side_effect = PermissionError("Access denied")
-
-        resp = client.post(
-            "/nb/v1/chat/run",
-            json={
-                "agent_name": "general-assistant",
-                "query": "Hello",
-            },
-            headers=_build_headers(),
-        )
-
-        assert resp.status_code == 403
-
-
-def test_run_chat_internal_error():
-    """Test run chat returns 500 on internal error."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.start_streaming_chat', new_callable=AsyncMock) as mock_run:
-
-        mock_ctx.return_value = MagicMock()
-        mock_run.side_effect = Exception("Unexpected error")
-
-        resp = client.post(
-            "/nb/v1/chat/run",
-            json={
-                "agent_name": "general-assistant",
-                "query": "Hello",
-            },
-            headers=_build_headers(),
-        )
-
-        assert resp.status_code == 500
-
-
-def test_run_chat_value_error():
-    """Test run chat returns 400 on value error."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.start_streaming_chat', new_callable=AsyncMock) as mock_run:
-
-        mock_ctx.return_value = MagicMock()
-        mock_run.side_effect = ValueError("Invalid agent name")
-
-        resp = client.post(
-            "/nb/v1/chat/run",
-            json={
-                "agent_name": "general-assistant",
-                "query": "Hello",
-            },
-            headers=_build_headers(),
-        )
-
-        assert resp.status_code == 400
-
-
-# =============================================================================
-# Stop Chat Error Tests
-# =============================================================================
-
-def test_stop_chat_limit_exceeded():
-    """Test stop chat returns 429 when limit exceeded."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.stop_chat', new_callable=AsyncMock) as mock_stop:
-
-        mock_ctx.return_value = MagicMock()
-        mock_stop.side_effect = LimitExceededError("Rate limit exceeded")
-
-        resp = client.get(
-            "/nb/v1/chat/stop/123",
-            headers=_build_headers(),
-        )
-
-        assert resp.status_code == 429
-
-
-def test_stop_chat_internal_error():
-    """Test stop chat returns 500 on internal error."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.stop_chat', new_callable=AsyncMock) as mock_stop:
-
-        mock_ctx.return_value = MagicMock()
-        mock_stop.side_effect = Exception("Unexpected error")
-
-        resp = client.get(
-            "/nb/v1/chat/stop/123",
-            headers=_build_headers(),
-        )
-
-        assert resp.status_code == 500
-
-
-# =============================================================================
-# Get Conversation Error Tests
-# =============================================================================
-
-def test_get_conversation_limit_exceeded():
-    """Test get conversation returns 429 when limit exceeded."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.get_conversation_history', new_callable=AsyncMock) as mock_get:
-
-        mock_ctx.return_value = MagicMock()
-        mock_get.side_effect = LimitExceededError("Rate limit exceeded")
-
-        resp = client.get(
-            "/nb/v1/conversations/123",
-            headers=_build_headers(),
-        )
-
-        assert resp.status_code == 429
-
-
-def test_get_conversation_internal_error():
-    """Test get conversation returns 500 on internal error."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.get_conversation_history', new_callable=AsyncMock) as mock_get:
-
-        mock_ctx.return_value = MagicMock()
-        mock_get.side_effect = Exception("Unexpected error")
-
-        resp = client.get(
-            "/nb/v1/conversations/123",
-            headers=_build_headers(),
-        )
-
-        assert resp.status_code == 500
-
-
-# =============================================================================
-# List Agents Error Tests
-# =============================================================================
-
-def test_list_agents_limit_exceeded():
-    """Test list agents returns 429 when limit exceeded."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.get_agent_info_list', new_callable=AsyncMock) as mock_get:
-
-        mock_ctx.return_value = MagicMock()
-        mock_get.side_effect = LimitExceededError("Rate limit exceeded")
-
-        resp = client.get(
-            "/nb/v1/agents",
-            headers=_build_headers(),
-        )
-
-        assert resp.status_code == 429
-
-
-def test_list_agents_internal_error():
-    """Test list agents returns 500 on internal error."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.get_agent_info_list', new_callable=AsyncMock) as mock_get:
-
-        mock_ctx.return_value = MagicMock()
-        mock_get.side_effect = Exception("Unexpected error")
-
-        resp = client.get(
-            "/nb/v1/agents",
-            headers=_build_headers(),
-        )
-
-        assert resp.status_code == 500
-
-
-# =============================================================================
-# List Conversations Error Tests
-# =============================================================================
-
-def test_list_conversations_limit_exceeded():
-    """Test list conversations returns 429 when limit exceeded."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.list_conversations', new_callable=AsyncMock) as mock_list:
-
-        mock_ctx.return_value = MagicMock()
-        mock_list.side_effect = LimitExceededError("Rate limit exceeded")
-
-        resp = client.get(
-            "/nb/v1/conversations",
-            headers=_build_headers(),
-        )
-
-        assert resp.status_code == 429
-
-
-def test_list_conversations_internal_error():
-    """Test list conversations returns 500 on internal error."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.list_conversations', new_callable=AsyncMock) as mock_list:
-
-        mock_ctx.return_value = MagicMock()
-        mock_list.side_effect = Exception("Unexpected error")
-
-        resp = client.get(
-            "/nb/v1/conversations",
-            headers=_build_headers(),
-        )
-
-        assert resp.status_code == 500
-
-
-# =============================================================================
-# Update Conversation Title Error Tests
-# =============================================================================
-
-def test_update_conversation_title_limit_exceeded():
-    """Test update conversation title returns 429 when limit exceeded."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.update_conversation_title', new_callable=AsyncMock) as mock_update:
-
-        mock_ctx.return_value = MagicMock()
-        mock_ctx.return_value.request_id = "req-123"
-        mock_update.side_effect = LimitExceededError("Rate limit exceeded")
-
-        resp = client.put(
-            "/nb/v1/conversations/123/title?title=New%20Title",
-            headers=_build_headers(),
-        )
-
-        assert resp.status_code == 429
+    assert resp.status_code == 200
+    assert resp.headers.get("X-Request-Id") == "rid-123"
+    assert resp.headers.get("conversation_id") == "1"
 
 
-def test_update_conversation_title_not_found():
-    """Test update conversation title returns 404 when conversation not found."""
-    from consts.exceptions import ConversationNotFoundError
+def test_run_chat_service_error_maps_500(monkeypatch):
+    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
+    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
+        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
+    })
 
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.update_conversation_title', new_callable=AsyncMock) as mock_update:
+    async def _raise(*args, **kwargs):
+        raise Exception("Failed to persist user message: boom")
 
-        mock_ctx.return_value = MagicMock()
-        mock_ctx.return_value.request_id = "req-123"
-        mock_update.side_effect = ConversationNotFoundError("Conversation not found")
+    monkeypatch.setattr("apps.northbound_app.start_streaming_chat", _raise)
 
-        resp = client.put(
-            "/nb/v1/conversations/999/title?title=New%20Title",
-            headers=_build_headers(),
-        )
+    resp = client.post(
+        "/nb/v1/chat/run",
+        json={"conversation_id": 1,
+              "agent_name": "agent-a", "query": "hello"},
+        headers=_std_headers(),
+    )
 
-        assert resp.status_code == 404
+    assert resp.status_code == 500
 
 
-def test_update_conversation_title_internal_error():
-    """Test update conversation title returns 500 on internal error."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.update_conversation_title', new_callable=AsyncMock) as mock_update:
+# --- Tests for /file/fetch endpoint ---
 
-        mock_ctx.return_value = MagicMock()
-        mock_ctx.return_value.request_id = "req-123"
-        mock_update.side_effect = Exception("Unexpected error")
+def test_fetch_file_missing_presigned_url():
+    """Missing presigned_url parameter returns 422 (FastAPI validation)."""
+    resp = client.get("/nb/v1/file/fetch")
+    assert resp.status_code == 422
 
-        resp = client.put(
-            "/nb/v1/conversations/123/title?title=New%20Title",
-            headers=_build_headers(),
-        )
 
-        assert resp.status_code == 500
+def test_fetch_file_invalid_url_scheme(monkeypatch):
+    """URL scheme other than http/https returns 400."""
+    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
+    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
+        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
+    })
 
+    resp = client.get(
+        "/nb/v1/file/fetch",
+        params={"presigned_url": "ftp://example.com/file"},
+        headers=_build_headers(),
+    )
+    assert resp.status_code == 400
+    assert "Invalid URL scheme" in resp.json()["detail"]
+
+
+def test_fetch_file_success(monkeypatch):
+    """Valid presigned_url: proxies file content as StreamingResponse."""
+    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
+    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
+        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
+    })
+
+    import httpx
+    mock_response = MagicMock()
+    mock_response.status_code = 200
+    mock_response.headers = {
+        "Content-Type": "application/pdf",
+        "Content-Disposition": 'attachment; filename="report.pdf"',
+    }
+    mock_response.aiter_bytes = MagicMock(return_value=iter([b"PDF content here"]))
 
-def test_update_conversation_title_with_meta_data():
-    """Test update conversation title with metadata."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.update_conversation_title', new_callable=AsyncMock) as mock_update:
+    mock_client = MagicMock()
+    mock_client.get = AsyncMock(return_value=mock_response)
+    mock_client.__aenter__ = AsyncMock(return_value=mock_client)
+    mock_client.__aexit__ = AsyncMock(return_value=None)
 
-        mock_ctx.return_value = MagicMock()
-        mock_ctx.return_value.request_id = "req-123"
-        mock_update.return_value = {"idempotency_key": "idem-key", "conversation_id": 123}
+    monkeypatch.setattr("httpx.AsyncClient", lambda **kwargs: mock_client)
 
-        resp = client.put(
-            "/nb/v1/conversations/123/title?title=New%20Title&meta_data=%7B%22source%22%3A%22test%22%7D",
-            headers=_build_headers(),
-        )
+    resp = client.get(
+        "/nb/v1/file/fetch",
+        params={"presigned_url": "http://minio:9000/bucket/file.pdf"},
+        headers=_build_headers(),
+    )
 
-        assert resp.status_code == 200
+    assert resp.status_code == 200
+    assert resp.headers["content-type"] == "application/pdf"
+    assert "report.pdf" in resp.headers["content-disposition"]
 
 
-def test_update_conversation_title_with_idempotency_key():
-    """Test update conversation title with idempotency key."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.update_conversation_title', new_callable=AsyncMock) as mock_update:
+def test_fetch_file_non_200_returns_502(monkeypatch):
+    """MinIO returns non-200: maps to 502 Bad Gateway."""
+    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
+    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
+        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
+    })
 
-        mock_ctx.return_value = MagicMock()
-        mock_ctx.return_value.request_id = "req-123"
-        mock_update.return_value = {"idempotency_key": "my-key", "conversation_id": 123}
+    mock_response = MagicMock()
+    mock_response.status_code = 403
+    mock_response.headers = {}
 
-        resp = client.put(
-            "/nb/v1/conversations/123/title?title=New%20Title",
-            headers={**_build_headers(), "Idempotency-Key": "my-key"},
-        )
+    mock_client = MagicMock()
+    mock_client.get = AsyncMock(return_value=mock_response)
+    mock_client.__aenter__ = AsyncMock(return_value=mock_client)
+    mock_client.__aexit__ = AsyncMock(return_value=None)
 
-        assert resp.status_code == 200
+    monkeypatch.setattr("httpx.AsyncClient", lambda **kwargs: mock_client)
 
+    resp = client.get(
+        "/nb/v1/file/fetch",
+        params={"presigned_url": "http://minio:9000/bucket/file.pdf"},
+        headers=_build_headers(),
+    )
 
-# =============================================================================
-# Upload Attachments Error Tests
-# =============================================================================
+    assert resp.status_code == 502
+    assert "Failed to fetch file from storage" in resp.json()["detail"]
 
-def test_upload_chat_attachments_value_error():
-    """Test upload returns 400 on value error."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.upload_files_for_northbound', new_callable=AsyncMock) as mock_upload:
 
-        mock_ctx.return_value = MagicMock()
-        mock_upload.side_effect = ValueError("Invalid file")
+def test_fetch_file_timeout_returns_504(monkeypatch):
+    """httpx.TimeoutException: maps to 504 Gateway Timeout."""
+    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
+    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
+        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
+    })
 
-        file_content = b"test file content"
-        files = {"files": ("test.pdf", BytesIO(file_content), "application/pdf")}
+    import httpx
+    mock_client = MagicMock()
+    mock_client.get = AsyncMock(side_effect=httpx.TimeoutException("Connection timed out"))
+    mock_client.__aenter__ = AsyncMock(return_value=mock_client)
+    mock_client.__aexit__ = AsyncMock(return_value=None)
 
-        resp = client.post(
-            "/nb/v1/chat/attachments/upload",
-            files=files,
-            headers=_build_headers(),
-        )
+    monkeypatch.setattr("httpx.AsyncClient", lambda **kwargs: mock_client)
 
-        assert resp.status_code == 400
+    resp = client.get(
+        "/nb/v1/file/fetch",
+        params={"presigned_url": "http://minio:9000/bucket/file.pdf"},
+        headers=_build_headers(),
+    )
 
+    assert resp.status_code == 504
+    assert "Timeout" in resp.json()["detail"]
 
-def test_upload_chat_attachments_permission_error():
-    """Test upload returns 403 on permission error."""
-    with patch('apps.northbound_app._get_northbound_context', new_callable=AsyncMock) as mock_ctx, \
-            patch('apps.northbound_app.upload_files_for_northbound', new_callable=AsyncMock) as mock_upload:
 
-        mock_ctx.return_value = MagicMock()
-        mock_upload.side_effect = PermissionError("Access denied")
+def test_fetch_file_request_error_returns_502(monkeypatch):
+    """httpx.RequestError: maps to 502 Bad Gateway."""
+    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
+    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
+        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
+    })
 
-        file_content = b"test file content"
-        files = {"files": ("test.pdf", BytesIO(file_content), "application/pdf")}
+    import httpx
+    mock_client = MagicMock()
+    mock_client.get = AsyncMock(side_effect=httpx.RequestError("Connection refused", request=MagicMock()))
+    mock_client.__aenter__ = AsyncMock(return_value=mock_client)
+    mock_client.__aexit__ = AsyncMock(return_value=None)
 
-        resp = client.post(
-            "/nb/v1/chat/attachments/upload",
-            files=files,
-            headers=_build_headers(),
-        )
+    monkeypatch.setattr("httpx.AsyncClient", lambda **kwargs: mock_client)
 
-        assert resp.status_code == 403
+    resp = client.get(
+        "/nb/v1/file/fetch",
+        params={"presigned_url": "http://minio:9000/bucket/file.pdf"},
+        headers=_build_headers(),
+    )
 
+    assert resp.status_code == 502
+    assert "Failed to fetch file from storage" in resp.json()["detail"]
 
-if __name__ == "__main__":
-    pytest.main([__file__, "-v"])
 
+def test_fetch_file_unexpected_error_returns_500(monkeypatch):
+    """Unexpected exception: maps to 500 Internal Server Error."""
+    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", lambda auth: (True, {"token_id": "t1"}))
+    monkeypatch.setattr("apps.northbound_app.get_user_and_tenant_by_access_key", lambda access_key: {
+        "user_id": "u1", "tenant_id": "t1", "token_id": "t1"
+    })
 
-# =============================================================================
-# Helper Function Tests
-# =============================================================================
+    mock_client = MagicMock()
+    mock_client.get = AsyncMock(side_effect=RuntimeError("unexpected failure"))
+    mock_client.__aenter__ = AsyncMock(return_value=mock_client)
+    mock_client.__aexit__ = AsyncMock(return_value=None)
 
-def test_resolve_proxy_download_filename_with_rfc598_filename():
-    """Test filename resolution with RFC 598 filename."""
-    from apps.northbound_app import _resolve_proxy_download_filename
+    monkeypatch.setattr("httpx.AsyncClient", lambda **kwargs: mock_client)
 
-    result = _resolve_proxy_download_filename(
-        "https://example.com/path/file.pdf",
-        'filename="report.pdf"'
+    resp = client.get(
+        "/nb/v1/file/fetch",
+        params={"presigned_url": "http://minio:9000/bucket/file.pdf"},
+        headers=_build_headers(),
     )
-    assert result == "report.pdf"
 
+    assert resp.status_code == 500
+    assert "Internal server error" in resp.json()["detail"]
 
-def test_resolve_proxy_download_filename_with_rfc598_star_filename():
-    """Test filename resolution with RFC 598 star filename."""
-    from apps.northbound_app import _resolve_proxy_download_filename
 
-    result = _resolve_proxy_download_filename(
-        "https://example.com/path/file.pdf",
-        "filename*=UTF-8''report%20final.pdf"
-    )
-    assert result == "report final.pdf"
+def test_fetch_file_no_auth_required(monkeypatch):
+    """Endpoint requires no authentication (NOTE: No authentication required)."""
+    auth_called = []
 
+    def _track_auth(auth):
+        auth_called.append(auth)
+        return (True, {"token_id": "t1"})
 
-def test_resolve_proxy_download_filename_from_url():
-    """Test filename resolution from URL when no content-disposition."""
-    from apps.northbound_app import _resolve_proxy_download_filename
+    monkeypatch.setattr("apps.northbound_app.validate_bearer_token", _track_auth)
 
-    result = _resolve_proxy_download_filename(
-        "https://example.com/path/to/document.pdf",
-        ""
-    )
-    assert result == "document.pdf"
+    mock_response = MagicMock()
+    mock_response.status_code = 200
+    mock_response.headers = {"Content-Type": "text/plain"}
+    mock_response.aiter_bytes = MagicMock(return_value=iter([b"hello"]))
 
+    mock_client = MagicMock()
+    mock_client.get = AsyncMock(return_value=mock_response)
+    mock_client.__aenter__ = AsyncMock(return_value=mock_client)
+    mock_client.__aexit__ = AsyncMock(return_value=None)
 
-def test_resolve_proxy_download_filename_no_filename_in_url():
-    """Test filename resolution returns 'download' when no filename in URL."""
-    from apps.northbound_app import _resolve_proxy_download_filename
+    monkeypatch.setattr("httpx.AsyncClient", lambda **kwargs: mock_client)
 
-    result = _resolve_proxy_download_filename(
-        "https://example.com/path/",
-        ""
+    # No headers at all - should still work because auth is not checked
+    resp = client.get(
+        "/nb/v1/file/fetch",
+        params={"presigned_url": "http://minio:9000/bucket/file.pdf"},
     )
-    assert result == "download"
 
-
-def test_resolve_proxy_download_filename_empty_content_disposition():
-    """Test filename resolution with empty content-disposition."""
-    from apps.northbound_app import _resolve_proxy_download_filename
-
-    result = _resolve_proxy_download_filename(
-        "https://example.com/path/file.pdf",
-        None
-    )
-    assert result == "file.pdf"
+    assert resp.status_code == 200
diff --git a/test/backend/app/test_northbound_base_app.py b/test/backend/app/test_northbound_base_app.py
index 9ab9a3d11..4f58b3062 100644
--- a/test/backend/app/test_northbound_base_app.py
+++ b/test/backend/app/test_northbound_base_app.py
@@ -274,17 +274,17 @@ def test_cors_middleware_configuration(self):
 
     def test_router_inclusion(self):
         """The main northbound router should be included."""
-        paths = app.openapi()["paths"]
-        self.assertIn("/dummy", paths)
+        routes = [route.path for route in app.routes]
+        self.assertIn("/dummy", routes)
 
     def test_a2a_router_inclusion(self):
         """A2A router should be registered under /nb/a2a."""
-        paths = app.openapi()["paths"]
-        self.assertIn("/nb/a2a/{endpoint_id}/.well-known/agent-card.json", paths)
-        self.assertIn("/nb/a2a/{endpoint_id}/v1", paths)
-        self.assertIn("/nb/a2a/{endpoint_id}/message:send", paths)
-        self.assertIn("/nb/a2a/{endpoint_id}/message:stream", paths)
-        self.assertIn("/nb/a2a/{endpoint_id}/tasks/{task_id}", paths)
+        routes = [route.path for route in app.routes]
+        self.assertIn("/nb/a2a/{endpoint_id}/.well-known/agent-card.json", routes)
+        self.assertIn("/nb/a2a/{endpoint_id}/v1", routes)
+        self.assertIn("/nb/a2a/{endpoint_id}/message:send", routes)
+        self.assertIn("/nb/a2a/{endpoint_id}/message:stream", routes)
+        self.assertIn("/nb/a2a/{endpoint_id}/tasks/{task_id}", routes)
 
     # -------------------------------------------------------------------
     # Exception handlers - delegated to app_factory which calls register_exception_handlers
diff --git a/test/backend/app/test_northbound_knowledge_app.py b/test/backend/app/test_northbound_knowledge_app.py
index e39abdf19..54d11b4c5 100644
--- a/test/backend/app/test_northbound_knowledge_app.py
+++ b/test/backend/app/test_northbound_knowledge_app.py
@@ -57,15 +57,6 @@ class _ElasticSearchServiceStub:
     def list_indices(*args, **kwargs):
         return {"indices": ["kb1"]}
 
-    @staticmethod
-    async def delete_document_by_scope(index_name, path_or_url, scope, vdb_core):
-        return {
-            "status": "success",
-            "message": "Documents deleted successfully",
-            "scope": scope,
-            "deleted_es_count": 1,
-        }
-
     @staticmethod
     def delete_documents(index_name, path_or_url, vdb_core):
         return {"message": "Documents deleted successfully", "deleted": 1}
@@ -247,10 +238,7 @@ def test_redis_cleanup_failure_still_returns_200(self, client, mock_northbound_c
 
         response = client.delete(
             "/nb/v1/knowledge/indices/kb1/documents",
-            params={
-                "path_or_url": "minio://path/doc.pdf",
-                "scope": "full",
-            },
+            params={"path_or_url": "minio://path/doc.pdf"},
         )
 
         assert response.status_code == 200
diff --git a/test/backend/app/test_prompt_app.py b/test/backend/app/test_prompt_app.py
index 722b0f4d2..40d88e0e2 100644
--- a/test/backend/app/test_prompt_app.py
+++ b/test/backend/app/test_prompt_app.py
@@ -8,19 +8,6 @@
 backend_dir = os.path.abspath(os.path.join(os.path.dirname(__file__), "../../../backend"))
 sys.path.insert(0, backend_dir)
 
-prompt_service_stub = type(sys)("services.prompt_service")
-prompt_service_stub.gen_system_prompt_streamable = MagicMock()
-prompt_service_stub.OptimizeRequest = type("OptimizeRequest", (), {"__init__": lambda self, **kwargs: self.__dict__.update(kwargs)})
-prompt_service_stub.OptimizeResult = type("OptimizeResult", (), {})
-prompt_service_stub.PromptOptimizationService = MagicMock()
-sys.modules["services.prompt_service"] = prompt_service_stub
-sys.modules["backend.services.prompt_service"] = prompt_service_stub
-
-auth_utils_stub = type(sys)("utils.auth_utils")
-auth_utils_stub.get_current_user_info = MagicMock()
-sys.modules["utils.auth_utils"] = auth_utils_stub
-sys.modules["backend.utils.auth_utils"] = auth_utils_stub
-
 from apps.prompt_app import router
 
 
@@ -30,21 +17,18 @@
 
 
 @patch("apps.prompt_app.get_current_user_info")
-@patch("apps.prompt_app.PromptOptimizationService")
-def test_optimize_prompt_section_api_success(mock_service_cls, mock_get_current_user_info):
-    """Test /prompt/optimize returns optimized content with X-Prompt-Source header"""
+@patch("apps.prompt_app.optimize_prompt_section_impl")
+def test_optimize_prompt_section_api_success(
+    mock_optimize_prompt_section,
+    mock_get_current_user_info,
+):
     mock_get_current_user_info.return_value = ("user-1", "tenant-1", "en")
-
-    mock_result = MagicMock()
-    mock_result.optimized_content = "Optimized"
-    mock_result.source = "nexent"
-    mock_result.section_type = "duty"
-    mock_result.section_title = "Agent Role"
-    mock_result.original_content = "Original"
-
-    mock_svc_instance = MagicMock()
-    mock_svc_instance.optimize.return_value = mock_result
-    mock_service_cls.return_value = mock_svc_instance
+    mock_optimize_prompt_section.return_value = {
+        "section_type": "duty",
+        "section_title": "Agent Role",
+        "original_content": "Original",
+        "optimized_content": "Optimized",
+    }
 
     response = client.post(
         "/prompt/optimize",
@@ -64,165 +48,20 @@ def test_optimize_prompt_section_api_success(mock_service_cls, mock_get_current_
     )
 
     assert response.status_code == 200
-    data = response.json()
-    assert data["message"] == "Success"
-    assert data["data"]["optimized_content"] == "Optimized"
-    assert data["data"]["section_type"] == "duty"
-    assert data["data"]["section_title"] == "Agent Role"
-    assert data["data"]["original_content"] == "Original"
+    assert response.json()["message"] == "Prompt section optimized successfully"
+    assert response.json()["data"]["optimized_content"] == "Optimized"
     mock_get_current_user_info.assert_called_once()
-    mock_svc_instance.optimize.assert_called_once()
-
-
-@patch("apps.prompt_app.get_current_user_info")
-@patch("apps.prompt_app.PromptOptimizationService")
-def test_optimize_prompt_section_api_with_mode(mock_service_cls, mock_get_current_user_info):
-    """Test /prompt/optimize accepts mode/start_pos/end_pos parameters"""
-    mock_get_current_user_info.return_value = ("user-1", "tenant-1", "zh")
-
-    mock_result = MagicMock()
-    mock_result.optimized_content = "Inserted content"
-    mock_result.source = "jiuwen"
-    mock_result.section_type = "duty"
-    mock_result.section_title = "智能体角色"
-    mock_result.original_content = "Old content"
-
-    mock_svc_instance = MagicMock()
-    mock_svc_instance.optimize.return_value = mock_result
-    mock_service_cls.return_value = mock_svc_instance
-
-    response = client.post(
-        "/prompt/optimize",
-        json={
-            "task_description": "Test insert",
-            "agent_id": 5,
-            "model_id": 3,
-            "section_type": "duty",
-            "section_title": "智能体角色",
-            "current_content": "Old content",
-            "feedback": "Insert more detail",
-            "mode": "insert",
-            "start_pos": 10,
-            "end_pos": 20,
-        },
-        headers={"Authorization": "Bearer token"},
-    )
-
-    assert response.status_code == 200
-    call_args = mock_svc_instance.optimize.call_args
-    assert call_args[0][0].mode == "insert"
-    assert call_args[0][0].start_pos == 10
-    assert call_args[0][0].end_pos == 20
-
-
-@patch("apps.prompt_app.get_current_user_info")
-@patch("apps.prompt_app.PromptOptimizationService")
-def test_optimize_prompt_section_api_nexent_capability_error(mock_service_cls, mock_get_current_user_info):
-    """Test /prompt/optimize returns 400 when NexentCapabilityError is raised"""
-    mock_get_current_user_info.return_value = ("user-1", "tenant-1", "en")
-
-    from adapters.exception import NexentCapabilityError
-    mock_svc_instance = MagicMock()
-    mock_svc_instance.optimize.side_effect = NexentCapabilityError(
-        "nexent 原生模式只支持 general 模式，当前请求 mode=insert 不支持"
+    mock_optimize_prompt_section.assert_called_once_with(
+        agent_id=1,
+        model_id=2,
+        task_description="Build an agent",
+        tenant_id="tenant-1",
+        language="en",
+        section_type="duty",
+        section_title="Agent Role",
+        current_content="Original",
+        feedback="Make it clearer",
+        tool_ids=[10],
+        sub_agent_ids=[20],
+        knowledge_base_display_names=["kb-a"],
     )
-    mock_service_cls.return_value = mock_svc_instance
-
-    response = client.post(
-        "/prompt/optimize",
-        json={
-            "task_description": "Build an agent",
-            "agent_id": 1,
-            "model_id": 2,
-            "section_type": "duty",
-            "section_title": "Agent Role",
-            "current_content": "Original",
-            "feedback": "Make it clearer",
-            "mode": "insert",
-        },
-        headers={"Authorization": "Bearer token"},
-    )
-
-    assert response.status_code == 400
-    data = response.json()
-    assert "general" in data["message"]
-
-
-@patch("apps.prompt_app.get_current_user_info")
-@patch("apps.prompt_app.PromptOptimizationService")
-def test_optimize_badcase_api_success(mock_service_cls, mock_get_current_user_info):
-    """Test /prompt/optimize/badcase returns optimized content with X-Prompt-Source header"""
-    mock_get_current_user_info.return_value = ("user-1", "tenant-1", "zh")
-
-    mock_result = MagicMock()
-    mock_result.optimized_content = "Fixed based on bad cases"
-    mock_result.source = "jiuwen"
-    mock_result.section_type = "duty"
-    mock_result.section_title = "智能体角色"
-    mock_result.original_content = "Old content"
-
-    mock_svc_instance = MagicMock()
-    mock_svc_instance.optimize_badcase.return_value = mock_result
-    mock_service_cls.return_value = mock_svc_instance
-
-    response = client.post(
-        "/prompt/optimize/badcase",
-        json={
-            "agent_id": 1,
-            "model_id": 2,
-            "current_content": "Old content",
-            "bad_cases": [
-                {
-                    "question": "用户问如何退款",
-                    "answer": "请联系客服",
-                    "label": "退款问题",
-                    "reason": "没有给出具体操作步骤",
-                }
-            ],
-            "section_type": "duty",
-            "section_title": "智能体角色",
-            "tool_ids": [10],
-            "sub_agent_ids": [],
-            "knowledge_base_display_names": [],
-        },
-        headers={"Authorization": "Bearer token"},
-    )
-
-    assert response.status_code == 200
-    data = response.json()
-    assert data["message"] == "Success"
-    assert data["data"]["optimized_content"] == "Fixed based on bad cases"
-    mock_svc_instance.optimize_badcase.assert_called_once()
-
-
-@patch("apps.prompt_app.get_current_user_info")
-@patch("apps.prompt_app.PromptOptimizationService")
-def test_optimize_badcase_api_nexent_capability_error(mock_service_cls, mock_get_current_user_info):
-    """Test /prompt/optimize/badcase returns 400 when NexentCapabilityError is raised"""
-    mock_get_current_user_info.return_value = ("user-1", "tenant-1", "zh")
-
-    from adapters.exception import NexentCapabilityError
-    mock_svc_instance = MagicMock()
-    mock_svc_instance.optimize_badcase.side_effect = NexentCapabilityError(
-        "nexent 原生模式不支持 badcase 优化"
-    )
-    mock_service_cls.return_value = mock_svc_instance
-
-    response = client.post(
-        "/prompt/optimize/badcase",
-        json={
-            "agent_id": 1,
-            "model_id": 2,
-            "current_content": "Old content",
-            "bad_cases": [
-                {"question": "Q1", "answer": "A1"}
-            ],
-            "section_type": "duty",
-            "section_title": "智能体角色",
-        },
-        headers={"Authorization": "Bearer token"},
-    )
-
-    assert response.status_code == 400
-    data = response.json()
-    assert "badcase" in data["message"]
diff --git a/test/backend/app/test_prompt_template_app.py b/test/backend/app/test_prompt_template_app.py
index d54b13412..8cd78cf1d 100644
--- a/test/backend/app/test_prompt_template_app.py
+++ b/test/backend/app/test_prompt_template_app.py
@@ -5,7 +5,6 @@
 from http import HTTPStatus
 
 import pytest
-from pydantic import BaseModel
 
 
 BACKEND_PATH = os.path.abspath(
@@ -19,7 +18,6 @@ def _reset_prompt_template_app_modules():
     sys.modules.pop("apps.prompt_template_app", None)
     sys.modules.pop("services.prompt_template_service", None)
     sys.modules.pop("utils.auth_utils", None)
-    sys.modules.pop("consts.model", None)
 
 
 @pytest.fixture
@@ -38,17 +36,6 @@ def prompt_template_app_module(monkeypatch):
         setattr(service_module, name, lambda *args, **kwargs: None)
     monkeypatch.setitem(sys.modules, "services.prompt_template_service", service_module)
 
-    class PromptTemplateRequest(BaseModel):
-        template_name: str
-        description: str
-        template_type: str
-        template_content_zh: dict
-        template_content_en: dict
-
-    consts_model_module = types.ModuleType("consts.model")
-    consts_model_module.PromptTemplateRequest = PromptTemplateRequest
-    monkeypatch.setitem(sys.modules, "consts.model", consts_model_module)
-
     auth_module = types.ModuleType("utils.auth_utils")
     auth_module.get_current_user_id = lambda authorization: ("user-1", "tenant-1")
     monkeypatch.setitem(sys.modules, "utils.auth_utils", auth_module)
diff --git a/test/backend/app/test_tool_config_app.py b/test/backend/app/test_tool_config_app.py
index 3633b9378..31da4b761 100644
--- a/test/backend/app/test_tool_config_app.py
+++ b/test/backend/app/test_tool_config_app.py
@@ -533,60 +533,6 @@ def test_import_openapi_service_success(
             tenant_id="tenant456",
             user_id="user123",
             service_description="Test API",
-            headers_template=None,
-            force_update=False
-        )
-        mock_refresh_mcp.assert_called_once_with("tenant456")
-
-    @patch('apps.tool_config_app._refresh_openapi_services_in_mcp')
-    @patch('apps.tool_config_app.get_current_user_id')
-    @patch('apps.tool_config_app.import_openapi_service')
-    def test_import_openapi_service_success_with_headers_template(
-        self, mock_import_service, mock_get_user_id, mock_refresh_mcp
-    ):
-        """Test successful OpenAPI service import with headers template"""
-        mock_get_user_id.return_value = ("user123", "tenant456")
-        mock_import_service.return_value = {
-            "tools_created": 1,
-            "tools_updated": 0,
-            "tools_deleted": 0
-        }
-        mock_refresh_mcp.return_value = {"status": "refreshed"}
-        headers_template = {
-            "Authorization": "Bearer {{token}}",
-            "X-Tenant-ID": "{{tenant_id}}"
-        }
-
-        response = client.post(
-            "/tool/openapi_service",
-            json={
-                "service_name": "test_service",
-                "server_url": "https://api.example.com",
-                "openapi_json": {"openapi": "3.0.0", "info": {"title": "Test"}, "paths": {}},
-                "service_description": "Test API",
-                "headers_template": headers_template,
-                "force_update": False
-            }
-        )
-
-        assert response.status_code == HTTPStatus.OK
-        data = response.json()
-        assert data["status"] == "success"
-        assert data["message"] == "OpenAPI service import successful"
-        assert data["data"]["tools_created"] == 1
-        assert data["data"]["tools_updated"] == 0
-        assert data["data"]["tools_deleted"] == 0
-        assert data["data"]["mcp_refresh"]["status"] == "refreshed"
-
-        mock_get_user_id.assert_called_once_with(None)
-        mock_import_service.assert_called_once_with(
-            service_name="test_service",
-            openapi_json={"openapi": "3.0.0", "info": {"title": "Test"}, "paths": {}},
-            server_url="https://api.example.com",
-            tenant_id="tenant456",
-            user_id="user123",
-            service_description="Test API",
-            headers_template=headers_template,
             force_update=False
         )
         mock_refresh_mcp.assert_called_once_with("tenant456")
diff --git a/test/backend/app/test_user_management_app.py b/test/backend/app/test_user_management_app.py
index f5875aca4..fd2f08ddd 100644
--- a/test/backend/app/test_user_management_app.py
+++ b/test/backend/app/test_user_management_app.py
@@ -520,69 +520,6 @@ def test_logout_signout_error_ignored(self, mock_get_client):
         mock_get_client.assert_called_once_with("Bearer token")
         mock_client.auth.sign_out.assert_called_once()
 
-    @patch('database.cas_session_db.revoke_cas_session_by_session_id')
-    @patch('apps.user_management_app.build_logout_url')
-    @patch('apps.user_management_app.extract_session_id_from_authorization')
-    @patch('apps.user_management_app.get_authorized_client')
-    def test_logout_returns_cas_logout_url_for_cas_session(
-        self,
-        mock_get_client,
-        mock_extract_session_id,
-        mock_build_logout_url,
-        mock_revoke_cas_session,
-    ):
-        """Test logout returns CAS logout URL when the JWT carries a CAS session id."""
-        mock_client = MagicMock()
-        mock_get_client.return_value = mock_client
-        mock_extract_session_id.return_value = "sid-1"
-        mock_build_logout_url.return_value = (
-            "https://cas.example.com/cas/logout?service=https%3A%2F%2Fcas.example.com%2Fcas%2Flogin"
-        )
-
-        response = client.post(
-            "/user/logout",
-            headers={"Authorization": "Bearer token"}
-        )
-
-        assert response.status_code == HTTPStatus.OK
-        data = response.json()
-        assert (
-            data["data"]["cas_logout_url"]
-            == "https://cas.example.com/cas/logout?service=https%3A%2F%2Fcas.example.com%2Fcas%2Flogin"
-        )
-        mock_revoke_cas_session.assert_called_once_with("sid-1", actor="user")
-        mock_build_logout_url.assert_called_once_with()
-        mock_client.auth.sign_out.assert_called_once()
-
-    @patch('database.cas_session_db.revoke_cas_session_by_session_id')
-    @patch('apps.user_management_app.build_logout_url')
-    @patch('apps.user_management_app.extract_session_id_from_authorization')
-    @patch('apps.user_management_app.get_authorized_client')
-    def test_logout_does_not_return_cas_logout_url_when_not_configured(
-        self,
-        mock_get_client,
-        mock_extract_session_id,
-        mock_build_logout_url,
-        mock_revoke_cas_session,
-    ):
-        """Test logout skips CAS server logout redirect when CAS_LOGOUT_URL is empty."""
-        mock_client = MagicMock()
-        mock_get_client.return_value = mock_client
-        mock_extract_session_id.return_value = "sid-1"
-        mock_build_logout_url.return_value = ""
-
-        response = client.post(
-            "/user/logout",
-            headers={"Authorization": "Bearer token"}
-        )
-
-        assert response.status_code == HTTPStatus.OK
-        data = response.json()
-        assert data["data"]["cas_logout_url"] == ""
-        mock_revoke_cas_session.assert_called_once_with("sid-1", actor="user")
-        mock_build_logout_url.assert_called_once_with()
-        mock_client.auth.sign_out.assert_called_once()
-
     @patch('apps.user_management_app.get_authorized_client')
     def test_logout_error(self, mock_get_client):
         """Test logout with error"""
@@ -770,47 +707,11 @@ def test_current_user_info_success(self, mock_get_user_info, mock_validate_token
         assert data["data"]["user"]["tenant_id"] == "tenant456"
         assert data["data"]["user"]["user_email"] == "test@example.com"
         assert data["data"]["user"]["user_role"] == "USER"
-        assert data["data"]["user"]["auth_provider"] == "local"
         assert data["data"]["user"]["permissions"] == [
             "agent:create", "agent:read"]
         assert data["data"]["user"]["accessibleRoutes"] == ["chat", "agents"]
         mock_get_user_info.assert_called_once_with("user123")
 
-    @patch('apps.user_management_app.extract_session_id_from_authorization')
-    @patch('apps.user_management_app.validate_token')
-    @patch('apps.user_management_app.get_user_info', new_callable=AsyncMock)
-    def test_current_user_info_marks_cas_user(
-        self,
-        mock_get_user_info,
-        mock_validate_token,
-        mock_extract_session_id,
-    ):
-        """Test CAS-authenticated current user info includes auth provider"""
-        mock_user = MockUser("user123", "test@example.com")
-        mock_validate_token.return_value = (True, mock_user)
-        mock_extract_session_id.return_value = "cas-session-123"
-        mock_get_user_info.return_value = {
-            "user": {
-                "user_id": "user123",
-                "group_ids": [1],
-                "tenant_id": "tenant456",
-                "user_email": "test@example.com",
-                "user_role": "USER",
-                "permissions": ["agent:read"],
-                "accessibleRoutes": ["chat"]
-            }
-        }
-
-        response = client.get(
-            "/user/current_user_info",
-            headers={"Authorization": "Bearer cas-token"}
-        )
-
-        assert response.status_code == HTTPStatus.OK
-        data = response.json()
-        assert data["data"]["user"]["auth_provider"] == "cas"
-        mock_extract_session_id.assert_called_once_with("Bearer cas-token")
-
     def test_current_user_info_no_authorization(self):
         """Test current user info retrieval without authorization header"""
         response = client.get("/user/current_user_info")
diff --git a/test/backend/app/test_vectordatabase_app.py b/test/backend/app/test_vectordatabase_app.py
index cd684512f..c4820d177 100644
--- a/test/backend/app/test_vectordatabase_app.py
+++ b/test/backend/app/test_vectordatabase_app.py
@@ -1624,23 +1624,20 @@ async def test_delete_documents_success(vdb_core_mock, redis_service_mock):
     # Setup mocks
     with patch("backend.apps.vectordatabase_app.get_vector_db_core", return_value=vdb_core_mock), \
             patch("backend.apps.vectordatabase_app.get_redis_service", return_value=redis_service_mock), \
-            patch(
-                "backend.apps.vectordatabase_app.ElasticSearchService.delete_document_by_scope",
-                new_callable=AsyncMock,
-            ) as mock_delete_by_scope:
+            patch("backend.apps.vectordatabase_app.ElasticSearchService.delete_documents") as mock_delete_docs:
 
         index_name = "test_index"
         path_or_url = "test_document.pdf"
 
+        # Setup the return value for delete_documents
         es_result = {
             "status": "success",
             "message": "Documents deleted successfully",
-            "scope": "full",
-            "deleted_es_count": 5,
-            "source_available": False,
+            "deleted_count": 5
         }
-        mock_delete_by_scope.return_value = es_result
+        mock_delete_docs.return_value = es_result
 
+        # Setup the mock for delete_document_records
         redis_result = {
             "index_name": index_name,
             "path_or_url": path_or_url,
@@ -1650,10 +1647,9 @@ async def test_delete_documents_success(vdb_core_mock, redis_service_mock):
         }
         redis_service_mock.delete_document_records.return_value = redis_result
 
+        # Execute request
         response = client.delete(
-            f"/indices/{index_name}/documents",
-            params={"path_or_url": path_or_url, "scope": "full"},
-        )
+            f"/indices/{index_name}/documents", params={"path_or_url": path_or_url})
 
         # Verify expected 200 status code
         assert response.status_code == 200
@@ -1672,46 +1668,13 @@ async def test_delete_documents_success(vdb_core_mock, redis_service_mock):
         assert "redis_cleanup" in actual_response
         assert actual_response["redis_cleanup"] == redis_result
 
-        mock_delete_by_scope.assert_called_once_with(
-            index_name, path_or_url, "full", ANY
-        )
+        # Verify delete_documents was called with the correct parameters
+        # Use ANY for the vdb_core parameter because the actual object may differ
+        mock_delete_docs.assert_called_once_with(index_name, path_or_url, ANY)
         redis_service_mock.delete_document_records.assert_called_once_with(
             index_name, path_or_url)
 
 
-@pytest.mark.asyncio
-async def test_delete_documents_source_only_skips_redis(vdb_core_mock, redis_service_mock):
-    """source_only scope must not trigger Redis document cleanup."""
-    with patch("backend.apps.vectordatabase_app.get_vector_db_core", return_value=vdb_core_mock), \
-            patch("backend.apps.vectordatabase_app.get_redis_service", return_value=redis_service_mock), \
-            patch(
-                "backend.apps.vectordatabase_app.ElasticSearchService.delete_document_by_scope",
-                new_callable=AsyncMock,
-            ) as mock_delete_by_scope:
-
-        index_name = "test_index"
-        path_or_url = "knowledge_base/test.pdf"
-        mock_delete_by_scope.return_value = {
-            "status": "success",
-            "scope": "source_only",
-            "deleted_es_count": 0,
-            "deleted_minio": True,
-            "source_available": False,
-        }
-
-        response = client.delete(
-            f"/indices/{index_name}/documents",
-            params={"path_or_url": path_or_url, "scope": "source_only"},
-        )
-
-        assert response.status_code == 200
-        assert response.json()["scope"] == "source_only"
-        mock_delete_by_scope.assert_called_once_with(
-            index_name, path_or_url, "source_only", ANY
-        )
-        redis_service_mock.delete_document_records.assert_not_called()
-
-
 @pytest.mark.asyncio
 async def test_delete_documents_redis_error(vdb_core_mock, redis_service_mock):
     """
@@ -1721,30 +1684,27 @@ async def test_delete_documents_redis_error(vdb_core_mock, redis_service_mock):
     # Setup mocks
     with patch("backend.apps.vectordatabase_app.get_vector_db_core", return_value=vdb_core_mock), \
             patch("backend.apps.vectordatabase_app.get_redis_service", return_value=redis_service_mock), \
-            patch(
-                "backend.apps.vectordatabase_app.ElasticSearchService.delete_document_by_scope",
-                new_callable=AsyncMock,
-            ) as mock_delete_by_scope:
+            patch("backend.apps.vectordatabase_app.ElasticSearchService.delete_documents") as mock_delete_docs:
 
         index_name = "test_index"
         path_or_url = "test_document.pdf"
 
+        # Setup the return value for delete_documents
         es_result = {
             "status": "success",
             "message": "Documents deleted successfully",
-            "scope": "full",
-            "deleted_es_count": 5,
+            "deleted_count": 5
         }
-        mock_delete_by_scope.return_value = es_result
+        mock_delete_docs.return_value = es_result
 
+        # Setup redis error
         redis_error_message = "Redis connection failed"
         redis_service_mock.delete_document_records.side_effect = Exception(
             redis_error_message)
 
+        # Execute request
         response = client.delete(
-            f"/indices/{index_name}/documents",
-            params={"path_or_url": path_or_url, "scope": "full"},
-        )
+            f"/indices/{index_name}/documents", params={"path_or_url": path_or_url})
 
         # Verify expected 200 status code (the operation should still succeed even with Redis errors)
         assert response.status_code == 200
@@ -1762,9 +1722,9 @@ async def test_delete_documents_redis_error(vdb_core_mock, redis_service_mock):
         assert "redis_cleanup_error" in actual_response
         assert actual_response["redis_cleanup_error"] == redis_error_message
 
-        mock_delete_by_scope.assert_called_once_with(
-            index_name, path_or_url, "full", ANY
-        )
+        # Verify delete_documents was called
+        # Use ANY for the vdb_core parameter because the actual object may differ
+        mock_delete_docs.assert_called_once_with(index_name, path_or_url, ANY)
         redis_service_mock.delete_document_records.assert_called_once_with(
             index_name, path_or_url)
 
@@ -1777,28 +1737,29 @@ async def test_delete_documents_es_exception(vdb_core_mock):
     """
     # Setup mocks
     with patch("backend.apps.vectordatabase_app.get_vector_db_core", return_value=vdb_core_mock), \
-            patch(
-                "backend.apps.vectordatabase_app.ElasticSearchService.delete_document_by_scope",
-                new_callable=AsyncMock,
-            ) as mock_delete_by_scope:
+            patch("backend.apps.vectordatabase_app.ElasticSearchService.delete_documents") as mock_delete_docs:
 
         index_name = "test_index"
         path_or_url = "test_document.pdf"
 
-        mock_delete_by_scope.side_effect = Exception(
+        # Setup the mock to raise an exception
+        mock_delete_docs.side_effect = Exception(
             "Elasticsearch deletion failed")
 
+        # Execute request
         response = client.delete(
-            f"/indices/{index_name}/documents",
-            params={"path_or_url": path_or_url, "scope": "full"},
-        )
+            f"/indices/{index_name}/documents", params={"path_or_url": path_or_url})
 
+        # Verify expected 500 status code
         assert response.status_code == 500
+
+        # Verify error response
         expected_error_detail = "Error delete indexing documents: Elasticsearch deletion failed"
         assert response.json() == {"detail": expected_error_detail}
-        mock_delete_by_scope.assert_called_once_with(
-            index_name, path_or_url, "full", ANY
-        )
+
+        # Verify delete_documents was called
+        # Use ANY for the vdb_core parameter because the actual object may differ
+        mock_delete_docs.assert_called_once_with(index_name, path_or_url, ANY)
 
 
 @pytest.mark.asyncio
@@ -1810,22 +1771,20 @@ async def test_delete_documents_redis_warnings(vdb_core_mock, redis_service_mock
     # Setup mocks
     with patch("backend.apps.vectordatabase_app.get_vector_db_core", return_value=vdb_core_mock), \
             patch("backend.apps.vectordatabase_app.get_redis_service", return_value=redis_service_mock), \
-            patch(
-                "backend.apps.vectordatabase_app.ElasticSearchService.delete_document_by_scope",
-                new_callable=AsyncMock,
-            ) as mock_delete_by_scope:
+            patch("backend.apps.vectordatabase_app.ElasticSearchService.delete_documents") as mock_delete_docs:
 
         index_name = "test_index"
         path_or_url = "test_document.pdf"
 
+        # Setup the return value for delete_documents
         es_result = {
             "status": "success",
             "message": "Documents deleted successfully",
-            "scope": "full",
-            "deleted_es_count": 5,
+            "deleted_count": 5
         }
-        mock_delete_by_scope.return_value = es_result
+        mock_delete_docs.return_value = es_result
 
+        # Setup the mock for delete_document_records with warnings
         redis_result = {
             "index_name": index_name,
             "path_or_url": path_or_url,
@@ -1836,10 +1795,9 @@ async def test_delete_documents_redis_warnings(vdb_core_mock, redis_service_mock
         }
         redis_service_mock.delete_document_records.return_value = redis_result
 
+        # Execute request
         response = client.delete(
-            f"/indices/{index_name}/documents",
-            params={"path_or_url": path_or_url, "scope": "full"},
-        )
+            f"/indices/{index_name}/documents", params={"path_or_url": path_or_url})
 
         # Verify expected 200 status code
         assert response.status_code == 200
@@ -1858,9 +1816,9 @@ async def test_delete_documents_redis_warnings(vdb_core_mock, redis_service_mock
         assert actual_response["redis_warnings"] == [
             "Some cache keys could not be deleted"]
 
-        mock_delete_by_scope.assert_called_once_with(
-            index_name, path_or_url, "full", ANY
-        )
+        # Verify delete_documents was called
+        # Use ANY for the vdb_core parameter because the actual object may differ
+        mock_delete_docs.assert_called_once_with(index_name, path_or_url, ANY)
         redis_service_mock.delete_document_records.assert_called_once_with(
             index_name, path_or_url)
 
@@ -1873,27 +1831,29 @@ async def test_delete_documents_validation_exception(vdb_core_mock):
     """
     # Setup mocks
     with patch("backend.apps.vectordatabase_app.get_vector_db_core", return_value=vdb_core_mock), \
-            patch(
-                "backend.apps.vectordatabase_app.ElasticSearchService.delete_document_by_scope",
-                new_callable=AsyncMock,
-            ) as mock_delete_by_scope:
+            patch("backend.apps.vectordatabase_app.ElasticSearchService.delete_documents") as mock_delete_docs:
 
         index_name = "test_index"
         path_or_url = "test_document.pdf"
 
-        mock_delete_by_scope.side_effect = ValueError(
+        # Setup the mock to raise a validation exception
+        mock_delete_docs.side_effect = ValueError(
             "Invalid document path format")
 
+        # Execute request
         response = client.delete(
-            f"/indices/{index_name}/documents",
-            params={"path_or_url": path_or_url, "scope": "source_only"},
-        )
+            f"/indices/{index_name}/documents", params={"path_or_url": path_or_url})
 
-        assert response.status_code == 400
-        assert response.json() == {"detail": "Invalid document path format"}
-        mock_delete_by_scope.assert_called_once_with(
-            index_name, path_or_url, "source_only", ANY
-        )
+        # Verify expected 500 status code
+        assert response.status_code == 500
+
+        # Verify error response
+        expected_error_detail = "Error delete indexing documents: Invalid document path format"
+        assert response.json() == {"detail": expected_error_detail}
+
+        # Verify delete_documents was called
+        # Use ANY for the vdb_core parameter because the actual object may differ
+        mock_delete_docs.assert_called_once_with(index_name, path_or_url, ANY)
 
 
 @pytest.mark.asyncio
diff --git a/test/backend/data_process/test_tasks.py b/test/backend/data_process/test_tasks.py
index cc7eadfcb..379989581 100644
--- a/test/backend/data_process/test_tasks.py
+++ b/test/backend/data_process/test_tasks.py
@@ -51,26 +51,24 @@ def import_tasks_with_fake_ray(monkeypatch, initialized=False):
         backends_base_mod = types.ModuleType("celery.backends.base")
         backends_base_mod.DisabledBackend = type("DisabledBackend", (), {})
         sys.modules["celery.backends.base"] = backends_base_mod
-
+    
     if "celery.exceptions" not in sys.modules:
         exceptions_mod = types.ModuleType("celery.exceptions")
         exceptions_mod.Retry = type("Retry", (Exception,), {})
         sys.modules["celery.exceptions"] = exceptions_mod
-
+    
     if "celery.result" not in sys.modules:
         result_mod = types.ModuleType("celery.result")
         result_mod.AsyncResult = type("AsyncResult", (), {})
-
         @contextmanager
         def _allow_join_result():
             yield
         result_mod.allow_join_result = _allow_join_result
         sys.modules["celery.result"] = result_mod
-
+    
     if "celery.signals" not in sys.modules:
         signals_mod = types.ModuleType("celery.signals")
         # Create fake signal objects with connect method
-
         class FakeSignal:
             def connect(self, func):
                 return func
@@ -82,34 +80,32 @@ def connect(self, func):
         signals_mod.task_postrun = FakeSignal()
         signals_mod.task_failure = FakeSignal()
         sys.modules["celery.signals"] = signals_mod
-
+    
     if "celery" not in sys.modules:
         celery_mod = types.ModuleType("celery")
         # Create a Celery class that accepts any arguments and has required attributes
-
         class FakeBackend:
             pass
-
+        
         class FakeCelery:
             def __init__(self, *args, **kwargs):
                 # Set backend to a non-DisabledBackend instance
                 self.backend = FakeBackend()
                 # Create a conf object with update method
                 self.conf = types.SimpleNamespace(update=lambda **kwargs: None)
-
+            
             def task(self, *args, **kwargs):
                 # Return a decorator that returns the function unchanged
                 def decorator(func):
                     return func
                 return decorator
-
+        
         # Stub classes and functions needed by tasks.py
         celery_mod.Celery = FakeCelery
         celery_mod.Task = type("Task", (), {})
         celery_mod.chain = lambda *args: None
         celery_mod.group = lambda *args, **kwargs: []
-        celery_mod.chord = lambda *args, **kwargs: (lambda callback: types.SimpleNamespace(
-            get=lambda: {"success": True, "total_indexed": 0, "total_submitted": 0}))
+        celery_mod.chord = lambda *args, **kwargs: (lambda callback: types.SimpleNamespace(get=lambda: {"success": True, "total_indexed": 0, "total_submitted": 0}))
         celery_mod.states = types.SimpleNamespace(
             PENDING="PENDING",
             STARTED="STARTED",
@@ -119,7 +115,7 @@ def decorator(func):
             REVOKED="REVOKED"
         )
         sys.modules["celery"] = celery_mod
-
+    
     # Stub modules that ray_actors depends on to avoid importing real MinIO
     # Also stub consts package and consts.const module to provide required constants at import time
     if "consts" not in sys.modules:
@@ -167,14 +163,9 @@ def __init__(self, chunking_strategy: str, source_type: str, index_name: str, au
         sys.modules["database.attachment_db"] = types.SimpleNamespace(
             get_file_stream=lambda source: io.BytesIO(b"stub-bytes"),
             get_file_size_from_minio=lambda object_name, bucket=None: 0,
-            # NOSONAR
-            build_s3_url=lambda bucket_name, object_name: f"http://mock-s3/{bucket_name}/{object_name}",
+            build_s3_url=lambda bucket_name, object_name: f"http://mock-s3/{bucket_name}/{object_name}",  # NOSONAR
             upload_fileobj=lambda file_obj, bucket_name, object_name: "mock-etag",
         )
-    if "database.knowledge_db" not in sys.modules:
-        sys.modules["database.knowledge_db"] = types.SimpleNamespace(
-            get_knowledge_record=lambda query=None: {},
-        )
     # Stub model_management_db module required by ray_actors
     if "database.model_management_db" not in sys.modules:
         sys.modules["database.model_management_db"] = types.SimpleNamespace(
@@ -189,8 +180,6 @@ def __init__(self, chunking_strategy: str, source_type: str, index_name: str, au
             sys.modules["database.attachment_db"])
     setattr(sys.modules["database"], "model_management_db",
             sys.modules["database.model_management_db"])
-    setattr(sys.modules["database"], "knowledge_db",
-            sys.modules["database.knowledge_db"])
 
     # Stub out auth and config utils to avoid importing real dependencies in file_management_utils
     if "utils.auth_utils" not in sys.modules:
@@ -206,10 +195,9 @@ def __init__(self, chunking_strategy: str, source_type: str, index_name: str, au
         sys.modules["utils.config_utils"] = cfg_mod
     if "nexent.data_process" not in sys.modules:
         sys.modules["nexent.data_process"] = types.SimpleNamespace(
-            DataProcessCore=type(
-                "_Core", (), {"__init__": lambda self: None, "file_process": lambda *a, **k: []})
+            DataProcessCore=type("_Core", (), {"__init__": lambda self: None, "file_process": lambda *a, **k: []})
         )
-
+    
     # Stub external dependencies (required by utils.file_management_utils)
     if "aiofiles" not in sys.modules:
         sys.modules["aiofiles"] = types.SimpleNamespace(
@@ -224,21 +212,7 @@ def __init__(self, chunking_strategy: str, source_type: str, index_name: str, au
     if "httpx" not in sys.modules:
         sys.modules["httpx"] = types.SimpleNamespace()
     if "requests" not in sys.modules:
-        class _FakeResponse:
-            def __init__(self, status_code=200, json_data=None, text=""):
-                self.status_code = status_code
-                self._json_data = json_data
-                self.text = text
-
-            def json(self):
-                if self._json_data is None:
-                    raise ValueError("no json")
-                return self._json_data
-
-        sys.modules["requests"] = types.SimpleNamespace(
-            delete=lambda *a, **k: _FakeResponse(status_code=200, json_data={
-                                                 "status": "success"}, text=""),
-        )
+        sys.modules["requests"] = types.SimpleNamespace()
     if "redis" not in sys.modules:
         sys.modules["redis"] = types.SimpleNamespace(
             Redis=types.SimpleNamespace(
@@ -254,7 +228,7 @@ def json(self):
         fastapi_mod = types.ModuleType("fastapi")
         fastapi_mod.UploadFile = type("UploadFile", (), {})
         sys.modules["fastapi"] = fastapi_mod
-
+    
     # Stub utils.file_management_utils (required by tasks.py)
     if "utils.file_management_utils" not in sys.modules:
         file_utils_mod = types.ModuleType("utils.file_management_utils")
@@ -268,31 +242,26 @@ def json(self):
         class _StubRedisService:
             def save_error_info(self, *args, **kwargs):
                 return True
-
             def is_task_cancelled(self, *args, **kwargs):
                 return False
-
             def save_progress_info(self, *args, **kwargs):
                 return True
-
             def increment_progress_info(self, *args, **kwargs):
                 return True
 
         redis_service_mod.get_redis_service = lambda: _StubRedisService()
         sys.modules["services.redis_service"] = redis_service_mod
-
+    
     # Stub aiohttp (required by tasks.py)
     if "aiohttp" not in sys.modules:
         sys.modules["aiohttp"] = types.SimpleNamespace()
-
+    
     import backend.data_process.tasks as tasks
     importlib.reload(tasks)
     # Provide a Celery task shim that allows direct calls and supports .s for chaining
-
     class _SignatureShim:
         def __init__(self):
             pass
-
         def set(self, **_kw):
             return self
 
@@ -300,12 +269,10 @@ class _CeleryTaskShim:
         def __init__(self, run_func, preprocess=None):
             self._run_func = run_func
             self._preprocess = preprocess
-
         def __call__(self, *args, **kwargs):
             if self._preprocess is not None:
                 args, kwargs = self._preprocess(args, kwargs)
             return self._run_func(*args, **kwargs)
-
         def s(self, **_kw):
             return _SignatureShim()
 
@@ -329,19 +296,15 @@ def _unbound_run(task_obj):
     default_actor = types.SimpleNamespace(
         ping=types.SimpleNamespace(remote=lambda *a, **k: "pong"),
         split_file=types.SimpleNamespace(remote=lambda *a, **k: []),
-        process_bytes=types.SimpleNamespace(
-            remote=lambda *a, **k: "ref-bytes"),
+        process_bytes=types.SimpleNamespace(remote=lambda *a, **k: "ref-bytes"),
         process_file=types.SimpleNamespace(remote=lambda *a, **k: "ref"),
-        store_chunks_in_redis=types.SimpleNamespace(
-            remote=lambda *a, **k: None),
+        store_chunks_in_redis=types.SimpleNamespace(remote=lambda *a, **k: None),
     )
     if not hasattr(tasks, "DataProcessorRayActor") or not hasattr(getattr(tasks, "DataProcessorRayActor"), "remote"):
-        tasks.DataProcessorRayActor = types.SimpleNamespace(
-            remote=lambda: default_actor)
+        tasks.DataProcessorRayActor = types.SimpleNamespace(remote=lambda: default_actor)
     # Keep split path stable across tests even when get_ray_actor is monkeypatched.
     tasks._get_split_actor = lambda: types.SimpleNamespace(
-        split_file=types.SimpleNamespace(
-            remote=lambda *a, **k: "__split_parts__")
+        split_file=types.SimpleNamespace(remote=lambda *a, **k: "__split_parts__")
     )
 
     # Preprocess for forward: drop empty/whitespace-only chunks before calling real run
@@ -402,15 +365,11 @@ def _forward_preprocess(args, kwargs):
     maybe = _unbound_run(getattr(tasks, "aggregate_store_chunks", None))
     if maybe is not None:
         tasks.aggregate_store_chunks = _CeleryTaskShim(maybe)
-    maybe = _unbound_run(getattr(tasks, "cleanup_source", None))
-    if maybe is not None:
-        tasks.cleanup_source = _CeleryTaskShim(maybe)
     return tasks, fake_ray
 
 
 def test_init_ray_in_worker_initializes_once(monkeypatch):
-    tasks, fake_ray = import_tasks_with_fake_ray(
-        monkeypatch, initialized=False)
+    tasks, fake_ray = import_tasks_with_fake_ray(monkeypatch, initialized=False)
     # First call initializes
     tasks.init_ray_in_worker()
     assert fake_ray.inits and fake_ray.inits[-1]["configure_logging"] is False
@@ -424,11 +383,10 @@ def test_init_ray_in_worker_initializes_once(monkeypatch):
 
 def test_init_ray_in_worker_respects_disable_dashboard_setting(monkeypatch):
     """Test that init_ray_in_worker respects DISABLE_RAY_DASHBOARD setting"""
-    tasks, fake_ray = import_tasks_with_fake_ray(
-        monkeypatch, initialized=False)
+    tasks, fake_ray = import_tasks_with_fake_ray(monkeypatch, initialized=False)
     # Patch DISABLE_RAY_DASHBOARD in tasks module to True
     monkeypatch.setattr(tasks, "DISABLE_RAY_DASHBOARD", True)
-
+    
     # First call initializes with include_dashboard=False
     tasks.init_ray_in_worker()
     assert fake_ray.inits and fake_ray.inits[-1]["configure_logging"] is False
@@ -439,16 +397,14 @@ def test_init_ray_in_worker_respects_disable_dashboard_setting(monkeypatch):
 
 def test_init_ray_in_worker_raises_on_init_failure(monkeypatch):
     """Test that init_ray_in_worker logs error and re-raises exception when ray.init() fails"""
-    tasks, fake_ray = import_tasks_with_fake_ray(
-        monkeypatch, initialized=False)
-
+    tasks, fake_ray = import_tasks_with_fake_ray(monkeypatch, initialized=False)
+    
     # Make ray.init() raise an exception
     init_exception = RuntimeError("Ray initialization failed")
-
     def failing_init(**kwargs):
         raise init_exception
     fake_ray.init = failing_init
-
+    
     # Verify that the exception is re-raised
     with pytest.raises(RuntimeError) as exc_info:
         tasks.init_ray_in_worker()
@@ -462,8 +418,7 @@ async def sample():
         return 42
 
     # Force RuntimeError in get_running_loop to trigger asyncio.run path
-    monkeypatch.setattr(asyncio, "get_running_loop", lambda: (
-        _ for _ in ()).throw(RuntimeError("no loop")))
+    monkeypatch.setattr(asyncio, "get_running_loop", lambda: (_ for _ in ()).throw(RuntimeError("no loop")))
     result = tasks.run_async(sample())
     assert result == 42
 
@@ -487,17 +442,14 @@ def run_until_complete(self, coro):
 def test_get_ray_actor_returns_actor(monkeypatch):
     tasks, fake_ray = import_tasks_with_fake_ray(monkeypatch, initialized=True)
 
-    actor_obj = types.SimpleNamespace(
-        ping=types.SimpleNamespace(remote=lambda *a, **k: "pong"))
+    actor_obj = types.SimpleNamespace(ping=types.SimpleNamespace(remote=lambda *a, **k: "pong"))
 
     class _ManagerHandle:
         def __init__(self, actor):
-            self.get_actor = types.SimpleNamespace(
-                remote=lambda: "__actor_ref__")
+            self.get_actor = types.SimpleNamespace(remote=lambda: "__actor_ref__")
             self._actor = actor
 
-    monkeypatch.setattr(
-        tasks, "_get_or_create_global_pool_manager", lambda: _ManagerHandle(actor_obj))
+    monkeypatch.setattr(tasks, "_get_or_create_global_pool_manager", lambda: _ManagerHandle(actor_obj))
     fake_ray.get_returns = {"__actor_ref__": actor_obj}
     actor = tasks.get_ray_actor()
     assert actor is actor_obj
@@ -531,13 +483,10 @@ class FakeActor:
         class P:
             def __init__(self, *a, **k):
                 self.args = (a, k)
-
         def __init__(self):
             self.calls = []
-            self.process_file = types.SimpleNamespace(
-                remote=lambda *a, **k: "ref1")
-            self.store_chunks_in_redis = types.SimpleNamespace(
-                remote=lambda *a, **k: None)
+            self.process_file = types.SimpleNamespace(remote=lambda *a, **k: "ref1")
+            self.store_chunks_in_redis = types.SimpleNamespace(remote=lambda *a, **k: None)
 
     monkeypatch.setattr(tasks, "get_ray_actor", lambda: FakeActor())
     # Mock ray.get to return chunks instead of reference
@@ -545,8 +494,7 @@ def __init__(self):
 
     self = FakeSelf("p1")
 
-    result = tasks.process(self, source=str(f), source_type="local",
-                           chunking_strategy="basic", index_name="idx", original_filename="a.txt")
+    result = tasks.process(self, source=str(f), source_type="local", chunking_strategy="basic", index_name="idx", original_filename="a.txt")
     assert result["redis_key"].startswith("dp:p1:chunks")
     # success state updated twice: STARTED and SUCCESS
     assert any(s.get("state") == tasks.states.SUCCESS for s in self.states)
@@ -564,18 +512,15 @@ def test_process_minio_path(monkeypatch):
 
     class FakeActor:
         def __init__(self):
-            self.process_file = types.SimpleNamespace(
-                remote=lambda *a, **k: "ref")
-            self.store_chunks_in_redis = types.SimpleNamespace(
-                remote=lambda *a, **k: None)
+            self.process_file = types.SimpleNamespace(remote=lambda *a, **k: "ref")
+            self.store_chunks_in_redis = types.SimpleNamespace(remote=lambda *a, **k: None)
 
     monkeypatch.setattr(tasks, "get_ray_actor", lambda: FakeActor())
     # Mock ray.get to return chunks
     fake_ray.get_returns = mock_chunks
 
     self = FakeSelf("m1")
-    result = tasks.process(self, source="http://minio/bucket/x",
-                           source_type="minio", chunking_strategy="basic")
+    result = tasks.process(self, source="http://minio/bucket/x", source_type="minio", chunking_strategy="basic")
     assert result["redis_key"].startswith("dp:m1:chunks")
     # Verify chunks_count is set
     success_state = [s for s in self.states if s.get(
@@ -1010,7 +955,7 @@ class DummyClientConnectorError(Exception):
     json.loads(str(ei.value))
 
 
-def test_submit_process_forward_chain_returns_empty_when_apply_async_none(monkeypatch):
+def test_process_and_forward_returns_empty_when_apply_async_none(monkeypatch):
     tasks, _ = import_tasks_with_fake_ray(monkeypatch)
 
     class FakeChain:
@@ -1018,25 +963,18 @@ def apply_async(self):
             return None
 
     monkeypatch.setattr(tasks, "chain", lambda *a, **k: FakeChain())
+    # process_and_forward looks up `process` and `forward` on the tasks module at
+    # runtime, so both names must be bound on the module object before it is called.
     import backend.data_process.tasks as tasks_module
+    # import_tasks_with_fake_ray should already have shimmed process and forward;
+    # rebind them explicitly so they are definitely present in the module namespace.
     tasks_module.process = tasks.process
     tasks_module.forward = tasks.forward
-    tasks_module.cleanup_source = tasks.cleanup_source
-    out = tasks.submit_process_forward_chain(
-        source="/a.txt", source_type="local", chunking_strategy="basic", index_name="idx")
-    assert out == ""
-
-
-def test_process_and_forward_returns_empty_when_apply_async_none(monkeypatch):
-    tasks, _ = import_tasks_with_fake_ray(monkeypatch)
-    monkeypatch.setattr(
-        tasks, "submit_process_forward_chain", lambda **kwargs: "")
     self = FakeSelf("chain_none")
     out = tasks.process_and_forward(
         self, source="/a.txt", source_type="local", chunking_strategy="basic", index_name="idx")
     assert out == ""
 
-
 def test_process_unsupported_source_type(monkeypatch):
     tasks, _ = import_tasks_with_fake_ray(monkeypatch, initialized=True)
     self = FakeSelf("e2")
@@ -1053,16 +991,14 @@ def test_forward_with_chunks_success(monkeypatch):
     monkeypatch.setattr(tasks, "get_file_size", lambda *a, **k: 123)
 
     # run_async should return a successful response matching formatted chunk count (1)
-    monkeypatch.setattr(tasks, "run_async", lambda coro: {
-                        "success": True, "total_indexed": 1, "total_submitted": 1, "message": "ok"})
+    monkeypatch.setattr(tasks, "run_async", lambda coro: {"success": True, "total_indexed": 1, "total_submitted": 1, "message": "ok"})
 
     self = FakeSelf("f1")
     chunks = [
         {"content": "text", "metadata": {"creation_date": "2024-01-01"}},
         {"content": "", "metadata": {}},
     ]
-    result = tasks.forward(self, processed_data={
-                           "chunks": chunks}, index_name="idx", source="/a.txt", source_type="local", original_filename="a.txt")
+    result = tasks.forward(self, processed_data={"chunks": chunks}, index_name="idx", source="/a.txt", source_type="local", original_filename="a.txt")
     assert result["chunks_stored"] == 1
 
 
@@ -1070,12 +1006,10 @@ def test_forward_partial_success_raises(monkeypatch):
     tasks, _ = import_tasks_with_fake_ray(monkeypatch)
     monkeypatch.setattr(tasks, "ELASTICSEARCH_SERVICE", "http://api")
     monkeypatch.setattr(tasks, "get_file_size", lambda *a, **k: 0)
-    monkeypatch.setattr(tasks, "run_async", lambda coro: {
-                        "success": True, "total_indexed": 0, "total_submitted": 1, "message": "partial"})
+    monkeypatch.setattr(tasks, "run_async", lambda coro: {"success": True, "total_indexed": 0, "total_submitted": 1, "message": "partial"})
     self = FakeSelf("f2")
     with pytest.raises(Exception) as ei:
-        tasks.forward(self, processed_data={"chunks": [{"content": "x", "metadata": {
-        }}]}, index_name="idx", source="/a.txt", source_type="local")
+        tasks.forward(self, processed_data={"chunks": [{"content": "x", "metadata": {}}]}, index_name="idx", source="/a.txt", source_type="local")
     json.loads(str(ei.value))
 
 
@@ -1083,8 +1017,7 @@ def test_forward_no_chunks_and_no_redis_key_raises(monkeypatch):
     tasks, _ = import_tasks_with_fake_ray(monkeypatch)
     self = FakeSelf("f3")
     with pytest.raises(Exception) as ei:
-        tasks.forward(self, processed_data={},
-                      index_name="idx", source="/a.txt")
+        tasks.forward(self, processed_data={}, index_name="idx", source="/a.txt")
     json.loads(str(ei.value))
 
 
@@ -1092,8 +1025,7 @@ def test_forward_formats_to_empty_then_raises(monkeypatch):
     tasks, _ = import_tasks_with_fake_ray(monkeypatch)
     self = FakeSelf("f4")
     with pytest.raises(Exception) as ei:
-        tasks.forward(self, processed_data={"chunks": [
-                      {"content": "  ", "metadata": {}}]}, index_name="idx", source="/a.txt")
+        tasks.forward(self, processed_data={"chunks": [{"content": "  ", "metadata": {}}]}, index_name="idx", source="/a.txt")
     json.loads(str(ei.value))
 
 
@@ -1103,8 +1035,7 @@ def test_forward_missing_es_env_raises(monkeypatch):
     monkeypatch.setattr(tasks, "get_file_size", lambda *a, **k: 0)
     self = FakeSelf("f5")
     with pytest.raises(Exception) as ei:
-        tasks.forward(self, processed_data={"chunks": [
-                      {"content": "x", "metadata": {}}]}, index_name="idx", source="/a.txt")
+        tasks.forward(self, processed_data={"chunks": [{"content": "x", "metadata": {}}]}, index_name="idx", source="/a.txt")
     json.loads(str(ei.value))
 
 
@@ -1116,27 +1047,22 @@ def test_forward_loads_chunks_from_redis(monkeypatch):
 
     class FakeRedisClient:
         def __init__(self):
-            self.kv = {"dp:rid:chunks": json.dumps(
-                [{"content": "x", "metadata": {}}])}
-
+            self.kv = {"dp:rid:chunks": json.dumps([{"content": "x", "metadata": {}}])}
         def get(self, k):
             return self.kv.get(k)
 
-    fake_redis_mod = types.SimpleNamespace(Redis=types.SimpleNamespace(
-        from_url=lambda url, decode_responses=True: FakeRedisClient()))
+    fake_redis_mod = types.SimpleNamespace(Redis=types.SimpleNamespace(from_url=lambda url, decode_responses=True: FakeRedisClient()))
     monkeypatch.setitem(sys.modules, "redis", fake_redis_mod)
 
     # run_async returns success for 1 chunk
-    monkeypatch.setattr(tasks, "run_async", lambda coro: {
-                        "success": True, "total_indexed": 1, "total_submitted": 1, "message": "ok"})
+    monkeypatch.setattr(tasks, "run_async", lambda coro: {"success": True, "total_indexed": 1, "total_submitted": 1, "message": "ok"})
 
     self = FakeSelf("f6")
-    result = tasks.forward(self, processed_data={
-                           "redis_key": "dp:rid:chunks"}, index_name="idx", source="/a.txt")
+    result = tasks.forward(self, processed_data={"redis_key": "dp:rid:chunks"}, index_name="idx", source="/a.txt")
     assert result["chunks_stored"] == 1
 
 
-def test_submit_process_forward_chain_returns_chain_id(monkeypatch):
+def test_process_and_forward_returns_chain_id(monkeypatch):
     tasks, _ = import_tasks_with_fake_ray(monkeypatch)
 
     class FakeResult:
@@ -1148,24 +1074,8 @@ def apply_async(self):
             return FakeResult("123")
 
     monkeypatch.setattr(tasks, "chain", lambda *a, **k: FakeChain())
-    import backend.data_process.tasks as tasks_module
-    tasks_module.process = tasks.process
-    tasks_module.forward = tasks.forward
-    tasks_module.cleanup_source = tasks.cleanup_source
-    chain_id = tasks.submit_process_forward_chain(
-        source="/a.txt", source_type="local", chunking_strategy="basic", index_name="idx")
-    assert chain_id == "123"
-
-
-def test_process_and_forward_returns_chain_id(monkeypatch):
-    tasks, _ = import_tasks_with_fake_ray(monkeypatch)
-    monkeypatch.setattr(
-        tasks, "submit_process_forward_chain",
-        lambda **kwargs: "123",
-    )
     self = FakeSelf("c1")
-    chain_id = tasks.process_and_forward(
-        self, source="/a.txt", source_type="local", chunking_strategy="basic", index_name="idx")
+    chain_id = tasks.process_and_forward(self, source="/a.txt", source_type="local", chunking_strategy="basic", index_name="idx")
     assert chain_id == "123"
 
 
@@ -1215,8 +1125,7 @@ def save_error_info(self, tid, reason):
         "backend.data_process.tasks.logger.info", lambda msg: infos.append(msg)
     )
     monkeypatch.setattr(
-        "backend.data_process.tasks.logger.error", lambda *a, **k: warnings.append(
-            a[0])
+        "backend.data_process.tasks.logger.error", lambda *a, **k: warnings.append(a[0])
     )
 
     # empty task_id
@@ -1287,8 +1196,7 @@ def test_process_error_fallback_when_save_error_raises(monkeypatch, tmp_path):
 
     # State should still be updated in fallback branch
     assert any(
-        s.get("meta", {}).get("stage") in {
-            "text_extraction_failed", "extracting_text"}
+        s.get("meta", {}).get("stage") in {"text_extraction_failed", "extracting_text"}
         for s in self.states
     ) or self.states == []
 
@@ -1303,8 +1211,7 @@ def test_process_error_truncates_reason_when_no_error_code(monkeypatch, tmp_path
     # Provide actor but make ray.get raise inside the try block
     class FakeActor:
         def __init__(self):
-            self.process_file = types.SimpleNamespace(
-                remote=lambda *a, **k: "ref_err")
+            self.process_file = types.SimpleNamespace(remote=lambda *a, **k: "ref_err")
             self.store_chunks_in_redis = types.SimpleNamespace(
                 remote=lambda *a, **k: None)
 
@@ -1351,15 +1258,13 @@ def test_forward_cancel_check_warning_then_continue(monkeypatch):
     monkeypatch.setattr(tasks, "ELASTICSEARCH_SERVICE", "http://api")
 
     # make cancellation check raise to hit warning path
-    monkeypatch.setattr(tasks, "get_redis_service", lambda: (
-        _ for _ in ()).throw(RuntimeError("boom")))
+    monkeypatch.setattr(tasks, "get_redis_service", lambda: (_ for _ in ()).throw(RuntimeError("boom")))
 
     # run index_documents normally via stubbed run_async returning success
     monkeypatch.setattr(
         tasks,
         "run_async",
-        lambda coro: {"success": True, "total_indexed": 1,
-                      "total_submitted": 1, "message": "ok"},
+        lambda coro: {"success": True, "total_indexed": 1, "total_submitted": 1, "message": "ok"},
     )
 
     self = FakeSelf("warn-cancel")
@@ -1558,8 +1463,7 @@ def post(self, *a, **k):
             index_name="idx",
             source="/a.txt",
         )
-    assert "Failed to connect to API" in str(
-        exc.value) or "timeout" in str(exc.value).lower()
+    assert "Failed to connect to API" in str(exc.value) or "timeout" in str(exc.value).lower()
 
 
 def test_forward_truncates_reason_when_no_error_code(monkeypatch):
@@ -1570,14 +1474,12 @@ def test_forward_truncates_reason_when_no_error_code(monkeypatch):
 
     long_msg = json.dumps({"message": "m" * 250})
     monkeypatch.setattr(
-        tasks, "run_async", lambda coro: (
-            _ for _ in ()).throw(Exception(long_msg))
+        tasks, "run_async", lambda coro: (_ for _ in ()).throw(Exception(long_msg))
     )
 
     reasons: list[str] = []
     monkeypatch.setattr(
-        tasks, "save_error_to_redis", lambda tid, reason, st: reasons.append(
-            reason)
+        tasks, "save_error_to_redis", lambda tid, reason, st: reasons.append(reason)
     )
 
     self = FakeSelf("f-trunc")
@@ -1603,14 +1505,12 @@ def test_forward_fallback_truncates_on_non_json_error(monkeypatch):
     monkeypatch.setattr(tasks, "extract_error_code", lambda *a, **k: None)
 
     monkeypatch.setattr(
-        tasks, "run_async", lambda coro: (
-            _ for _ in ()).throw(Exception("n" * 250))
+        tasks, "run_async", lambda coro: (_ for _ in ()).throw(Exception("n" * 250))
     )
 
     reasons: list[str] = []
     monkeypatch.setattr(
-        tasks, "save_error_to_redis", lambda tid, reason, st: reasons.append(
-            reason)
+        tasks, "save_error_to_redis", lambda tid, reason, st: reasons.append(reason)
     )
 
     self = FakeSelf("f-fallback")
@@ -1634,13 +1534,11 @@ def test_forward_error_truncates_reason_and_uses_save(monkeypatch):
     long_message = "m" * 250
     monkeypatch.setattr(tasks, "ELASTICSEARCH_SERVICE", "http://api")
     monkeypatch.setattr(
-        tasks, "run_async", lambda coro: (_ for _ in ()).throw(
-            Exception(json.dumps({"message": long_message})))
+        tasks, "run_async", lambda coro: (_ for _ in ()).throw(Exception(json.dumps({"message": long_message})))
     )
     captured = {}
     monkeypatch.setattr(
-        tasks, "save_error_to_redis", lambda tid, reason, st: captured.setdefault(
-            "reason", reason)
+        tasks, "save_error_to_redis", lambda tid, reason, st: captured.setdefault("reason", reason)
     )
 
     self = FakeSelf("trunc")
@@ -1659,13 +1557,11 @@ def test_forward_error_fallback_when_json_loads_fails(monkeypatch):
     tasks, _ = import_tasks_with_fake_ray(monkeypatch)
     monkeypatch.setattr(tasks, "ELASTICSEARCH_SERVICE", "http://api")
     monkeypatch.setattr(
-        tasks, "run_async", lambda coro: (
-            _ for _ in ()).throw(Exception("not-json-error"))
+        tasks, "run_async", lambda coro: (_ for _ in ()).throw(Exception("not-json-error"))
     )
     captured = {}
     monkeypatch.setattr(
-        tasks, "save_error_to_redis", lambda tid, reason, st: captured.setdefault(
-            "reason", reason)
+        tasks, "save_error_to_redis", lambda tid, reason, st: captured.setdefault("reason", reason)
     )
 
     self = FakeSelf("fallback-forward")
@@ -1688,8 +1584,7 @@ def test_process_sync_local_returns(monkeypatch):
 
     class FakeActor:
         def __init__(self):
-            self.process_file = types.SimpleNamespace(
-                remote=lambda *a, **k: "ref1")
+            self.process_file = types.SimpleNamespace(remote=lambda *a, **k: "ref1")
 
     monkeypatch.setattr(tasks, "get_ray_actor", lambda: FakeActor())
     fake_ray.get_returns = [{"content": "a"}, {"content": "b"}]
@@ -1719,16 +1614,13 @@ def test_build_balanced_batches_balances_image_chunks(monkeypatch):
         {"content": f"img-{i}", "process_source": tasks.IMAGE_METADATA_PROCESS_SOURCE}
         for i in range(6)
     ]
-    text_chunks = [{"content": f"txt-{i}",
-                    "process_source": "Unstructured"} for i in range(4)]
-    batches = tasks._build_balanced_batches(
-        image_chunks + text_chunks, batch_size=4)
+    text_chunks = [{"content": f"txt-{i}", "process_source": "Unstructured"} for i in range(4)]
+    batches = tasks._build_balanced_batches(image_chunks + text_chunks, batch_size=4)
 
     assert len(batches) == 3
     assert all(len(batch) <= 4 for batch in batches)
     image_counts = [
-        sum(1 for chunk in batch if chunk.get("process_source")
-            == tasks.IMAGE_METADATA_PROCESS_SOURCE)
+        sum(1 for chunk in batch if chunk.get("process_source") == tasks.IMAGE_METADATA_PROCESS_SOURCE)
         for batch in batches
     ]
     assert max(image_counts) - min(image_counts) <= 1
@@ -1753,7 +1645,6 @@ def test_forward_large_chunks_uses_chord_batches(monkeypatch):
     class _RedisSvc:
         def save_progress_info(self, *args, **kwargs):
             return True
-
         def is_task_cancelled(self, *args, **kwargs):
             return False
 
@@ -1762,15 +1653,12 @@ def is_task_cancelled(self, *args, **kwargs):
     class _Sig:
         def __init__(self, kwargs):
             self.kwargs = kwargs
-
         def set(self, **_kw):
             return self
 
     captured = {"group_sigs": None}
-    monkeypatch.setattr(tasks, "forward_part", types.SimpleNamespace(
-        s=lambda **kwargs: _Sig(kwargs)))
-    monkeypatch.setattr(tasks, "aggregate_forward_parts",
-                        types.SimpleNamespace(s=lambda **kwargs: _Sig(kwargs)))
+    monkeypatch.setattr(tasks, "forward_part", types.SimpleNamespace(s=lambda **kwargs: _Sig(kwargs)))
+    monkeypatch.setattr(tasks, "aggregate_forward_parts", types.SimpleNamespace(s=lambda **kwargs: _Sig(kwargs)))
 
     def _fake_group(sig_iter):
         sigs = list(sig_iter)
@@ -1779,11 +1667,9 @@ def _fake_group(sig_iter):
 
     def _fake_chord(group_tasks):
         def _runner(_callback):
-            total = sum(len(sig.kwargs.get("chunks", []))
-                        for sig in group_tasks)
+            total = sum(len(sig.kwargs.get("chunks", [])) for sig in group_tasks)
             return types.SimpleNamespace(
-                get=lambda: {"success": True, "total_indexed": total,
-                             "total_submitted": total, "message": "ok"}
+                get=lambda: {"success": True, "total_indexed": total, "total_submitted": total, "message": "ok"}
             )
         return _runner
 
@@ -1796,8 +1682,7 @@ def _fake_allow_join_result():
     monkeypatch.setattr(tasks, "allow_join_result", _fake_allow_join_result)
 
     self = FakeSelf("forward-batch")
-    large_chunks = [{"content": f"content-{i}", "metadata": {}}
-                    for i in range(70)]
+    large_chunks = [{"content": f"content-{i}", "metadata": {}} for i in range(70)]
     out = tasks.forward(
         self,
         processed_data={"chunks": large_chunks},
@@ -1810,8 +1695,7 @@ def _fake_allow_join_result():
     assert out["chunks_stored"] == 70
     assert captured["group_sigs"] is not None
     assert len(captured["group_sigs"]) == 2
-    assert all(sig.kwargs.get("large_mode")
-               is True for sig in captured["group_sigs"])
+    assert all(sig.kwargs.get("large_mode") is True for sig in captured["group_sigs"])
 
 
 def test_process_sync_unsupported_raises_and_updates_state(monkeypatch):
@@ -1819,15 +1703,13 @@ def test_process_sync_unsupported_raises_and_updates_state(monkeypatch):
     monkeypatch.setattr(
         tasks,
         "get_ray_actor",
-        lambda: types.SimpleNamespace(
-            process_file=types.SimpleNamespace(remote=lambda *a, **k: "ref")),
+        lambda: types.SimpleNamespace(process_file=types.SimpleNamespace(remote=lambda *a, **k: "ref")),
     )
     self = FakeSelf("s2")
     with pytest.raises(NotImplementedError):
         tasks.process_sync(self, source="/a.txt", source_type="minio")
     # check that failure meta was updated
-    assert any("sync_processing_failed" in s.get(
-        "meta", {}).get("stage", "") for s in self.states)
+    assert any("sync_processing_failed" in s.get("meta", {}).get("stage", "") for s in self.states)
 
 
 def test_forward_redis_key_requires_backend_url_raises(monkeypatch):
@@ -2049,8 +1931,7 @@ def get(self, key):
         Redis=types.SimpleNamespace(from_url=lambda *a, **k: FakeClient())
     )
     monkeypatch.setitem(sys.modules, "redis", fake_redis_mod)
-    assert tasks._wait_for_split_ready(
-        "dp:k", timeout_s=1, poll_interval_ms=1) == 2
+    assert tasks._wait_for_split_ready("dp:k", timeout_s=1, poll_interval_ms=1) == 2
 
     monkeypatch.setattr(tasks, "REDIS_BACKEND_URL", "")
     with pytest.raises(RuntimeError):
@@ -2069,8 +1950,7 @@ def get(self, key):
         Redis=types.SimpleNamespace(from_url=lambda *a, **k: ClientBadJson())
     )
     monkeypatch.setitem(sys.modules, "redis", fake_redis_mod)
-    assert tasks._wait_for_split_ready(
-        "dp:k", timeout_s=1, poll_interval_ms=1) == 0
+    assert tasks._wait_for_split_ready("dp:k", timeout_s=1, poll_interval_ms=1) == 0
 
     class ClientNeverReady:
         def get(self, key):
@@ -2079,8 +1959,7 @@ def get(self, key):
     monkeypatch.setitem(
         sys.modules,
         "redis",
-        types.SimpleNamespace(Redis=types.SimpleNamespace(
-            from_url=lambda *a, **k: ClientNeverReady())),
+        types.SimpleNamespace(Redis=types.SimpleNamespace(from_url=lambda *a, **k: ClientNeverReady())),
     )
     monkeypatch.setattr(tasks.time, "sleep", lambda _s: None)
     t = {"v": 0.0}
@@ -2109,8 +1988,7 @@ def test_estimate_parallel_parts_and_batch_helpers(monkeypatch):
 def test_extract_error_code_from_es_response_detail_string(monkeypatch):
     tasks, _ = import_tasks_with_fake_ray(monkeypatch)
     parsed = {"detail": "{\"error_code\":\"es_detail_code\"}"}
-    assert tasks._extract_error_code_from_es_response(
-        parsed, "x") == "es_detail_code"
+    assert tasks._extract_error_code_from_es_response(parsed, "x") == "es_detail_code"
 
 
 def test_run_async_loop_not_running_branch(monkeypatch):
@@ -2156,8 +2034,7 @@ class Actor:
         def __init__(self):
             self.ping = types.SimpleNamespace(remote=lambda: "pong")
 
-    monkeypatch.setattr(tasks, "DataProcessorRayActor",
-                        types.SimpleNamespace(remote=lambda: Actor()))
+    monkeypatch.setattr(tasks, "DataProcessorRayActor", types.SimpleNamespace(remote=lambda: Actor()))
     monkeypatch.setattr(tasks.ray, "get", lambda ref, timeout=None: True)
     manager = tasks.GlobalRayActorPoolManager(warm_timeout_s=1)
     assert manager.ensure_pool(desired=2, max_allowed=3) == 2
@@ -2171,10 +2048,8 @@ class Actor:
         def __init__(self):
             self.ping = types.SimpleNamespace(remote=lambda: "x")
 
-    monkeypatch.setattr(tasks, "DataProcessorRayActor",
-                        types.SimpleNamespace(remote=lambda: Actor()))
-    monkeypatch.setattr(tasks.ray, "get", lambda *a, **
-                        k: (_ for _ in ()).throw(RuntimeError("warm fail")))
+    monkeypatch.setattr(tasks, "DataProcessorRayActor", types.SimpleNamespace(remote=lambda: Actor()))
+    monkeypatch.setattr(tasks.ray, "get", lambda *a, **k: (_ for _ in ()).throw(RuntimeError("warm fail")))
     monkeypatch.setattr(tasks.ray, "kill", lambda *a, **k: None, raising=False)
     manager = tasks.GlobalRayActorPoolManager(warm_timeout_s=1)
     assert manager.ensure_pool(desired=1, max_allowed=1) == 0
@@ -2191,17 +2066,14 @@ def options(self, **_kw):
             raise TypeError("no get_if_exists")
 
     monkeypatch.setattr(tasks, "GlobalRayActorPoolManager", _Opts())
-    monkeypatch.setattr(tasks.ray, "get_actor", lambda *a,
-                        **k: "manager", raising=False)
+    monkeypatch.setattr(tasks.ray, "get_actor", lambda *a, **k: "manager", raising=False)
     assert tasks._get_or_create_global_pool_manager() == "manager"
 
 
 def test_prewarm_ray_actors(monkeypatch):
     tasks, fake_ray = import_tasks_with_fake_ray(monkeypatch)
-    manager = types.SimpleNamespace(
-        ensure_pool=types.SimpleNamespace(remote=lambda **k: "ref"))
-    monkeypatch.setattr(
-        tasks, "_get_or_create_global_pool_manager", lambda: manager)
+    manager = types.SimpleNamespace(ensure_pool=types.SimpleNamespace(remote=lambda **k: "ref"))
+    monkeypatch.setattr(tasks, "_get_or_create_global_pool_manager", lambda: manager)
     monkeypatch.setattr(tasks, "_estimate_parallel_parts", lambda: 4)
     monkeypatch.setattr(fake_ray, "get", lambda ref: 3)
     assert tasks.prewarm_ray_actors(target_size=3) == 3
@@ -2213,8 +2085,7 @@ def test_process_part_success_and_failure(monkeypatch):
 
     class Actor:
         def __init__(self):
-            self.process_bytes = types.SimpleNamespace(
-                remote=lambda *a, **k: "chunks-ref")
+            self.process_bytes = types.SimpleNamespace(remote=lambda *a, **k: "chunks-ref")
 
     monkeypatch.setattr(tasks, "get_ray_actor", lambda: Actor())
     fake_ray.get_returns = {"chunks-ref": [{"content": "x"}]}
@@ -2228,11 +2099,9 @@ def set(self, k, v):
         def expire(self, *a, **k):
             return True
 
-    monkeypatch.setitem(sys.modules, "redis", types.SimpleNamespace(
-        Redis=types.SimpleNamespace(from_url=lambda *a, **k: Client())))
+    monkeypatch.setitem(sys.modules, "redis", types.SimpleNamespace(Redis=types.SimpleNamespace(from_url=lambda *a, **k: Client())))
     out = tasks.process_part(
-        types.SimpleNamespace(request=types.SimpleNamespace(
-            id="p1"), retry=lambda **k: None),
+        types.SimpleNamespace(request=types.SimpleNamespace(id="p1"), retry=lambda **k: None),
         part_bytes=b"a", filename="a.txt", chunking_strategy="basic", part_redis_key="k1",
         source="s", source_type="local"
     )
@@ -2241,8 +2110,7 @@ def expire(self, *a, **k):
 
     monkeypatch.setattr(tasks, "REDIS_BACKEND_URL", "")
     out2 = tasks.process_part(
-        types.SimpleNamespace(request=types.SimpleNamespace(
-            id="p2"), retry=lambda **k: None),
+        types.SimpleNamespace(request=types.SimpleNamespace(id="p2"), retry=lambda **k: None),
         part_bytes=b"a", filename="a.txt", chunking_strategy="basic", part_redis_key="k2",
         source="s", source_type="local"
     )
@@ -2272,12 +2140,10 @@ def expire(self, *a, **k):
         def delete(self, k):
             kv.pop(k, None)
 
-    monkeypatch.setitem(sys.modules, "redis", types.SimpleNamespace(
-        Redis=types.SimpleNamespace(from_url=lambda *a, **k: Client())))
+    monkeypatch.setitem(sys.modules, "redis", types.SimpleNamespace(Redis=types.SimpleNamespace(from_url=lambda *a, **k: Client())))
     res = tasks.aggregate_store_chunks(
         self,
-        parts_results=[{"part_redis_key": "part1"},
-                       {"part_redis_key": "part2"}],
+        parts_results=[{"part_redis_key": "part1"}, {"part_redis_key": "part2"}],
         redis_key="maink",
         source="s",
         index_name="idx",
@@ -2292,8 +2158,7 @@ def test_forward_part_success_and_progress(monkeypatch):
     monkeypatch.setattr(
         tasks,
         "_send_chunks_to_es",
-        lambda **kwargs: {"success": True,
-                          "total_indexed": 2, "total_submitted": 2},
+        lambda **kwargs: {"success": True, "total_indexed": 2, "total_submitted": 2},
     )
     calls = {"inc": 0}
 
@@ -2308,8 +2173,7 @@ def increment_progress_info(self, **kwargs):
     monkeypatch.setattr(tasks, "get_redis_service", lambda: _Svc())
     self = types.SimpleNamespace(
         request=types.SimpleNamespace(id="fp1", retries=0),
-        retry=lambda **k: (_ for _ in ()
-                           ).throw(RuntimeError("should not retry")),
+        retry=lambda **k: (_ for _ in ()).throw(RuntimeError("should not retry")),
     )
     out = tasks.forward_part(
         self,
@@ -2326,16 +2190,14 @@ def increment_progress_info(self, **kwargs):
 
 def test_forward_part_failure_retries(monkeypatch):
     tasks, _ = import_tasks_with_fake_ray(monkeypatch)
-    monkeypatch.setattr(tasks, "_send_chunks_to_es", lambda **
-                        kwargs: {"success": False, "message": "bad"})
+    monkeypatch.setattr(tasks, "_send_chunks_to_es", lambda **kwargs: {"success": False, "message": "bad"})
     captured = {}
 
     def _retry(**kwargs):
         captured.update(kwargs)
         raise RuntimeError("retried")
 
-    self = types.SimpleNamespace(
-        request=types.SimpleNamespace(id="fp2", retries=1), retry=_retry)
+    self = types.SimpleNamespace(request=types.SimpleNamespace(id="fp2", retries=1), retry=_retry)
     with pytest.raises(RuntimeError, match="retried"):
         tasks.forward_part(
             self,
@@ -2369,14 +2231,11 @@ def test_run_processing_for_parts_single_and_multi(monkeypatch):
 
     class Actor:
         def __init__(self):
-            self.process_file = types.SimpleNamespace(
-                remote=lambda *a, **k: "ref-file")
-            self.process_bytes = types.SimpleNamespace(
-                remote=lambda *a, **k: "ref-bytes")
+            self.process_file = types.SimpleNamespace(remote=lambda *a, **k: "ref-file")
+            self.process_bytes = types.SimpleNamespace(remote=lambda *a, **k: "ref-bytes")
 
     monkeypatch.setattr(tasks, "get_ray_actor", lambda: Actor())
-    fake_ray.get_returns = {
-        "ref-bytes": [{"content": "c1"}], "ref-file": [{"content": "cf"}]}
+    fake_ray.get_returns = {"ref-bytes": [{"content": "c1"}], "ref-file": [{"content": "cf"}]}
 
     split_async, chunks, split_chunk_count = tasks._run_processing_for_parts(
         request_id="r1",
@@ -2397,13 +2256,10 @@ def __init__(self):
     assert split_chunk_count is None
 
     captured = {}
-    monkeypatch.setattr(tasks, "process_part", types.SimpleNamespace(
-        s=lambda **kwargs: types.SimpleNamespace(kwargs=kwargs)))
-    monkeypatch.setattr(tasks, "aggregate_store_chunks", types.SimpleNamespace(
-        s=lambda **kwargs: types.SimpleNamespace(set=lambda **kw: {"kwargs": kwargs, "set": kw})))
+    monkeypatch.setattr(tasks, "process_part", types.SimpleNamespace(s=lambda **kwargs: types.SimpleNamespace(kwargs=kwargs)))
+    monkeypatch.setattr(tasks, "aggregate_store_chunks", types.SimpleNamespace(s=lambda **kwargs: types.SimpleNamespace(set=lambda **kw: {"kwargs": kwargs, "set": kw})))
     monkeypatch.setattr(tasks, "group", lambda gen: list(gen))
-    monkeypatch.setattr(tasks, "chord", lambda group_tasks: (
-        lambda callback: captured.update({"group": group_tasks, "callback": callback})))
+    monkeypatch.setattr(tasks, "chord", lambda group_tasks: (lambda callback: captured.update({"group": group_tasks, "callback": callback})))
     monkeypatch.setattr(tasks, "_compute_split_wait_timeout", lambda n: 9)
     monkeypatch.setattr(tasks, "_estimate_parallel_parts", lambda: 2)
     monkeypatch.setattr(tasks, "_wait_for_split_ready", lambda **kwargs: 6)
@@ -2431,17 +2287,14 @@ def __init__(self):
 def test_process_split_async_redis_image_metadata_count(monkeypatch, tmp_path):
     tasks, _ = import_tasks_with_fake_ray(monkeypatch)
     monkeypatch.setattr(tasks, "REDIS_BACKEND_URL", "redis://test")
-    monkeypatch.setattr(tasks, "_process_source_with_split",
-                        lambda **kwargs: (True, None, 2))
-    monkeypatch.setattr(
-        tasks, "_count_image_metadata_chunks", lambda chunks: 1)
+    monkeypatch.setattr(tasks, "_process_source_with_split", lambda **kwargs: (True, None, 2))
+    monkeypatch.setattr(tasks, "_count_image_metadata_chunks", lambda chunks: 1)
 
     class FakeRedisClient:
         def get(self, key):
             return json.dumps([{"metadata": {"content_type": "image"}}, {"metadata": {}}])
 
-    monkeypatch.setitem(sys.modules, "redis", types.SimpleNamespace(
-        Redis=types.SimpleNamespace(from_url=lambda *a, **k: FakeRedisClient())))
+    monkeypatch.setitem(sys.modules, "redis", types.SimpleNamespace(Redis=types.SimpleNamespace(from_url=lambda *a, **k: FakeRedisClient())))
 
     f = tmp_path / "x.txt"
     f.write_text("hello")
@@ -2456,88 +2309,5 @@ def get(self, key):
     )
     assert out["split_async"] is True
     assert out["image_metadata_chunk_count"] == 1
-    success_state = [s for s in self.states if s.get(
-        "state") == tasks.states.SUCCESS][0]
+    success_state = [s for s in self.states if s.get("state") == tasks.states.SUCCESS][0]
     assert success_state["meta"]["chunks_count"] == 2
-
-
-def test_cleanup_source_skips_when_preserve_true(monkeypatch):
-    tasks, _ = import_tasks_with_fake_ray(monkeypatch)
-    monkeypatch.setattr(tasks, "ELASTICSEARCH_SERVICE", "http://api")
-    monkeypatch.setattr(tasks, "get_knowledge_record",
-                        lambda query=None: {"preserve_source_file": True})
-
-    called = {"delete": 0}
-
-    def _delete(*_a, **_k):
-        called["delete"] += 1
-        raise AssertionError(
-            "requests.delete should not be called when preserve_source_file is True")
-
-    monkeypatch.setattr(tasks.requests, "delete", _delete, raising=True)
-
-    self = FakeSelf("cleanup-skip-1")
-    out = tasks.cleanup_source(
-        self,
-        {"task_id": "t1", "index_name": "idx", "source": "/a.txt"},
-    )
-    assert out["source_cleanup"]["attempted"] is False
-    assert out["source_cleanup"]["skipped_reason"] == "preserve_source_file_true"
-    assert called["delete"] == 0
-
-
-def test_cleanup_source_calls_delete_with_scope_source_only(monkeypatch):
-    tasks, _ = import_tasks_with_fake_ray(monkeypatch)
-    monkeypatch.setattr(tasks, "ELASTICSEARCH_SERVICE", "http://api")
-    monkeypatch.setattr(tasks, "get_knowledge_record",
-                        lambda query=None: {"preserve_source_file": False})
-
-    captured = {}
-
-    class FakeResponse:
-        status_code = 200
-        text = ""
-
-        @staticmethod
-        def json():
-            return {"status": "success"}
-
-    def _delete(url, params=None, timeout=None):
-        captured["url"] = url
-        captured["params"] = params
-        captured["timeout"] = timeout
-        return FakeResponse()
-
-    monkeypatch.setattr(tasks.requests, "delete", _delete, raising=True)
-
-    self = FakeSelf("cleanup-call-1")
-    out = tasks.cleanup_source(
-        self,
-        {"task_id": "t1", "index_name": "idx", "source": "/a.txt"},
-    )
-    assert captured["url"] == "http://api/indices/idx/documents"
-    assert captured["params"]["path_or_url"] == "/a.txt"
-    assert captured["params"]["scope"] == "source_only"
-    assert out["source_cleanup"]["attempted"] is True
-    assert out["source_cleanup"]["success"] is True
-
-
-def test_cleanup_source_failure_is_warning_only(monkeypatch):
-    tasks, _ = import_tasks_with_fake_ray(monkeypatch)
-    monkeypatch.setattr(tasks, "ELASTICSEARCH_SERVICE", "http://api")
-    monkeypatch.setattr(tasks, "get_knowledge_record",
-                        lambda query=None: {"preserve_source_file": False})
-
-    def _delete(*_a, **_k):
-        raise RuntimeError("boom")
-
-    monkeypatch.setattr(tasks.requests, "delete", _delete, raising=True)
-
-    self = FakeSelf("cleanup-fail-1")
-    out = tasks.cleanup_source(
-        self,
-        {"task_id": "t1", "index_name": "idx", "source": "/a.txt"},
-    )
-    assert out["source_cleanup"]["attempted"] is True
-    assert out["source_cleanup"]["success"] is False
-    assert "boom" in (out["source_cleanup"]["error"] or "")
diff --git a/test/backend/data_process/test_worker.py b/test/backend/data_process/test_worker.py
index 79875ba5a..da4408e2f 100644
--- a/test/backend/data_process/test_worker.py
+++ b/test/backend/data_process/test_worker.py
@@ -185,12 +185,7 @@ def __init__(self, chunking_strategy: str, source_type: str, index_name: str, au
             get_model_by_model_id=lambda model_id, tenant_id=None: None
         )
         setattr(sys.modules["database"], "model_management_db", sys.modules["database.model_management_db"])
-    if "database.knowledge_db" not in sys.modules:
-        sys.modules["database.knowledge_db"] = types.SimpleNamespace(
-            get_knowledge_record=lambda query=None: {},
-        )
-        setattr(sys.modules["database"], "knowledge_db", sys.modules["database.knowledge_db"])
-
+    
     # Stub utils modules (required by utils.file_management_utils)
     if "utils.auth_utils" not in sys.modules:
         sys.modules["utils.auth_utils"] = types.SimpleNamespace(
@@ -218,19 +213,6 @@ def __init__(self, chunking_strategy: str, source_type: str, index_name: str, au
         sys.modules["httpx"] = types.SimpleNamespace()
     if "requests" not in sys.modules:
         sys.modules["requests"] = types.SimpleNamespace()
-    if "redis" not in sys.modules:
-        sys.modules["redis"] = types.SimpleNamespace(
-            Redis=types.SimpleNamespace(
-                from_url=lambda *args, **kwargs: types.SimpleNamespace(
-                    get=lambda *a, **k: None,
-                    set=lambda *a, **k: True,
-                    expire=lambda *a, **k: True,
-                    delete=lambda *a, **k: True,
-                    ping=lambda: True,
-                )
-            ),
-            from_url=lambda *args, **kwargs: types.SimpleNamespace(ping=lambda: True),
-        )
     if "fastapi" not in sys.modules:
         fastapi_mod = types.ModuleType("fastapi")
         fastapi_mod.UploadFile = type("UploadFile", (), {})
@@ -241,27 +223,7 @@ def __init__(self, chunking_strategy: str, source_type: str, index_name: str, au
         file_utils_mod = types.ModuleType("utils.file_management_utils")
         file_utils_mod.get_file_size = lambda *args, **kwargs: 0
         sys.modules["utils.file_management_utils"] = file_utils_mod
-
-    # Stub services.redis_service (required by tasks.py via package __init__)
-    if "services.redis_service" not in sys.modules:
-        redis_service_mod = types.ModuleType("services.redis_service")
-
-        class _StubRedisService:
-            def save_error_info(self, *args, **kwargs):
-                return True
-
-            def is_task_cancelled(self, *args, **kwargs):
-                return False
-
-            def save_progress_info(self, *args, **kwargs):
-                return True
-
-            def increment_progress_info(self, *args, **kwargs):
-                return True
-
-        redis_service_mod.get_redis_service = lambda: _StubRedisService()
-        sys.modules["services.redis_service"] = redis_service_mod
-
+    
     # Stub ray_actors (required by tasks.py)
     if "backend.data_process.ray_actors" not in sys.modules:
         ray_actors_mod = types.ModuleType("backend.data_process.ray_actors")
diff --git a/test/backend/database/test_agent_db.py b/test/backend/database/test_agent_db.py
index 77a1d82a9..de2ed8864 100644
--- a/test/backend/database/test_agent_db.py
+++ b/test/backend/database/test_agent_db.py
@@ -77,12 +77,6 @@
 db_models_mock.ToolInstance = MagicMock()
 db_models_mock.AgentRelation = MagicMock()
 
-# Mock database.agent_version_db before agent_db imports it
-agent_version_db_mock = MagicMock()
-agent_version_db_mock.query_current_version_no = MagicMock(return_value=3)
-sys.modules['database.agent_version_db'] = agent_version_db_mock
-sys.modules['backend.database.agent_version_db'] = agent_version_db_mock
-
 # 将模拟的db_models模块添加到sys.modules中
 sys.modules['database.db_models'] = db_models_mock
 sys.modules['backend.database.db_models'] = db_models_mock
@@ -93,8 +87,6 @@
     search_agent_id_by_agent_name,
     search_blank_sub_agent_by_main_agent_id,
     query_sub_agents_id_list,
-    query_sub_agent_relations,
-    resolve_sub_agent_version_no,
     create_agent,
     update_agent,
     delete_agent_by_id,
@@ -132,17 +124,13 @@ def __init__(self):
         self.group_ids = None
         self.is_new = True
         self.enable_context_manager = False
-        self.verification_config = None
-        self.greeting_message = None
-        self.example_questions = None
         self.current_version_no = None
         self.version_no = 0
         self.created_by = None
 
 class MockAgentRelation:
-    def __init__(self, selected_agent_version_no=None):
+    def __init__(self):
         self.selected_agent_id = 2
-        self.selected_agent_version_no = selected_agent_version_no
 
 @pytest.fixture
 def mock_session():
@@ -288,69 +276,6 @@ def test_query_sub_agents_id_list(monkeypatch, mock_session):
 
     assert result == [2]
 
-
-def test_query_sub_agent_relations(monkeypatch, mock_session):
-    """Test querying sub-agent relations including pinned version"""
-    session, query = mock_session
-    mock_relation = MockAgentRelation(selected_agent_version_no=2)
-
-    mock_all = MagicMock()
-    mock_all.return_value = [mock_relation]
-    mock_filter = MagicMock()
-    mock_filter.all = mock_all
-    query.filter.return_value = mock_filter
-
-    mock_ctx = MagicMock()
-    mock_ctx.__enter__.return_value = session
-    mock_ctx.__exit__.return_value = None
-    monkeypatch.setattr("backend.database.agent_db.get_db_session", lambda: mock_ctx)
-    monkeypatch.setattr("backend.database.agent_db.as_dict", lambda obj: obj.__dict__)
-
-    result = query_sub_agent_relations(1, "tenant1", version_no=1)
-
-    assert len(result) == 1
-    assert result[0]["selected_agent_id"] == 2
-    assert result[0]["selected_agent_version_no"] == 2
-
-
-def test_resolve_sub_agent_version_no_pinned(monkeypatch):
-    """Test resolve uses pinned version when set"""
-    result = resolve_sub_agent_version_no(
-        selected_agent_id=2,
-        selected_agent_version_no=5,
-        tenant_id="tenant1",
-    )
-    assert result == 5
-
-
-def test_resolve_sub_agent_version_no_fallback(monkeypatch):
-    """Test resolve falls back to child current_version_no when pin is NULL"""
-    monkeypatch.setattr(
-        "backend.database.agent_db.query_current_version_no",
-        MagicMock(return_value=3),
-    )
-    result = resolve_sub_agent_version_no(
-        selected_agent_id=2,
-        selected_agent_version_no=None,
-        tenant_id="tenant1",
-    )
-    assert result == 3
-
-
-def test_resolve_sub_agent_version_no_fallback_to_draft(monkeypatch):
-    """Test resolve falls back to draft when child has no published version"""
-    monkeypatch.setattr(
-        "backend.database.agent_db.query_current_version_no",
-        MagicMock(return_value=None),
-    )
-    result = resolve_sub_agent_version_no(
-        selected_agent_id=2,
-        selected_agent_version_no=None,
-        tenant_id="tenant1",
-    )
-    assert result == 0
-
-
 def test_create_agent_success(monkeypatch, mock_session):
     """测试成功创建agent"""
     session, query = mock_session
diff --git a/test/backend/database/test_agent_version_db.py b/test/backend/database/test_agent_version_db.py
index fd354b29c..cd9ad8714 100644
--- a/test/backend/database/test_agent_version_db.py
+++ b/test/backend/database/test_agent_version_db.py
@@ -171,7 +171,6 @@ def __init__(self):
         self.id = 1
         self.parent_agent_id = 1
         self.selected_agent_id = 2
-        self.selected_agent_version_no = 3
         self.tenant_id = "tenant1"
         self.version_no = 1
         self.delete_flag = "N"
@@ -179,7 +178,6 @@ def __init__(self):
             "id": 1,
             "parent_agent_id": 1,
             "selected_agent_id": 2,
-            "selected_agent_version_no": 3,
             "tenant_id": "tenant1",
             "version_no": 1,
             "delete_flag": "N",
@@ -544,25 +542,6 @@ def query_side_effect(model_class):
     assert tools_list[0]["tool_id"] == 1
     assert len(relations_list) == 1
     assert relations_list[0]["selected_agent_id"] == 2
-    assert relations_list[0]["selected_agent_version_no"] == 3
-
-
-def test_restore_agent_draft_relation_copy_preserves_selected_agent_version_no():
-    """Verify restore draft relation copy keeps selected_agent_version_no unchanged."""
-    rel = {
-        "relation_id": 10,
-        "parent_agent_id": 1,
-        "selected_agent_id": 2,
-        "selected_agent_version_no": 3,
-        "tenant_id": "tenant1",
-        "version_no": 2,
-    }
-    rel_copy = {k: v for k, v in rel.items() if k not in ("version_no",)}
-    rel_copy["version_no"] = 0
-
-    assert rel_copy["selected_agent_version_no"] == 3
-    assert rel_copy["version_no"] == 0
-    assert rel_copy["selected_agent_id"] == 2
 
 
 def test_query_agent_snapshot_no_agent(monkeypatch, mock_session):
diff --git a/test/backend/services/test_agent_repository_service.py b/test/backend/services/test_agent_repository_service.py
deleted file mode 100644
index 648d20385..000000000
--- a/test/backend/services/test_agent_repository_service.py
+++ /dev/null
@@ -1,398 +0,0 @@
-"""Unit tests for agent marketplace repository service."""
-
-import sys
-from pathlib import Path
-from unittest.mock import AsyncMock, MagicMock, patch
-
-import pytest
-
-_REPO_ROOT = Path(__file__).resolve().parents[3]
-if str(_REPO_ROOT) not in sys.path:
-    sys.path.insert(0, str(_REPO_ROOT))
-
-# Mock DB layer before importing the service under test
-sys.modules.setdefault("sqlalchemy", MagicMock())
-sys.modules.setdefault("sqlalchemy.dialects", MagicMock())
-sys.modules.setdefault("sqlalchemy.dialects.postgresql", MagicMock())
-
-_agent_repo_db_mock = MagicMock()
-_agent_repo_db_mock.STATUS_PENDING_REVIEW = "PENDING_REVIEW"
-_agent_repo_db_mock.VALID_REPOSITORY_STATUSES = frozenset({
-    "NOT_SHARED",
-    "PENDING_REVIEW",
-    "REJECTED",
-    "SHARED",
-})
-_agent_repo_db_mock.get_agent_repository_by_id = MagicMock()
-_agent_repo_db_mock.get_agent_repository_by_agent_id = MagicMock()
-_agent_repo_db_mock.insert_agent_repository_record = MagicMock()
-_agent_repo_db_mock.update_agent_repository_by_id = MagicMock()
-sys.modules["database.agent_repository_db"] = _agent_repo_db_mock
-
-_agent_db_mock = MagicMock()
-_agent_db_mock.search_agent_info_by_agent_id = MagicMock()
-sys.modules["database.agent_db"] = _agent_db_mock
-
-_agent_version_db_mock = MagicMock()
-_agent_version_db_mock.search_version_by_version_no = MagicMock()
-sys.modules["database.agent_version_db"] = _agent_version_db_mock
-
-class _SkillZipEntryMock:
-    def __init__(self, skill_name: str, skill_zip_base64: str):
-        self.skill_name = skill_name
-        self.skill_zip_base64 = skill_zip_base64
-
-
-class _AgentRepositorySnapshotMock:
-    def __init__(self, **kwargs):
-        self._data = kwargs
-
-    def model_dump(self):
-        data = dict(self._data)
-        skills = data.get("skills")
-        if skills:
-            data["skills"] = [
-                {
-                    "skill_name": entry.skill_name,
-                    "skill_zip_base64": entry.skill_zip_base64,
-                }
-                for entry in skills
-            ]
-        return data
-
-
-_consts_model_mock = MagicMock()
-_consts_model_mock.AgentRepositorySnapshot = _AgentRepositorySnapshotMock
-_consts_model_mock.SkillZipEntry = _SkillZipEntryMock
-sys.modules["consts.model"] = _consts_model_mock
-
-_agent_service_mock = MagicMock()
-_agent_service_mock.collect_skill_zip_entries = MagicMock(return_value=[])
-_agent_service_mock.export_agent_dict_for_repository_impl = AsyncMock(return_value={
-    "agent_id": 1,
-    "agent_info": {
-        "1": {
-            "agent_id": 1,
-            "name": "agent_one",
-            "description": "desc",
-            "business_description": "biz",
-            "max_steps": 5,
-            "provide_run_summary": False,
-            "enabled": True,
-            "tools": [],
-            "managed_agents": [],
-        }
-    },
-    "mcp_info": [],
-})
-sys.modules["services.agent_service"] = _agent_service_mock
-
-from consts.const import ASSET_OWNER_TENANT_ID
-
-from backend.services import agent_repository_service as ars
-
-
-@pytest.mark.asyncio
-async def test_create_agent_repository_listing_impl_success():
-    agent_info_json = {
-        "agent_id": 1,
-        "agent_info": {"1": {"agent_id": 1, "name": "agent_one"}},
-        "mcp_info": [],
-        "skills": None,
-    }
-    with patch.object(
-        ars, "_build_repository_data_from_agent", new_callable=AsyncMock
-    ) as mock_build_data, patch.object(
-        ars, "get_agent_repository_by_agent_id"
-    ) as mock_get_by_agent_id, patch.object(
-        ars, "insert_agent_repository_record"
-    ) as mock_insert, patch.object(
-        ars, "get_agent_repository_by_id"
-    ) as mock_get_by_id:
-        mock_build_data.return_value = {
-            "agent_id": 1,
-            "source_version_no": 1,
-            "name": "agent_one",
-            "agent_info_json": agent_info_json,
-            "status": "PENDING_REVIEW",
-        }
-        mock_get_by_agent_id.return_value = None
-        mock_insert.return_value = 42
-        mock_get_by_id.return_value = {
-            "agent_repository_id": 42,
-            "agent_id": 1,
-            "name": "agent_one",
-            "agent_info_json": agent_info_json,
-            "source_version_no": 1,
-            "status": "PENDING_REVIEW",
-            "tags": [],
-        }
-
-        result = await ars.create_agent_repository_listing_impl(
-            agent_id=1,
-            tenant_id="tenant_a",
-            user_id="user_a",
-            version_no=1,
-        )
-
-    assert result["agent_repository_id"] == 42
-    assert result["agent_info_json"] == agent_info_json
-    assert result["is_updated"] is False
-    mock_insert.assert_called_once()
-    mock_get_by_agent_id.assert_called_once_with(1)
-
-
-@pytest.mark.asyncio
-async def test_create_agent_repository_listing_impl_updates_existing():
-    agent_info_json = {
-        "agent_id": 1,
-        "agent_info": {"1": {"agent_id": 1, "name": "agent_one"}},
-        "mcp_info": [],
-        "skills": None,
-    }
-    with patch.object(
-        ars, "_build_repository_data_from_agent", new_callable=AsyncMock
-    ) as mock_build_data, patch.object(
-        ars, "get_agent_repository_by_agent_id"
-    ) as mock_get_by_agent_id, patch.object(
-        ars, "update_agent_repository_by_id"
-    ) as mock_update, patch.object(
-        ars, "get_agent_repository_by_id"
-    ) as mock_get_by_id:
-        mock_build_data.return_value = {
-            "agent_id": 1,
-            "source_version_no": 2,
-            "name": "agent_one",
-            "agent_info_json": agent_info_json,
-            "status": "PENDING_REVIEW",
-        }
-        mock_get_by_agent_id.return_value = {"agent_repository_id": 42}
-        mock_update.return_value = 1
-        mock_get_by_id.return_value = {
-            "agent_repository_id": 42,
-            "agent_id": 1,
-            "name": "agent_one",
-            "agent_info_json": agent_info_json,
-            "source_version_no": 2,
-            "status": "PENDING_REVIEW",
-            "tags": [],
-        }
-
-        result = await ars.create_agent_repository_listing_impl(
-            agent_id=1,
-            tenant_id="tenant_a",
-            user_id="user_a",
-            version_no=2,
-        )
-
-    assert result["agent_repository_id"] == 42
-    assert result["is_updated"] is True
-    mock_update.assert_called_once()
-    mock_update.assert_called_with(
-        repository_id=42,
-        publisher_tenant_id="tenant_a",
-        user_id="user_a",
-        updates={
-            "source_version_no": 2,
-            "agent_info_json": agent_info_json,
-            "status": "PENDING_REVIEW",
-        },
-    )
-
-
-@pytest.mark.asyncio
-async def test_create_agent_repository_listing_impl_accepts_draft_version():
-    agent_info_json = {
-        "agent_id": 1,
-        "agent_info": {"1": {"agent_id": 1, "name": "agent_one"}},
-        "mcp_info": [],
-        "skills": None,
-    }
-    with patch.object(
-        ars, "_build_repository_data_from_agent", new_callable=AsyncMock
-    ) as mock_build_data, patch.object(
-        ars, "get_agent_repository_by_agent_id"
-    ) as mock_get_by_agent_id, patch.object(
-        ars, "insert_agent_repository_record"
-    ) as mock_insert, patch.object(
-        ars, "get_agent_repository_by_id"
-    ) as mock_get_by_id:
-        mock_build_data.return_value = {
-            "agent_id": 1,
-            "source_version_no": 0,
-            "name": "agent_one",
-            "agent_info_json": agent_info_json,
-            "status": "PENDING_REVIEW",
-        }
-        mock_get_by_agent_id.return_value = None
-        mock_insert.return_value = 42
-        mock_get_by_id.return_value = {
-            "agent_repository_id": 42,
-            "agent_id": 1,
-            "name": "agent_one",
-            "agent_info_json": agent_info_json,
-            "source_version_no": 0,
-            "status": "PENDING_REVIEW",
-            "tags": [],
-        }
-
-        result = await ars.create_agent_repository_listing_impl(
-            agent_id=1,
-            tenant_id="tenant_a",
-            user_id="user_a",
-            version_no=0,
-        )
-
-    assert result["agent_repository_id"] == 42
-    assert result["source_version_no"] == 0
-    mock_build_data.assert_awaited_once_with(1, "tenant_a", "user_a", 0)
-
-
-@pytest.mark.asyncio
-async def test_create_agent_repository_listing_impl_rejects_negative_version():
-    with pytest.raises(ValueError, match="version_no must be >= 0"):
-        await ars.create_agent_repository_listing_impl(
-            agent_id=1,
-            tenant_id="tenant_a",
-            user_id="user_a",
-            version_no=-1,
-        )
-
-
-def test_validate_create_payload_requires_agent_info_json():
-    with pytest.raises(ValueError, match="agent_info_json"):
-        ars._validate_create_payload({
-            "agent_id": 1,
-            "source_version_no": 1,
-            "name": "agent_one",
-        })
-
-    with pytest.raises(ValueError, match="agent_info_json must contain"):
-        ars._validate_create_payload({
-            "agent_id": 1,
-            "source_version_no": 1,
-            "name": "agent_one",
-            "agent_info_json": {"agent_id": 1},
-        })
-
-
-@pytest.mark.asyncio
-async def test_build_repository_data_from_agent_includes_skills():
-    SkillZipEntry = _consts_model_mock.SkillZipEntry
-
-    _agent_db_mock.search_agent_info_by_agent_id.return_value = {
-        "name": "agent_one",
-        "display_name": "Agent One",
-        "description": "desc",
-        "author": "author",
-    }
-    _agent_service_mock.export_agent_dict_for_repository_impl.return_value = {
-        "agent_id": 1,
-        "agent_info": {
-            "1": {
-                "agent_id": 1,
-                "name": "agent_one",
-                "description": "desc",
-                "business_description": "biz",
-                "max_steps": 5,
-                "provide_run_summary": False,
-                "enabled": True,
-                "tools": [],
-                "managed_agents": [],
-            }
-        },
-        "mcp_info": [],
-    }
-    _agent_service_mock.collect_skill_zip_entries.return_value = [
-        SkillZipEntry(skill_name="SkillA", skill_zip_base64="abc=")
-    ]
-    _agent_version_db_mock.search_version_by_version_no.return_value = {
-        "version_name": "v1.0"
-    }
-
-    result = await ars._build_repository_data_from_agent(
-        agent_id=1,
-        tenant_id="tenant_a",
-        user_id="user_a",
-        version_no=1,
-    )
-
-    assert result["agent_info_json"]["agent_id"] == 1
-    assert result["agent_info_json"]["skills"][0]["skill_name"] == "SkillA"
-    assert result["version_label"] == "v1.0"
-
-
-def test_validate_agent_info_json_rejects_asset_owner_agent():
-    agent_info_json = {
-        "agent_id": 1,
-        "agent_info": {
-            "1": {"agent_id": 1, "tenant_id": ASSET_OWNER_TENANT_ID, "name": "owner_agent"},
-        },
-        "mcp_info": [],
-    }
-    with pytest.raises(ValueError, match="租户管理员智能体无法共享"):
-        ars._validate_agent_info_json_shareable(agent_info_json)
-
-
-def test_validate_agent_info_json_allows_normal_tenant():
-    agent_info_json = {
-        "agent_id": 1,
-        "agent_info": {
-            "1": {"agent_id": 1, "tenant_id": "tenant_a", "name": "agent_one"},
-            "2": {"agent_id": 2, "tenant_id": "tenant_b", "name": "sub_agent"},
-        },
-        "mcp_info": [],
-    }
-    ars._validate_agent_info_json_shareable(agent_info_json)
-
-
-@pytest.mark.asyncio
-async def test_build_repository_data_from_agent_rejects_asset_owner():
-    _agent_db_mock.search_agent_info_by_agent_id.return_value = {
-        "name": "agent_one",
-        "display_name": "Agent One",
-        "description": "desc",
-        "author": "author",
-    }
-    _agent_service_mock.export_agent_dict_for_repository_impl.return_value = {
-        "agent_id": 1,
-        "agent_info": {
-            "1": {
-                "agent_id": 1,
-                "tenant_id": "tenant_a",
-                "name": "agent_one",
-                "description": "desc",
-                "business_description": "biz",
-                "max_steps": 5,
-                "provide_run_summary": False,
-                "enabled": True,
-                "tools": [],
-                "managed_agents": [],
-            },
-            "2": {
-                "agent_id": 2,
-                "tenant_id": ASSET_OWNER_TENANT_ID,
-                "name": "sub_owner_agent",
-                "description": "desc",
-                "business_description": "biz",
-                "max_steps": 5,
-                "provide_run_summary": False,
-                "enabled": True,
-                "tools": [],
-                "managed_agents": [],
-            },
-        },
-        "mcp_info": [],
-    }
-    _agent_service_mock.collect_skill_zip_entries.return_value = []
-    _agent_version_db_mock.search_version_by_version_no.return_value = {
-        "version_name": "v1.0"
-    }
-
-    with pytest.raises(ValueError, match="租户管理员智能体无法共享"):
-        await ars._build_repository_data_from_agent(
-            agent_id=1,
-            tenant_id="tenant_a",
-            user_id="user_a",
-            version_no=1,
-        )
diff --git a/test/backend/services/test_agent_service.py b/test/backend/services/test_agent_service.py
index 6cd7b5da4..86c8a5e2c 100644
--- a/test/backend/services/test_agent_service.py
+++ b/test/backend/services/test_agent_service.py
@@ -92,7 +92,6 @@ def model_dump(self, **kwargs):
 sys.modules['services.agent_version_service'] = agent_version_service_mock
 sys.modules['services.skill_service'] = skill_service_mock
 sys.modules['services.prompt_template_service'] = prompt_template_service_mock
-sys.modules['services.file_management_service'] = MagicMock()
 sys.modules['services.skill_service'] = MagicMock()
 setattr(services_module, 'skill_service', sys.modules['services.skill_service'])
 
@@ -333,10 +332,6 @@ def apply_default_prompt_template_request_fields(request, prompt_template_id=Non
         request.related_agent_ids = None
     if not hasattr(request, "enabled_tool_ids"):
         request.enabled_tool_ids = None
-    if not hasattr(request, "example_questions"):
-        request.example_questions = None
-    if not hasattr(request, "greeting_message"):
-        request.greeting_message = None
     return request
 
 
@@ -505,7 +500,6 @@ async def test_get_agent_info_impl_success(mock_search_agent_info, mock_search_t
     mock_check_availability.assert_called_once()
 
 
-@patch('backend.services.agent_service.query_current_version_no')
 @patch('backend.services.agent_service.SkillService')
 @patch('backend.services.agent_service.query_external_sub_agents')
 @patch('backend.services.agent_service.check_agent_availability')
@@ -514,7 +508,7 @@ async def test_get_agent_info_impl_success(mock_search_agent_info, mock_search_t
 @patch('backend.services.agent_service.search_tools_for_sub_agent')
 @patch('backend.services.agent_service.search_agent_info_by_agent_id')
 @pytest.mark.asyncio
-async def test_get_agent_info_impl_with_version_no(mock_search_agent_info, mock_search_tools, mock_query_sub_agents_id, mock_get_model_by_model_id, mock_check_availability, mock_query_external_sub_agents, mock_skill_service, mock_query_current_version_no):
+async def test_get_agent_info_impl_with_version_no(mock_search_agent_info, mock_search_tools, mock_query_sub_agents_id, mock_get_model_by_model_id, mock_check_availability, mock_query_external_sub_agents, mock_skill_service):
     """
     Test get_agent_info_impl with explicit version_no parameter.
 
@@ -550,9 +544,6 @@ async def test_get_agent_info_impl_with_version_no(mock_search_agent_info, mock_
     # Mock check_agent_availability - agent is available
     mock_check_availability.return_value = (True, [])
 
-    # Mock query_current_version_no - return 5 as the current version
-    mock_query_current_version_no.return_value = 5
-
     # Execute with explicit version_no
     result = await get_agent_info_impl(agent_id=123, tenant_id="test_tenant", version_no=5)
 
@@ -570,8 +561,7 @@ async def test_get_agent_info_impl_with_version_no(mock_search_agent_info, mock_
         "prompt_template_id": 0,
         "prompt_template_name": "system_default",
         "is_available": True,
-        "unavailable_reasons": [],
-        "current_version_no": 5
+        "unavailable_reasons": []
     }
     assert result == expected_result
     # Verify version_no is passed correctly
@@ -581,8 +571,6 @@ async def test_get_agent_info_impl_with_version_no(mock_search_agent_info, mock_
     mock_query_sub_agents_id.assert_called_once_with(
         main_agent_id=123, tenant_id="test_tenant")
     mock_check_availability.assert_called_once()
-    # Verify query_current_version_no is called for version_no > 0
-    mock_query_current_version_no.assert_called_once_with(123, "test_tenant")
 
 
 @patch('backend.services.agent_service.get_model_by_model_id')
@@ -756,7 +744,6 @@ async def test_update_agent_info_impl_exception_handling(mock_get_current_user_i
     request.display_name = "Test Display Name"
     request.enabled_tool_ids = None
     request.related_agent_ids = None
-    request.example_questions = None
     apply_default_prompt_template_request_fields(request)
 
     # Execute & Assert
@@ -1443,7 +1430,7 @@ async def test_export_agent_impl_success(mock_get_current_user_info, mock_export
     # Verify function calls
     mock_get_current_user_info.assert_called_once_with("Bearer token")
     mock_export_agent_by_id.assert_called_once_with(
-        agent_id=123, tenant_id="test_tenant", user_id="test_user", version_no=0)
+        agent_id=123, tenant_id="test_tenant", user_id="test_user")
     mock_get_mcp_server.assert_called_once_with(
         "test_mcp_server", "test_tenant")
     mock_export_data_format.assert_called_once()
@@ -1523,7 +1510,7 @@ async def test_export_agent_impl_no_mcp_tools(mock_get_current_user_info, mock_e
     # Verify function calls
     mock_get_current_user_info.assert_called_once_with("Bearer token")
     mock_export_agent_by_id.assert_called_once_with(
-        agent_id=123, tenant_id="test_tenant", user_id="test_user", version_no=0)
+        agent_id=123, tenant_id="test_tenant", user_id="test_user")
     # Should not be called when no MCP tools
     mock_get_mcp_server.assert_not_called()
     mock_export_data_format.assert_called_once()
@@ -2995,8 +2982,7 @@ async def test_export_agent_by_agent_id_success(mock_search_agent_info, mock_cre
         "duty_prompt": "Test duty prompt",
         "constraint_prompt": "Test constraint prompt",
         "few_shots_prompt": "Test few shots prompt",
-        "enabled": True,
-        "tenant_id": "test_tenant",
+        "enabled": True
     }
     mock_search_agent_info.return_value = mock_agent_info
 
@@ -3072,7 +3058,6 @@ async def test_export_agent_by_agent_id_success(mock_search_agent_info, mock_cre
 
     # Assert
     assert result.agent_id == 123
-    assert result.tenant_id == "test_tenant"
     assert result.name == "Test Agent"
     assert result.business_description == "For testing purposes"
     assert len(result.tools) == 5
@@ -3098,11 +3083,11 @@ async def test_export_agent_by_agent_id_success(mock_search_agent_info, mock_cre
 
     # Verify function calls
     mock_search_agent_info.assert_called_once_with(
-        agent_id=123, tenant_id="test_tenant", version_no=0)
+        agent_id=123, tenant_id="test_tenant")
     mock_create_tool_config.assert_called_once_with(
-        agent_id=123, tenant_id="test_tenant", user_id="test_user", version_no=0)
+        agent_id=123, tenant_id="test_tenant", user_id="test_user")
     mock_query_sub_agents_id.assert_called_once_with(
-        main_agent_id=123, tenant_id="test_tenant", version_no=0)
+        main_agent_id=123, tenant_id="test_tenant")
 
 
 @patch('backend.services.agent_service.create_or_update_tool_by_tool_info')
@@ -5172,7 +5157,6 @@ async def test_export_agent_includes_model_names(
         "constraint_prompt": "Test constraints",
         "few_shots_prompt": "Test examples",
         "enabled": True,
-        "tenant_id": "test_tenant",
         "model_id": 5,
         "business_logic_model_id": 4
     }
@@ -5238,7 +5222,6 @@ async def test_export_agent_with_null_model_id(
         "constraint_prompt": "Test constraints",
         "few_shots_prompt": "Test examples",
         "enabled": True,
-        "tenant_id": "test_tenant",
         "model_id": None,  # NULL in database
         "business_logic_model_id": None  # NULL in database
     }
@@ -5301,7 +5284,6 @@ async def test_export_then_import_preserves_model_names(
         "constraint_prompt": "Follow safety rules",
         "few_shots_prompt": "Example tasks",
         "enabled": True,
-        "tenant_id": "source_tenant",
         "model_id": 10,  # Model ID in source tenant
         "business_logic_model_id": 9  # Business logic model ID in source tenant
     }
@@ -5417,7 +5399,6 @@ async def test_export_agent_model_not_found(
         "constraint_prompt": "Test",
         "few_shots_prompt": "Test",
         "enabled": True,
-        "tenant_id": "test_tenant",
         "model_id": 999,  # This model doesn't exist
         "business_logic_model_id": 998  # This model doesn't exist
     }
@@ -8751,176 +8732,6 @@ def convert_side_effect(x):
     assert result[0]["permission"] == PERMISSION_READ
 
 
-def _mock_get_agent_info_impl_dependencies(
-    mock_search_agent_info,
-    mock_search_tools,
-    mock_query_sub_agents_id,
-    mock_get_model_by_model_id,
-    mock_check_availability,
-    mock_query_external_sub_agents,
-    mock_skill_service,
-    agent_info,
-):
-    """Configure common mocks for get_agent_info_impl permission tests."""
-    defaults = {"model_id": None}
-    mock_search_agent_info.return_value = {**defaults, **agent_info}
-    mock_search_tools.return_value = []
-    mock_query_sub_agents_id.return_value = []
-    mock_query_external_sub_agents.return_value = []
-    mock_get_model_by_model_id.return_value = None
-    mock_check_availability.return_value = (True, [])
-    mock_skill_service_instance = MagicMock()
-    mock_skill_service_instance.list_skill_instances.return_value = []
-    mock_skill_service.return_value = mock_skill_service_instance
-
-
-@patch("backend.services.agent_service.SkillService")
-@patch("backend.services.agent_service.query_external_sub_agents")
-@patch("backend.services.agent_service.check_agent_availability")
-@patch("backend.services.agent_service.get_model_by_model_id")
-@patch("backend.services.agent_service.query_sub_agents_id_list")
-@patch("backend.services.agent_service.search_tools_for_sub_agent")
-@patch("backend.services.agent_service.search_agent_info_by_agent_id")
-@patch("backend.services.agent_service.get_user_tenant_by_user_id")
-@pytest.mark.asyncio
-async def test_get_agent_info_impl_asset_owner_agent_read_only_for_admin(
-    mock_get_user_tenant,
-    mock_search_agent_info,
-    mock_search_tools,
-    mock_query_sub_agents_id,
-    mock_get_model_by_model_id,
-    mock_check_availability,
-    mock_query_external_sub_agents,
-    mock_skill_service,
-):
-    """ASSET_OWNER-scoped agent detail is READ_ONLY for ADMIN viewers."""
-    from consts.const import ASSET_OWNER_TENANT_ID, PERMISSION_EDIT, PERMISSION_READ
-
-    agent_info = {
-        "agent_id": 99,
-        "tenant_id": ASSET_OWNER_TENANT_ID,
-        "created_by": "admin_user",
-        "ingroup_permission": PERMISSION_EDIT,
-    }
-    _mock_get_agent_info_impl_dependencies(
-        mock_search_agent_info,
-        mock_search_tools,
-        mock_query_sub_agents_id,
-        mock_get_model_by_model_id,
-        mock_check_availability,
-        mock_query_external_sub_agents,
-        mock_skill_service,
-        agent_info,
-    )
-    mock_get_user_tenant.return_value = {"user_role": "ADMIN"}
-
-    result = await get_agent_info_impl(
-        agent_id=99,
-        tenant_id="regular_tenant",
-        user_id="admin_user",
-    )
-
-    assert result["permission"] == PERMISSION_READ
-
-
-@patch("backend.services.agent_service.SkillService")
-@patch("backend.services.agent_service.query_external_sub_agents")
-@patch("backend.services.agent_service.check_agent_availability")
-@patch("backend.services.agent_service.get_model_by_model_id")
-@patch("backend.services.agent_service.query_sub_agents_id_list")
-@patch("backend.services.agent_service.search_tools_for_sub_agent")
-@patch("backend.services.agent_service.search_agent_info_by_agent_id")
-@patch("backend.services.agent_service.get_user_tenant_by_user_id")
-@pytest.mark.asyncio
-async def test_get_agent_info_impl_asset_owner_agent_read_only_for_dev(
-    mock_get_user_tenant,
-    mock_search_agent_info,
-    mock_search_tools,
-    mock_query_sub_agents_id,
-    mock_get_model_by_model_id,
-    mock_check_availability,
-    mock_query_external_sub_agents,
-    mock_skill_service,
-):
-    """ASSET_OWNER-scoped agent detail is READ_ONLY for DEV even with ingroup EDIT."""
-    from consts.const import ASSET_OWNER_TENANT_ID, PERMISSION_EDIT, PERMISSION_READ
-
-    agent_info = {
-        "agent_id": 99,
-        "tenant_id": ASSET_OWNER_TENANT_ID,
-        "created_by": "asset_owner_user",
-        "ingroup_permission": PERMISSION_EDIT,
-    }
-    _mock_get_agent_info_impl_dependencies(
-        mock_search_agent_info,
-        mock_search_tools,
-        mock_query_sub_agents_id,
-        mock_get_model_by_model_id,
-        mock_check_availability,
-        mock_query_external_sub_agents,
-        mock_skill_service,
-        agent_info,
-    )
-    mock_get_user_tenant.return_value = {"user_role": "DEV"}
-
-    result = await get_agent_info_impl(
-        agent_id=99,
-        tenant_id="regular_tenant",
-        user_id="dev_user",
-    )
-
-    assert result["permission"] == PERMISSION_READ
-
-
-@patch("backend.services.agent_service.SkillService")
-@patch("backend.services.agent_service.query_external_sub_agents")
-@patch("backend.services.agent_service.check_agent_availability")
-@patch("backend.services.agent_service.get_model_by_model_id")
-@patch("backend.services.agent_service.query_sub_agents_id_list")
-@patch("backend.services.agent_service.search_tools_for_sub_agent")
-@patch("backend.services.agent_service.search_agent_info_by_agent_id")
-@patch("backend.services.agent_service.get_user_tenant_by_user_id")
-@pytest.mark.asyncio
-async def test_get_agent_info_impl_asset_owner_role_gets_edit(
-    mock_get_user_tenant,
-    mock_search_agent_info,
-    mock_search_tools,
-    mock_query_sub_agents_id,
-    mock_get_model_by_model_id,
-    mock_check_availability,
-    mock_query_external_sub_agents,
-    mock_skill_service,
-):
-    """ASSET_OWNER role creator retains EDIT on ASSET_OWNER-scoped agent detail."""
-    from consts.const import ASSET_OWNER_ROLE, ASSET_OWNER_TENANT_ID, PERMISSION_EDIT, PERMISSION_READ
-
-    agent_info = {
-        "agent_id": 99,
-        "tenant_id": ASSET_OWNER_TENANT_ID,
-        "created_by": "asset_owner_user",
-        "ingroup_permission": PERMISSION_READ,
-    }
-    _mock_get_agent_info_impl_dependencies(
-        mock_search_agent_info,
-        mock_search_tools,
-        mock_query_sub_agents_id,
-        mock_get_model_by_model_id,
-        mock_check_availability,
-        mock_query_external_sub_agents,
-        mock_skill_service,
-        agent_info,
-    )
-    mock_get_user_tenant.return_value = {"user_role": ASSET_OWNER_ROLE}
-
-    result = await get_agent_info_impl(
-        agent_id=99,
-        tenant_id=ASSET_OWNER_TENANT_ID,
-        user_id="asset_owner_user",
-    )
-
-    assert result["permission"] == PERMISSION_EDIT
-
-
 @pytest.mark.asyncio
 @patch("backend.services.agent_service.get_model_by_model_id")
 @patch("backend.services.agent_service.check_agent_availability")
@@ -9243,8 +9054,6 @@ async def test_update_agent_info_impl_skill_update_exception(
     mock_request.ingroup_permission = None
     mock_request.prompt_template_id = None
     mock_request.prompt_template_name = None
-    mock_request.example_questions = None
-    mock_request.greeting_message = None
 
     mock_query_skills.return_value = []
     mock_create_skill.side_effect = Exception("Skill update failed")
@@ -9305,73 +9114,79 @@ def test_generate_stream_with_memory_decorated():
 # =============================================================================
 
 @pytest.mark.asyncio
-@patch('backend.services.agent_service.collect_skill_zip_entries')
-@patch('backend.services.agent_service.export_agent_dict_impl')
+@patch('backend.services.agent_service.search_agent_info_by_agent_id')
+@patch('backend.services.agent_service.export_agent_impl')
 @patch('backend.services.agent_service.get_current_user_info')
-async def test_export_agent_with_skills_impl_no_skills(
-    mock_get_user_info, mock_export_dict_impl, mock_collect_skills
-):
-    """Test export_agent_with_skills_impl returns dict when agent has no skill instances."""
+async def test_export_agent_with_skills_impl_no_skills(mock_get_user_info, mock_export_impl, mock_search_info):
+    """Test export_agent_with_skills_impl returns JSON when agent has no skill instances."""
     from backend.services.agent_service import export_agent_with_skills_impl
+    from backend.services import agent_service as ag_svc
 
     mock_get_user_info.return_value = ("user_123", "tenant_abc", "en")
-    mock_export_dict_impl.return_value = {"agent_id": 1, "agent_info": {}}
-    mock_collect_skills.return_value = []
+    mock_export_impl.return_value = '{"agent_id": 1, "agent_info": {}}'
+    mock_search_info.return_value = {"name": "test_agent"}
 
-    result = await export_agent_with_skills_impl(agent_id=1, authorization="Bearer token")
+    # Mock skill_db.query_skill_instances_by_agent_id to return empty list
+    with patch.object(ag_svc.skill_db, 'query_skill_instances_by_agent_id', return_value=[]):
+        result = await export_agent_with_skills_impl(agent_id=1, authorization="Bearer token")
 
-    assert result == {"agent_id": 1, "agent_info": {}}
-    mock_export_dict_impl.assert_called_once_with(
-        1, "Bearer token", version_no=0
-    )
+    assert result == '{"agent_id": 1, "agent_info": {}}'
+    mock_export_impl.assert_called_once_with(1, "Bearer token")
 
 
 @pytest.mark.asyncio
-@patch('backend.services.agent_service.collect_skill_zip_entries')
-@patch('backend.services.agent_service.export_agent_dict_impl')
+@patch('backend.services.agent_service.search_agent_info_by_agent_id')
+@patch('backend.services.agent_service.export_agent_impl')
 @patch('backend.services.agent_service.get_current_user_info')
-async def test_export_agent_with_skills_impl_skills_but_no_names(
-    mock_get_user_info, mock_export_dict_impl, mock_collect_skills
-):
-    """Test export_agent_with_skills_impl returns dict when skill export yields nothing."""
+async def test_export_agent_with_skills_impl_skills_but_no_names(mock_get_user_info, mock_export_impl, mock_search_info):
+    """Test export_agent_with_skills_impl returns JSON when skill instances have no names."""
     from backend.services.agent_service import export_agent_with_skills_impl
+    from backend.services import agent_service as ag_svc
 
     mock_get_user_info.return_value = ("user_123", "tenant_abc", "en")
-    mock_export_dict_impl.return_value = {"agent_id": 1, "agent_info": {}}
-    mock_collect_skills.return_value = []
+    mock_export_impl.return_value = '{"agent_id": 1, "agent_info": {}}'
+    mock_search_info.return_value = {"name": "test_agent"}
 
-    result = await export_agent_with_skills_impl(agent_id=1, authorization="Bearer token")
+    # Mock skill_db to return skill instances without names
+    with patch.object(ag_svc.skill_db, 'query_skill_instances_by_agent_id', return_value=[{"skill_id": 1}]):
+        with patch.object(ag_svc.skill_db, 'get_skill_by_id', return_value=None):
+            result = await export_agent_with_skills_impl(agent_id=1, authorization="Bearer token")
 
-    assert result == {"agent_id": 1, "agent_info": {}}
-    mock_export_dict_impl.assert_called_once()
+    assert result == '{"agent_id": 1, "agent_info": {}}'
+    mock_export_impl.assert_called_once()
 
 
 @pytest.mark.asyncio
 @patch('backend.services.agent_service.search_agent_info_by_agent_id')
-@patch('backend.services.agent_service.collect_skill_zip_entries')
 @patch('backend.services.agent_service.get_current_user_info')
-async def test_export_agent_with_skills_impl_with_zip(
-    mock_get_user_info, mock_collect_skills, mock_search_info
-):
+async def test_export_agent_with_skills_impl_with_zip(mock_get_user_info, mock_search_info):
     """Test export_agent_with_skills_impl returns ZIP when agent has skills."""
     from backend.services.agent_service import export_agent_with_skills_impl
     from backend.services import agent_service as ag_svc
-    from consts.model import SkillZipEntry
     import io
     import zipfile
 
     mock_get_user_info.return_value = ("user_123", "tenant_abc", "en")
     mock_search_info.return_value = {"name": "my_agent"}
-    mock_collect_skills.return_value = [
-        SkillZipEntry(skill_name="TestSkill", skill_zip_base64="SGVsbG8gV29ybGQ=")
+
+    skill_instance = {"skill_id": 100}
+    skill_info = {"name": "TestSkill", "skill_id": 100}
+
+    mock_skill_service = MagicMock()
+    mock_skill_service.export_skills_by_names.return_value = [
+        {"skill_name": "TestSkill", "skill_zip_base64": "SGVsbG8gV29ybGQ="}  # "Hello World" in base64
     ]
 
-    with patch.object(ag_svc, 'export_agent_impl', return_value='{"agent_id": 1}'):
-        result = await export_agent_with_skills_impl(agent_id=1, authorization="Bearer token")
+    with patch.object(ag_svc.skill_db, 'query_skill_instances_by_agent_id', return_value=[skill_instance]):
+        with patch.object(ag_svc.skill_db, 'get_skill_by_id', return_value=skill_info):
+            with patch.object(ag_svc, 'export_agent_impl', return_value='{"agent_id": 1}'):
+                with patch('services.skill_service.SkillService', return_value=mock_skill_service):
+                    result = await export_agent_with_skills_impl(agent_id=1, authorization="Bearer token")
 
     assert result["_zip"] is True
     assert "data" in result
     assert result["filename"] == "my_agent.zip"
+    # Verify it's a valid ZIP
     zip_data = io.BytesIO(result["data"])
     with zipfile.ZipFile(zip_data, 'r') as zf:
         assert "agent.json" in zf.namelist()
@@ -9507,8 +9322,6 @@ async def test_update_agent_info_impl_related_agent_query_error(
     mock_request.ingroup_permission = None
     mock_request.prompt_template_id = None
     mock_request.prompt_template_name = None
-    mock_request.example_questions = None
-    mock_request.greeting_message = None
 
     # Make query_sub_agents_id_list raise exception during circular check
     mock_query_sub.side_effect = Exception("Query error")
@@ -9558,8 +9371,6 @@ async def test_update_agent_info_impl_related_external_agents(
     mock_request.ingroup_permission = None
     mock_request.prompt_template_id = None
     mock_request.prompt_template_name = None
-    mock_request.example_questions = None
-    mock_request.greeting_message = None
 
     # Mock current relations (empty)
     with patch.object(ag_svc.a2a_agent_db, 'list_external_relations_by_local_agent', return_value=[]):
@@ -9610,8 +9421,6 @@ async def test_update_agent_info_impl_external_agent_remove_relation(
     mock_request.ingroup_permission = None
     mock_request.prompt_template_id = None
     mock_request.prompt_template_name = None
-    mock_request.example_questions = None
-    mock_request.greeting_message = None
 
     # Mock current relations has the ID
     with patch.object(ag_svc.a2a_agent_db, 'list_external_relations_by_local_agent',
@@ -9663,8 +9472,6 @@ async def test_update_agent_info_impl_external_agent_relation_exists(
     mock_request.ingroup_permission = None
     mock_request.prompt_template_id = None
     mock_request.prompt_template_name = None
-    mock_request.example_questions = None
-    mock_request.greeting_message = None
 
     # Mock current relations includes the same ID - add should raise ValueError (already exists)
     with patch.object(ag_svc.a2a_agent_db, 'list_external_relations_by_local_agent',
@@ -9777,8 +9584,6 @@ async def test_update_agent_info_impl_skill_unselected(
     mock_request.ingroup_permission = None
     mock_request.prompt_template_id = None
     mock_request.prompt_template_name = None
-    mock_request.example_questions = None
-    mock_request.greeting_message = None
 
     result = await update_agent_info_impl(mock_request, authorization="Bearer token")
 
@@ -10127,126 +9932,8 @@ async def test_update_agent_info_impl_external_agent_list_error(mock_get_user):
     mock_request.ingroup_permission = None
     mock_request.prompt_template_id = None
     mock_request.prompt_template_name = None
-    mock_request.example_questions = None
-    mock_request.greeting_message = None
 
     with patch.object(ag_svc.a2a_agent_db, 'list_external_relations_by_local_agent',
                      side_effect=Exception("DB error")):
         with pytest.raises(ValueError, match="Failed to update related external agents"):
             await update_agent_info_impl(mock_request, authorization="Bearer token")
-
-
-@patch('backend.services.agent_service.get_current_user_info')
-@pytest.mark.asyncio
-async def test_update_agent_info_impl_example_questions_exceed_limit(mock_get_current_user_info):
-    """Test update_agent_info_impl raises AppException when example_questions exceeds 6 items."""
-    from consts.error_code import ErrorCode
-    from consts.exceptions import AppException
-
-    mock_get_current_user_info.return_value = ("test_user", "test_tenant", "en")
-
-    request = MagicMock()
-    request.agent_id = 123
-    request.model_id = None
-    request.example_questions = ["q1", "q2", "q3", "q4", "q5", "q6", "q7"]
-    request.enabled_tool_ids = None
-    request.related_agent_ids = None
-    apply_default_prompt_template_request_fields(request)
-
-    with pytest.raises(AppException) as exc_info:
-        await update_agent_info_impl(request, authorization="Bearer token")
-
-    assert exc_info.value.error_code == ErrorCode.COMMON_PARAMETER_INVALID
-
-
-# =============================================================================
-# Tests for version_no export and repository export helpers
-# =============================================================================
-
-@pytest.mark.asyncio
-@patch('backend.services.agent_service.resolve_sub_agent_version_no')
-@patch('backend.services.agent_service.query_sub_agent_relations')
-@patch('backend.services.agent_service.export_agent_by_agent_id')
-async def test_export_agent_dict_impl_uses_pinned_sub_agent_versions(
-    mock_export_agent_by_id,
-    mock_query_relations,
-    mock_resolve_version,
-):
-    """BFS export should enqueue sub-agents with their pinned version numbers."""
-    from backend.services.agent_service import export_agent_dict_impl
-    from consts.model import ExportAndImportAgentInfo
-
-    root_agent = ExportAndImportAgentInfo(
-        agent_id=1,
-        name="root",
-        display_name="Root",
-        description="desc",
-        business_description="biz",
-        max_steps=5,
-        provide_run_summary=False,
-        enabled=True,
-        tools=[],
-        managed_agents=[2],
-    )
-    child_agent = ExportAndImportAgentInfo(
-        agent_id=2,
-        name="child",
-        display_name="Child",
-        description="desc",
-        business_description="biz",
-        max_steps=5,
-        provide_run_summary=False,
-        enabled=True,
-        tools=[],
-        managed_agents=[],
-    )
-
-    async def _export_side_effect(agent_id, tenant_id, user_id, version_no=0):
-        if agent_id == 1:
-            return root_agent
-        return child_agent
-
-    mock_export_agent_by_id.side_effect = _export_side_effect
-    mock_query_relations.side_effect = [
-        [{"selected_agent_id": 2, "selected_agent_version_no": 3}],
-        [],
-    ]
-    mock_resolve_version.return_value = 3
-
-    with patch('backend.services.agent_service.get_current_user_info', return_value=("u", "t", "en")):
-        result = await export_agent_dict_impl(agent_id=1, authorization="Bearer token", version_no=2)
-
-    assert result["agent_id"] == 1
-    assert "1" in result["agent_info"]
-    assert "2" in result["agent_info"]
-    mock_export_agent_by_id.assert_any_call(
-        agent_id=1, tenant_id="t", user_id="u", version_no=2
-    )
-    mock_export_agent_by_id.assert_any_call(
-        agent_id=2, tenant_id="t", user_id="u", version_no=3
-    )
-
-
-@pytest.mark.asyncio
-@patch('backend.services.agent_service._export_agent_dict_core')
-async def test_export_agent_dict_for_repository_impl(mock_export_core):
-    """Repository export helper should delegate to core export without auth header."""
-    from backend.services.agent_service import export_agent_dict_for_repository_impl
-
-    mock_export_core.return_value = {
-        "agent_id": 10,
-        "agent_info": {},
-        "mcp_info": [],
-    }
-
-    result = await export_agent_dict_for_repository_impl(
-        agent_id=10, tenant_id="tenant_a", user_id="user_a", version_no=1
-    )
-
-    assert result["agent_id"] == 10
-    mock_export_core.assert_called_once_with(
-        root_agent_id=10,
-        tenant_id="tenant_a",
-        user_id="user_a",
-        version_no=1,
-    )
diff --git a/test/backend/services/test_agent_version_service.py b/test/backend/services/test_agent_version_service.py
index 10cf67ca1..5c3f231b5 100644
--- a/test/backend/services/test_agent_version_service.py
+++ b/test/backend/services/test_agent_version_service.py
@@ -1,6 +1,5 @@
 import asyncio
 import sys
-import types
 import pytest
 from unittest.mock import patch, MagicMock
 from contextlib import contextmanager
@@ -19,26 +18,10 @@
 consts_mock.const.POSTGRES_DB = "test_db"
 consts_mock.const.POSTGRES_PORT = 5432
 consts_mock.const.DEFAULT_TENANT_ID = "default_tenant"
-consts_mock.const.AGENT_PROMPTS_HIDDEN_FLAG = "prompts_hidden"
-consts_mock.const.ASSET_OWNER_ROLE = "ASSET_OWNER"
-consts_mock.const.ASSET_OWNER_TENANT_ID = "asset_owner_tenant_id"
-consts_mock.const.ENABLE_ASSET_OWNER_ROLE = False
-consts_mock.const.PERMISSION_EDIT = "EDIT"
-consts_mock.const.PERMISSION_READ = "READ_ONLY"
 
 sys.modules['consts'] = consts_mock
 sys.modules['consts.const'] = consts_mock.const
 
-consts_exceptions_mod = types.ModuleType("consts.exceptions")
-
-
-class ValidationError(Exception):
-    pass
-
-
-consts_exceptions_mod.ValidationError = ValidationError
-sys.modules['consts.exceptions'] = consts_exceptions_mod
-
 # Mock consts.agent_unavailable_reasons
 agent_unavailable_reasons_mock = MagicMock()
 agent_unavailable_reasons_mock.AgentUnavailableReason = type('AgentUnavailableReason', (), {
@@ -223,13 +206,8 @@ def mock_tools_draft():
 
 
 @pytest.fixture
-def mock_relations_draft(monkeypatch):
+def mock_relations_draft():
     """Mock relations draft data"""
-    monkeypatch.setattr(
-        agent_version_service_module,
-        "query_current_version_no",
-        MagicMock(return_value=1),
-    )
     return [
         {
             "id": 1,
@@ -301,34 +279,9 @@ def test_publish_version_impl_success(monkeypatch, mock_agent_draft, mock_tools_
     mock_insert_agent.assert_called_once()
     assert mock_insert_tool.call_count == 2
     assert mock_insert_relation.call_count == 1
-    relation_snapshot = mock_insert_relation.call_args[0][0]
-    assert relation_snapshot["selected_agent_version_no"] == 1
     assert mock_insert_skill.call_count == 1
 
 
-def test_publish_version_impl_unpublished_sub_agent(
-    monkeypatch, mock_agent_draft, mock_tools_draft, mock_relations_draft, mock_skills_draft
-):
-    """Test publishing fails when a sub-agent has no published version"""
-    mock_query_draft = MagicMock(
-        return_value=(mock_agent_draft, mock_tools_draft, mock_relations_draft)
-    )
-    monkeypatch.setattr(agent_version_service_module, "query_agent_draft", mock_query_draft)
-    monkeypatch.setattr(
-        agent_version_service_module,
-        "query_current_version_no",
-        MagicMock(return_value=None),
-    )
-    monkeypatch.setattr(agent_version_service_module, "get_next_version_no", MagicMock(return_value=1))
-
-    with pytest.raises(ValueError, match="Sub-agent 2 has no published version"):
-        publish_version_impl(
-            agent_id=1,
-            tenant_id="tenant1",
-            user_id="user1",
-        )
-
-
 def test_publish_version_impl_no_draft(monkeypatch):
     """Test publishing when draft doesn't exist"""
     mock_query_draft = MagicMock(return_value=(None, [], []))
@@ -1331,7 +1284,6 @@ def test_get_version_detail_or_draft_draft_version(monkeypatch):
     assert result["version"]["version_status"] == "DRAFT"
     assert len(result["tools"]) == 1
     assert result["sub_agent_id_list"] == [2]
-    assert result["sub_agent_relations"] == [{"agent_id": 2, "version_no": None}]
     assert len(result["skills"]) == 1
 
 
@@ -1535,7 +1487,7 @@ def test_list_published_agents_impl_success(monkeypatch):
         return_value=(True, [])
     )
     agent_service_mock._apply_duplicate_name_availability_rules = MagicMock()
-    agent_service_mock.get_model_by_model_id = MagicMock(
+    model_management_db_mock.get_model_by_model_id = MagicMock(
         return_value={"display_name": "Test Model", "model_name": "test_model"}
     )
 
@@ -1688,15 +1640,15 @@ def test_list_published_agents_impl_user_with_groups(monkeypatch):
         return_value=(True, [])
     )
     agent_service_mock._apply_duplicate_name_availability_rules = MagicMock()
-    agent_service_mock.get_model_by_model_id = MagicMock(
+    model_management_db_mock.get_model_by_model_id = MagicMock(
         return_value={"display_name": "Test Model", "model_name": "test_model"}
     )
 
     result = asyncio.run(list_published_agents_impl(tenant_id="tenant1", user_id="user1"))
 
     assert len(result) == 1
-    # User should have READ_ONLY permission (not EDIT)
-    assert result[0]["permission"] == "READ_ONLY"
+    # User should have READ permission (not EDIT)
+    assert result[0]["permission"] == "READ"
 
 
 def test_list_published_agents_impl_model_cache(monkeypatch):
@@ -1738,7 +1690,7 @@ def test_list_published_agents_impl_model_cache(monkeypatch):
         return_value=(True, [])
     )
     agent_service_mock._apply_duplicate_name_availability_rules = MagicMock()
-    agent_service_mock.get_model_by_model_id = MagicMock(
+    model_management_db_mock.get_model_by_model_id = MagicMock(
         return_value={"display_name": "Test Model", "model_name": "test_model"}
     )
 
@@ -1819,7 +1771,7 @@ def test_list_published_agents_impl_is_available_false(monkeypatch):
         return_value=(False, ["model_not_configured"])
     )
     agent_service_mock._apply_duplicate_name_availability_rules = MagicMock()
-    agent_service_mock.get_model_by_model_id = MagicMock(return_value=None)
+    model_management_db_mock.get_model_by_model_id = MagicMock(return_value=None)
 
     result = asyncio.run(list_published_agents_impl(tenant_id="tenant1", user_id="user1"))
 
@@ -1828,7 +1780,8 @@ def test_list_published_agents_impl_is_available_false(monkeypatch):
     assert "model_not_configured" in result[0]["unavailable_reasons"]
 
 
-def test_list_published_agents_impl_exception_handling(monkeypatch):
+@pytest.mark.asyncio
+async def test_list_published_agents_impl_exception_handling(monkeypatch):
     """Test exception handling in list_published_agents_impl"""
     # Mock query_all_agent_info_by_tenant_id to raise an exception
     test_exception = RuntimeError("Database connection failed")
@@ -1843,7 +1796,7 @@ def test_list_published_agents_impl_exception_handling(monkeypatch):
 
     # Verify that the exception is caught and re-raised as ValueError
     with pytest.raises(ValueError, match="Failed to list published agents: Database connection failed"):
-        asyncio.run(list_published_agents_impl(tenant_id="tenant1", user_id="user1"))
+        await list_published_agents_impl(tenant_id="tenant1", user_id="user1")
 
 
 def test_publish_version_impl_with_a2a_new_agent(monkeypatch, mock_agent_draft, mock_tools_draft, mock_relations_draft, mock_skills_draft):
diff --git a/test/backend/services/test_cas_service.py b/test/backend/services/test_cas_service.py
deleted file mode 100644
index 158847e5a..000000000
--- a/test/backend/services/test_cas_service.py
+++ /dev/null
@@ -1,240 +0,0 @@
-import os
-import sys
-import unittest
-from datetime import datetime
-from unittest.mock import MagicMock
-
-test_dir = os.path.dirname(__file__)
-backend_dir = os.path.abspath(os.path.join(test_dir, "../../../backend"))
-sys.path.insert(0, backend_dir)
-
-_MODULES_TO_RESTORE = [
-    "consts",
-    "consts.const",
-    "database.cas_session_db",
-    "database.oauth_account_db",
-    "database.user_tenant_db",
-    "services.oauth_service",
-    "services.skill_service",
-    "services.tool_configuration_service",
-    "utils.auth_utils",
-]
-_ORIGINAL_MODULES = {name: sys.modules.get(name) for name in _MODULES_TO_RESTORE}
-
-consts_mock = MagicMock()
-consts_mock.const = MagicMock()
-consts_mock.const.CAS_CA_BUNDLE = ""
-consts_mock.const.CAS_CALLBACK_BASE_URL = "http://localhost:3000"
-consts_mock.const.CAS_EMAIL_ATTRIBUTE = "mail"
-consts_mock.const.CAS_ENABLED = True
-consts_mock.const.CAS_LOGIN_MODE = "button"
-consts_mock.const.CAS_LOGOUT_URL = ""
-consts_mock.const.CAS_RENEW_BEFORE_SECONDS = 300
-consts_mock.const.CAS_RENEW_TIMEOUT_SECONDS = 10
-consts_mock.const.CAS_ROLE_ATTRIBUTE = "memberOf"
-consts_mock.const.CAS_ROLE_MAP_JSON = '{"cn=admins":"ADMIN"}'
-consts_mock.const.CAS_SERVER_URL = "https://cas.example.com/cas"
-consts_mock.const.CAS_SESSION_MAX_AGE_SECONDS = 3600
-consts_mock.const.CAS_SSL_VERIFY = True
-consts_mock.const.CAS_SYNTHETIC_EMAIL_DOMAIN = "cas.local"
-consts_mock.const.CAS_TENANT_ATTRIBUTE = "tenant"
-consts_mock.const.CAS_USER_ATTRIBUTE = "uid"
-consts_mock.const.CAS_VALIDATE_PATH = "/p3/serviceValidate"
-consts_mock.const.DEFAULT_TENANT_ID = "tenant_id"
-consts_mock.const.LOCAL_SESSION_MAX_AGE_SECONDS = 3600
-sys.modules["consts"] = consts_mock
-sys.modules["consts.const"] = consts_mock.const
-
-sys.modules["database.cas_session_db"] = MagicMock()
-sys.modules["database.oauth_account_db"] = MagicMock()
-sys.modules["database.user_tenant_db"] = MagicMock()
-sys.modules["services.oauth_service"] = MagicMock()
-sys.modules["services.skill_service"] = MagicMock()
-sys.modules["services.tool_configuration_service"] = MagicMock()
-sys.modules["utils.auth_utils"] = MagicMock()
-
-from services.cas_service import (  # noqa: E402
-    CasAuthenticationError,
-    build_login_url,
-    build_logout_url,
-    parse_logout_request,
-    parse_service_validate_response,
-    revoke_from_logout_request,
-)
-
-for _name, _module in _ORIGINAL_MODULES.items():
-    if _module is None:
-        sys.modules.pop(_name, None)
-    else:
-        sys.modules[_name] = _module
-sys.modules.pop("services.cas_service", None)
-
-
-class TestCasServiceParsing(unittest.TestCase):
-    def test_parse_success_response_with_attributes(self):
-        xml = """
-        <cas:serviceResponse xmlns:cas="http://www.yale.edu/tp/cas">
-          <cas:authenticationSuccess>
-            <cas:user>fallback-user</cas:user>
-            <cas:attributes>
-              <cas:uid>cas-user-1</cas:uid>
-              <cas:mail>User@Example.com</cas:mail>
-              <cas:memberOf>cn=admins</cas:memberOf>
-              <cas:tenant>tenant-a</cas:tenant>
-              <cas:SessionIndex>ST-123</cas:SessionIndex>
-              <cas:expiresAt>2026-05-26T10:00:00Z</cas:expiresAt>
-            </cas:attributes>
-          </cas:authenticationSuccess>
-        </cas:serviceResponse>
-        """
-
-        principal = parse_service_validate_response(xml, fallback_session_index="ST-fallback")
-
-        self.assertEqual(principal.cas_user_id, "cas-user-1")
-        self.assertEqual(principal.email, "user@example.com")
-        self.assertEqual(principal.role, "ADMIN")
-        self.assertEqual(principal.tenant_id, "tenant-a")
-        self.assertEqual(principal.session_index, "ST-123")
-        self.assertIsInstance(principal.expires_at, datetime)
-
-    def test_parse_failure_response_raises(self):
-        xml = """
-        <cas:serviceResponse xmlns:cas="http://www.yale.edu/tp/cas">
-          <cas:authenticationFailure code="INVALID_TICKET">bad ticket</cas:authenticationFailure>
-        </cas:serviceResponse>
-        """
-
-        with self.assertRaises(CasAuthenticationError):
-            parse_service_validate_response(xml)
-
-    def test_parse_service_validate_response_rejects_xml_entities(self):
-        xml = """<?xml version="1.0"?>
-        <!DOCTYPE foo [<!ENTITY xxe "expanded-user">]>
-        <cas:serviceResponse xmlns:cas="http://www.yale.edu/tp/cas">
-          <cas:authenticationSuccess>
-            <cas:user>&xxe;</cas:user>
-          </cas:authenticationSuccess>
-        </cas:serviceResponse>
-        """
-
-        with self.assertRaises(CasAuthenticationError):
-            parse_service_validate_response(xml)
-
-    def test_parse_logout_request_supports_user_and_session_index(self):
-        xml = """
-        <samlp:LogoutRequest xmlns:samlp="urn:oasis:names:tc:SAML:2.0:protocol"
-          xmlns:saml="urn:oasis:names:tc:SAML:2.0:assertion">
-          <saml:NameID>cas-user-1</saml:NameID>
-          <samlp:SessionIndex>ST-123</samlp:SessionIndex>
-        </samlp:LogoutRequest>
-        """
-
-        result = parse_logout_request(xml)
-
-        self.assertEqual(result["cas_user_id"], "cas-user-1")
-        self.assertEqual(result["session_index"], "ST-123")
-
-    def test_parse_logout_request_rejects_xml_entities(self):
-        xml = """<?xml version="1.0"?>
-        <!DOCTYPE foo [<!ENTITY xxe "cas-user-1">]>
-        <samlp:LogoutRequest xmlns:samlp="urn:oasis:names:tc:SAML:2.0:protocol"
-          xmlns:saml="urn:oasis:names:tc:SAML:2.0:assertion">
-          <saml:NameID>&xxe;</saml:NameID>
-          <samlp:SessionIndex>ST-123</samlp:SessionIndex>
-        </samlp:LogoutRequest>
-        """
-
-        result = parse_logout_request(xml)
-
-        self.assertEqual(result, {"cas_user_id": "", "session_index": ""})
-
-    def test_revoke_logout_request_falls_back_to_session_index_when_name_id_misses(self):
-        xml = """
-        <samlp:LogoutRequest xmlns:samlp="urn:oasis:names:tc:SAML:2.0:protocol"
-          xmlns:saml="urn:oasis:names:tc:SAML:2.0:assertion">
-          <saml:NameID>different-cas-user</saml:NameID>
-          <samlp:SessionIndex>ST-123</samlp:SessionIndex>
-        </samlp:LogoutRequest>
-        """
-        original_revoke_by_user = revoke_from_logout_request.__globals__["revoke_cas_sessions_by_user_id"]
-        original_revoke_by_index = revoke_from_logout_request.__globals__["revoke_cas_session_by_index"]
-        revoke_by_user = MagicMock(return_value=0)
-        revoke_by_index = MagicMock(return_value=1)
-        revoke_from_logout_request.__globals__["revoke_cas_sessions_by_user_id"] = revoke_by_user
-        revoke_from_logout_request.__globals__["revoke_cas_session_by_index"] = revoke_by_index
-        try:
-            result = revoke_from_logout_request(xml)
-        finally:
-            revoke_from_logout_request.__globals__["revoke_cas_sessions_by_user_id"] = original_revoke_by_user
-            revoke_from_logout_request.__globals__["revoke_cas_session_by_index"] = original_revoke_by_index
-
-        self.assertEqual(result["revoked"], 1)
-        self.assertEqual(result["cas_user_id"], "different-cas-user")
-        self.assertEqual(result["session_index"], "ST-123")
-        revoke_by_user.assert_called_once_with("different-cas-user")
-        revoke_by_index.assert_called_once_with("ST-123")
-
-    def test_build_login_url_includes_service_redirect(self):
-        url = build_login_url("/space")
-
-        self.assertIn("https://cas.example.com/cas/login?", url)
-        self.assertIn("service=http://localhost:3000/api/user/cas/callback?redirect=/space", url)
-
-    def test_build_logout_url_returns_empty_when_logout_url_is_not_configured(self):
-        url = build_logout_url()
-
-        self.assertEqual(url, "")
-
-    def test_build_logout_url_adds_nexent_service_to_configured_bare_logout_url(self):
-        original = build_logout_url.__globals__["CAS_LOGOUT_URL"]
-        build_logout_url.__globals__["CAS_LOGOUT_URL"] = "https://sso.example.com/cas/logout"
-        try:
-            url = build_logout_url()
-        finally:
-            build_logout_url.__globals__["CAS_LOGOUT_URL"] = original
-
-        self.assertEqual(
-            url,
-            "https://sso.example.com/cas/logout?service=http://localhost:3000",
-        )
-
-    def test_build_logout_url_resolves_absolute_path_against_cas_server_url(self):
-        original = build_logout_url.__globals__["CAS_LOGOUT_URL"]
-        build_logout_url.__globals__["CAS_LOGOUT_URL"] = "/logout"
-        try:
-            url = build_logout_url()
-        finally:
-            build_logout_url.__globals__["CAS_LOGOUT_URL"] = original
-
-        self.assertEqual(
-            url,
-            "https://cas.example.com/cas/logout?service=http://localhost:3000",
-        )
-
-    def test_build_logout_url_resolves_relative_path_against_cas_server_url(self):
-        original = build_logout_url.__globals__["CAS_LOGOUT_URL"]
-        build_logout_url.__globals__["CAS_LOGOUT_URL"] = "logout"
-        try:
-            url = build_logout_url()
-        finally:
-            build_logout_url.__globals__["CAS_LOGOUT_URL"] = original
-
-        self.assertEqual(
-            url,
-            "https://cas.example.com/cas/logout?service=http://localhost:3000",
-        )
-
-    def test_build_logout_url_preserves_configured_logout_url_with_query(self):
-        original = build_logout_url.__globals__["CAS_LOGOUT_URL"]
-        configured = "https://sso.example.com/cas/logout?redirect=https%3A%2F%2Fidp.example.com%2Flogin"
-        build_logout_url.__globals__["CAS_LOGOUT_URL"] = configured
-        try:
-            url = build_logout_url()
-        finally:
-            build_logout_url.__globals__["CAS_LOGOUT_URL"] = original
-
-        self.assertEqual(url, configured)
-
-
-if __name__ == "__main__":
-    unittest.main()
diff --git a/test/backend/services/test_data_process_service.py b/test/backend/services/test_data_process_service.py
index f93d54f4c..27ab679d2 100644
--- a/test/backend/services/test_data_process_service.py
+++ b/test/backend/services/test_data_process_service.py
@@ -1595,21 +1595,43 @@ def test_get_data_process_service(self, mock_service_class):
         self.assertEqual(service2, mock_service)
         self.assertEqual(service1, service2)
 
-    @patch('backend.services.data_process_service.submit_process_forward_chain')
+    @patch('backend.services.data_process_service.chain')
+    @patch('backend.services.data_process_service.forward')
+    @patch('backend.services.data_process_service.process')
     @pytest.mark.asyncio
-    async def async_test_create_batch_tasks_impl_success(self, mock_submit_chain):
+    async def async_test_create_batch_tasks_impl_success(self, mock_process, mock_forward, mock_chain):
         """
         Async implementation for testing successful batch task creation.
 
         This test verifies that the service correctly creates batch tasks.
         It ensures that:
         1. Individual tasks are created for each source in the request
-        2. submit_process_forward_chain is called with correct parameters
+        2. The process.s and forward.s signatures are built with correct parameters
         3. Task IDs are collected and returned
         4. All valid source configurations are processed
         """
-        mock_submit_chain.side_effect = ["task_id_1", "task_id_2"]
-
+        # Setup Celery signature mocks
+        process_sig_1 = MagicMock()
+        process_sig_1.set.return_value = process_sig_1
+        process_sig_2 = MagicMock()
+        process_sig_2.set.return_value = process_sig_2
+        forward_sig_1 = MagicMock()
+        forward_sig_1.set.return_value = forward_sig_1
+        forward_sig_2 = MagicMock()
+        forward_sig_2.set.return_value = forward_sig_2
+
+        # process.s returns different sig objects per call
+        mock_process.s.side_effect = [process_sig_1, process_sig_2]
+        mock_forward.s.side_effect = [forward_sig_1, forward_sig_2]
+
+        # chain(...).apply_async() returns result with id
+        chain_inst_1 = MagicMock()
+        chain_inst_1.apply_async.return_value = MagicMock(id="task_id_1")
+        chain_inst_2 = MagicMock()
+        chain_inst_2.apply_async.return_value = MagicMock(id="task_id_2")
+        mock_chain.side_effect = [chain_inst_1, chain_inst_2]
+
+        # Create test request
         from consts.model import BatchTaskRequest
         request = BatchTaskRequest(
             sources=[
@@ -1630,23 +1652,27 @@ async def async_test_create_batch_tasks_impl_success(self, mock_submit_chain):
             ]
         )
 
+        # Create batch tasks
         result = await self.service.create_batch_tasks_impl("Bearer test_token", request)
 
+        # Verify result
         self.assertEqual(len(result), 2)
         self.assertEqual(result[0], "task_id_1")
         self.assertEqual(result[1], "task_id_2")
-        self.assertEqual(mock_submit_chain.call_count, 2)
 
-        expected_calls = [
+        # Verify chain was invoked for each source
+        self.assertEqual(mock_chain.call_count, 2)
+
+        # Verify process.s and forward.s were called with correct params
+        expected_process_calls = [
             {
                 'source': 'http://example.com/doc1.pdf',
                 'source_type': 'url',
                 'chunking_strategy': 'semantic',
                 'index_name': 'test_index_1',
                 'original_filename': 'doc1.pdf',
-                'authorization': 'Bearer test_token',
                 'embedding_model_id': None,
-                'tenant_id': None,
+                'tenant_id': None
             },
             {
                 'source': 'http://example.com/doc2.pdf',
@@ -1654,17 +1680,43 @@ async def async_test_create_batch_tasks_impl_success(self, mock_submit_chain):
                 'chunking_strategy': 'fixed',
                 'index_name': 'test_index_2',
                 'original_filename': 'doc2.pdf',
-                'authorization': 'Bearer test_token',
                 'embedding_model_id': None,
-                'tenant_id': None,
-            },
+                'tenant_id': None
+            }
         ]
-        actual_calls = [kwargs for args, kwargs in mock_submit_chain.call_args_list]
-        self.assertEqual(actual_calls, expected_calls)
+        actual_process_calls = [kwargs for args,
+                                kwargs in mock_process.s.call_args_list]
+        self.assertEqual(actual_process_calls, expected_process_calls)
+        process_sig_1.set.assert_called_once_with(queue='process_q')
+        process_sig_2.set.assert_called_once_with(queue='process_q')
 
-    @patch('backend.services.data_process_service.submit_process_forward_chain')
+        expected_forward_calls = [
+            {
+                'index_name': 'test_index_1',
+                'source': 'http://example.com/doc1.pdf',
+                'source_type': 'url',
+                'original_filename': 'doc1.pdf',
+                'authorization': 'Bearer test_token'
+            },
+            {
+                'index_name': 'test_index_2',
+                'source': 'http://example.com/doc2.pdf',
+                'source_type': 'url',
+                'original_filename': 'doc2.pdf',
+                'authorization': 'Bearer test_token'
+            }
+        ]
+        actual_forward_calls = [kwargs for args,
+                                kwargs in mock_forward.s.call_args_list]
+        self.assertEqual(actual_forward_calls, expected_forward_calls)
+        forward_sig_1.set.assert_called_once_with(queue='forward_q')
+        forward_sig_2.set.assert_called_once_with(queue='forward_q')
+
+    @patch('backend.services.data_process_service.chain')
+    @patch('backend.services.data_process_service.forward')
+    @patch('backend.services.data_process_service.process')
     @pytest.mark.asyncio
-    async def async_test_create_batch_tasks_impl_missing_source(self, mock_submit_chain):
+    async def async_test_create_batch_tasks_impl_missing_source(self, mock_process, mock_forward, mock_chain):
         """
         Async implementation for testing batch task creation with missing source field.
 
@@ -1675,8 +1727,18 @@ async def async_test_create_batch_tasks_impl_missing_source(self, mock_submit_ch
         3. Only valid source configurations are processed
         4. The method continues processing other sources
         """
-        mock_submit_chain.return_value = "task_id_1"
-
+        # Setup signature mocks
+        process_sig = MagicMock()
+        process_sig.set.return_value = process_sig
+        forward_sig = MagicMock()
+        forward_sig.set.return_value = forward_sig
+        mock_process.s.return_value = process_sig
+        mock_forward.s.return_value = forward_sig
+        chain_inst = MagicMock()
+        chain_inst.apply_async.return_value = MagicMock(id="task_id_1")
+        mock_chain.return_value = chain_inst
+
+        # Create test request with missing source
         from consts.model import BatchTaskRequest
         request = BatchTaskRequest(
             sources=[
@@ -1697,19 +1759,27 @@ async def async_test_create_batch_tasks_impl_missing_source(self, mock_submit_ch
             ]
         )
 
+        # Create batch tasks
         result = await self.service.create_batch_tasks_impl("Bearer test_token", request)
 
+        # Verify result - only one task should be created
         self.assertEqual(len(result), 1)
         self.assertEqual(result[0], "task_id_1")
-        mock_submit_chain.assert_called_once()
+
+        # Verify chain called once with built signatures
+        mock_chain.assert_called_once()
+        mock_process.s.assert_called_once()
+        mock_forward.s.assert_called_once()
         self.assertEqual(
-            mock_submit_chain.call_args[1]['source'], 'http://example.com/doc2.pdf')
+            mock_process.s.call_args[1]['source'], 'http://example.com/doc2.pdf')
         self.assertEqual(
-            mock_submit_chain.call_args[1]['index_name'], 'test_index_2')
+            mock_process.s.call_args[1]['index_name'], 'test_index_2')
 
-    @patch('backend.services.data_process_service.submit_process_forward_chain')
+    @patch('backend.services.data_process_service.chain')
+    @patch('backend.services.data_process_service.forward')
+    @patch('backend.services.data_process_service.process')
     @pytest.mark.asyncio
-    async def async_test_create_batch_tasks_impl_missing_index_name(self, mock_submit_chain):
+    async def async_test_create_batch_tasks_impl_missing_index_name(self, mock_process, mock_forward, mock_chain):
         """
         Async implementation for testing batch task creation with missing index_name field.
 
@@ -1720,8 +1790,18 @@ async def async_test_create_batch_tasks_impl_missing_index_name(self, mock_submi
         3. Only valid source configurations are processed
         4. The method continues processing other sources
         """
-        mock_submit_chain.return_value = "task_id_1"
-
+        # Setup signature mocks
+        process_sig = MagicMock()
+        process_sig.set.return_value = process_sig
+        forward_sig = MagicMock()
+        forward_sig.set.return_value = forward_sig
+        mock_process.s.return_value = process_sig
+        mock_forward.s.return_value = forward_sig
+        chain_inst = MagicMock()
+        chain_inst.apply_async.return_value = MagicMock(id="task_id_1")
+        mock_chain.return_value = chain_inst
+
+        # Create test request with missing index_name
         from consts.model import BatchTaskRequest
         request = BatchTaskRequest(
             sources=[
@@ -1742,19 +1822,27 @@ async def async_test_create_batch_tasks_impl_missing_index_name(self, mock_submi
             ]
         )
 
+        # Create batch tasks
         result = await self.service.create_batch_tasks_impl("Bearer test_token", request)
 
+        # Verify result - only one task should be created
         self.assertEqual(len(result), 1)
         self.assertEqual(result[0], "task_id_1")
-        mock_submit_chain.assert_called_once()
+
+        # Verify chain called once with built signatures
+        mock_chain.assert_called_once()
+        mock_process.s.assert_called_once()
+        mock_forward.s.assert_called_once()
         self.assertEqual(
-            mock_submit_chain.call_args[1]['source'], 'http://example.com/doc2.pdf')
+            mock_process.s.call_args[1]['source'], 'http://example.com/doc2.pdf')
         self.assertEqual(
-            mock_submit_chain.call_args[1]['index_name'], 'test_index_2')
+            mock_process.s.call_args[1]['index_name'], 'test_index_2')
 
-    @patch('backend.services.data_process_service.submit_process_forward_chain')
+    @patch('backend.services.data_process_service.chain')
+    @patch('backend.services.data_process_service.forward')
+    @patch('backend.services.data_process_service.process')
     @pytest.mark.asyncio
-    async def async_test_create_batch_tasks_impl_missing_both_required_fields(self, mock_submit_chain):
+    async def async_test_create_batch_tasks_impl_missing_both_required_fields(self, mock_process, mock_forward, mock_chain):
         """
         Async implementation for testing batch task creation with both required fields missing.
 
@@ -1765,6 +1853,7 @@ async def async_test_create_batch_tasks_impl_missing_both_required_fields(self,
         3. No tasks are created when all sources are invalid
         4. The method returns an empty list
         """
+        # Create test request with all sources missing required fields
         from consts.model import BatchTaskRequest
         request = BatchTaskRequest(
             sources=[
@@ -1783,14 +1872,22 @@ async def async_test_create_batch_tasks_impl_missing_both_required_fields(self,
             ]
         )
 
+        # Create batch tasks
         result = await self.service.create_batch_tasks_impl("Bearer test_token", request)
 
+        # Verify result - no tasks should be created
         self.assertEqual(len(result), 0)
-        mock_submit_chain.assert_not_called()
 
-    @patch('backend.services.data_process_service.submit_process_forward_chain')
+        # Verify no chain created
+        mock_chain.assert_not_called()
+        mock_process.s.assert_not_called()
+        mock_forward.s.assert_not_called()
+
+    @patch('backend.services.data_process_service.chain')
+    @patch('backend.services.data_process_service.forward')
+    @patch('backend.services.data_process_service.process')
     @pytest.mark.asyncio
-    async def async_test_create_batch_tasks_impl_empty_sources(self, mock_submit_chain):
+    async def async_test_create_batch_tasks_impl_empty_sources(self, mock_process, mock_forward, mock_chain):
         """
         Async implementation for testing batch task creation with empty sources list.
 
@@ -1800,17 +1897,26 @@ async def async_test_create_batch_tasks_impl_empty_sources(self, mock_submit_cha
         2. The method returns an empty list
         3. No errors occur during processing
         """
+        # Create test request with empty sources
         from consts.model import BatchTaskRequest
         request = BatchTaskRequest(sources=[])
 
+        # Create batch tasks
         result = await self.service.create_batch_tasks_impl("Bearer test_token", request)
 
+        # Verify result - no tasks should be created
         self.assertEqual(len(result), 0)
-        mock_submit_chain.assert_not_called()
 
-    @patch('backend.services.data_process_service.submit_process_forward_chain')
+        # Verify no chain created
+        mock_chain.assert_not_called()
+        mock_process.s.assert_not_called()
+        mock_forward.s.assert_not_called()
+
+    @patch('backend.services.data_process_service.chain')
+    @patch('backend.services.data_process_service.forward')
+    @patch('backend.services.data_process_service.process')
     @pytest.mark.asyncio
-    async def async_test_create_batch_tasks_impl_optional_fields(self, mock_submit_chain):
+    async def async_test_create_batch_tasks_impl_optional_fields(self, mock_process, mock_forward, mock_chain):
         """
         Async implementation for testing batch task creation with optional fields.
 
@@ -1820,8 +1926,18 @@ async def async_test_create_batch_tasks_impl_optional_fields(self, mock_submit_c
         2. Optional fields are passed as None when not provided
         3. The method processes all valid sources regardless of optional field presence
         """
-        mock_submit_chain.return_value = "task_id_1"
-
+        # Setup signature mocks
+        process_sig = MagicMock()
+        process_sig.set.return_value = process_sig
+        forward_sig = MagicMock()
+        forward_sig.set.return_value = forward_sig
+        mock_process.s.return_value = process_sig
+        mock_forward.s.return_value = forward_sig
+        chain_inst = MagicMock()
+        chain_inst.apply_async.return_value = MagicMock(id="task_id_1")
+        mock_chain.return_value = chain_inst
+
+        # Create test request with minimal required fields only
         from consts.model import BatchTaskRequest
         request = BatchTaskRequest(
             sources=[
@@ -1833,22 +1949,31 @@ async def async_test_create_batch_tasks_impl_optional_fields(self, mock_submit_c
             ]
         )
 
+        # Create batch tasks
         result = await self.service.create_batch_tasks_impl("Bearer test_token", request)
 
+        # Verify result
         self.assertEqual(len(result), 1)
         self.assertEqual(result[0], "task_id_1")
-        mock_submit_chain.assert_called_once()
-        kwargs = mock_submit_chain.call_args[1]
-        self.assertEqual(kwargs['source'], 'http://example.com/doc1.pdf')
-        self.assertEqual(kwargs['index_name'], 'test_index_1')
-        self.assertIsNone(kwargs['source_type'])
-        self.assertIsNone(kwargs['chunking_strategy'])
-        self.assertIsNone(kwargs['original_filename'])
-        self.assertEqual(kwargs['authorization'], 'Bearer test_token')
-
-    @patch('backend.services.data_process_service.submit_process_forward_chain')
+
+        # Verify signatures built with None optional fields for process, and authorization on forward
+        mock_process.s.assert_called_once()
+        proc_kwargs = mock_process.s.call_args[1]
+        self.assertEqual(proc_kwargs['source'], 'http://example.com/doc1.pdf')
+        self.assertEqual(proc_kwargs['index_name'], 'test_index_1')
+        self.assertIsNone(proc_kwargs['source_type'])
+        self.assertIsNone(proc_kwargs['chunking_strategy'])
+        self.assertIsNone(proc_kwargs['original_filename'])
+
+        mock_forward.s.assert_called_once()
+        fwd_kwargs = mock_forward.s.call_args[1]
+        self.assertEqual(fwd_kwargs['authorization'], 'Bearer test_token')
+
+    @patch('backend.services.data_process_service.chain')
+    @patch('backend.services.data_process_service.forward')
+    @patch('backend.services.data_process_service.process')
     @pytest.mark.asyncio
-    async def async_test_create_batch_tasks_impl_no_authorization(self, mock_submit_chain):
+    async def async_test_create_batch_tasks_impl_no_authorization(self, mock_process, mock_forward, mock_chain):
         """
         Async implementation for testing batch task creation without authorization.
 
@@ -1858,8 +1983,18 @@ async def async_test_create_batch_tasks_impl_no_authorization(self, mock_submit_
         2. None is passed as authorization parameter
         3. The method processes all valid sources
         """
-        mock_submit_chain.return_value = "task_id_1"
-
+        # Setup signature mocks
+        process_sig = MagicMock()
+        process_sig.set.return_value = process_sig
+        forward_sig = MagicMock()
+        forward_sig.set.return_value = forward_sig
+        mock_process.s.return_value = process_sig
+        mock_forward.s.return_value = forward_sig
+        chain_inst = MagicMock()
+        chain_inst.apply_async.return_value = MagicMock(id="task_id_1")
+        mock_chain.return_value = chain_inst
+
+        # Create test request
         from consts.model import BatchTaskRequest
         request = BatchTaskRequest(
             sources=[
@@ -1873,15 +2008,19 @@ async def async_test_create_batch_tasks_impl_no_authorization(self, mock_submit_
             ]
         )
 
+        # Create batch tasks without authorization
         result = await self.service.create_batch_tasks_impl(None, request)
 
+        # Verify result
         self.assertEqual(len(result), 1)
         self.assertEqual(result[0], "task_id_1")
-        mock_submit_chain.assert_called_once()
-        kwargs = mock_submit_chain.call_args[1]
-        self.assertEqual(kwargs['source'], 'http://example.com/doc1.pdf')
-        self.assertEqual(kwargs['index_name'], 'test_index_1')
-        self.assertIsNone(kwargs['authorization'])
+
+        # Verify forward.s called with None authorization
+        mock_forward.s.assert_called_once()
+        fwd_kwargs = mock_forward.s.call_args[1]
+        self.assertEqual(fwd_kwargs['source'], 'http://example.com/doc1.pdf')
+        self.assertEqual(fwd_kwargs['index_name'], 'test_index_1')
+        self.assertIsNone(fwd_kwargs['authorization'])
 
     def test_create_batch_tasks_impl(self):
         """
@@ -1918,14 +2057,11 @@ async def async_test_process_uploaded_text_file(self, mock_data_process_core):
         """
         # Arrange: mock DataProcessCore.file_process to return mixed chunks
         mock_instance = MagicMock()
-        mock_instance.file_process.return_value = (
-            [
-                {"content": "First chunk"},
-                {"no_content": True},
-                {"content": "Second chunk"},
-            ],
-            []  # images_info
-        )
+        mock_instance.file_process.return_value = [
+            {"content": "First chunk"},
+            {"no_content": True},
+            {"content": "Second chunk"},
+        ]
         mock_data_process_core.return_value = mock_instance
 
         filename = "test.txt"
diff --git a/test/backend/services/test_mcp_service.py b/test/backend/services/test_mcp_service.py
index 280e96954..f5443bac7 100644
--- a/test/backend/services/test_mcp_service.py
+++ b/test/backend/services/test_mcp_service.py
@@ -432,10 +432,6 @@ def test_mixed_special_chars(self):
 class TestRegisterOpenapiService:
     """Test register_openapi_service function"""
 
-    @staticmethod
-    def _headers_template():
-        return {}
-
     def test_register_service_success(self):
         """Test successful OpenAPI service registration"""
         service_name = "test_service"
@@ -446,12 +442,7 @@ def test_register_service_success(self):
         }
         server_url = "https://api.example.com"
 
-        result = mcp_service.register_openapi_service(
-            service_name,
-            openapi_json,
-            server_url,
-            self._headers_template()
-        )
+        result = mcp_service.register_openapi_service(service_name, openapi_json, server_url)
 
         assert result is True
         assert service_name in mcp_service._openapi_mcp_services
@@ -459,12 +450,12 @@ def test_register_service_success(self):
 
     def test_register_service_empty_name(self):
         """Test registration with empty service name"""
-        result = mcp_service.register_openapi_service("", {}, "https://api.example.com", self._headers_template())
+        result = mcp_service.register_openapi_service("", {}, "https://api.example.com")
         assert result is False
 
     def test_register_service_none_name(self):
         """Test registration with None service name"""
-        result = mcp_service.register_openapi_service(None, {}, "https://api.example.com", self._headers_template())
+        result = mcp_service.register_openapi_service(None, {}, "https://api.example.com")
         assert result is False
 
     def test_register_duplicate_service(self):
@@ -473,21 +464,11 @@ def test_register_duplicate_service(self):
         openapi_json = {"openapi": "3.0.0", "info": {}, "paths": {}}
 
         # First registration
-        result1 = mcp_service.register_openapi_service(
-            service_name,
-            openapi_json,
-            "https://api.example.com",
-            self._headers_template()
-        )
+        result1 = mcp_service.register_openapi_service(service_name, openapi_json, "https://api.example.com")
         assert result1 is True
 
         # Second registration should fail
-        result2 = mcp_service.register_openapi_service(
-            service_name,
-            openapi_json,
-            "https://api.example.com",
-            self._headers_template()
-        )
+        result2 = mcp_service.register_openapi_service(service_name, openapi_json, "https://api.example.com")
         assert result2 is False
 
     def test_register_service_without_server_url(self):
@@ -495,7 +476,7 @@ def test_register_service_without_server_url(self):
         service_name = "no_url_service"
         openapi_json = {"openapi": "3.0.0", "info": {}, "paths": {}}
 
-        result = mcp_service.register_openapi_service(service_name, openapi_json, "", self._headers_template())
+        result = mcp_service.register_openapi_service(service_name, openapi_json, "")
 
         assert result is True
 
@@ -506,46 +487,12 @@ def test_register_service_copies_openapi_spec(self):
 
         original_json = openapi_json.copy()
 
-        mcp_service.register_openapi_service(
-            service_name,
-            openapi_json,
-            "https://api.example.com",
-            self._headers_template()
-        )
+        mcp_service.register_openapi_service(service_name, openapi_json, "https://api.example.com")
 
         # Verify original was not modified
         assert openapi_json == original_json
         assert "servers" not in openapi_json
 
-    @patch.object(mcp_service, 'FastMCP')
-    @patch.object(mcp_service.httpx, 'AsyncClient')
-    def test_register_service_passes_headers_template_to_async_client(
-        self, mock_async_client, mock_fastmcp
-    ):
-        """Test registration passes headers_template to HTTP client."""
-        mock_client = MagicMock()
-        mock_async_client.return_value = mock_client
-        mock_fastmcp.from_openapi.return_value = MagicMock()
-        headers_template = {
-            "Authorization": "Bearer {{token}}",
-            "X-Tenant-ID": "{{tenant_id}}"
-        }
-
-        result = mcp_service.register_openapi_service(
-            "headers_service",
-            {"openapi": "3.0.0", "info": {}, "paths": {}},
-            "https://api.example.com",
-            headers_template
-        )
-
-        assert result is True
-        mock_async_client.assert_called_once_with(
-            base_url="https://api.example.com",
-            timeout=120.0,
-            headers=headers_template
-        )
-        mock_fastmcp.from_openapi.assert_called_once()
-
     @patch.object(mcp_service, 'FastMCP')
     def test_register_service_from_openapi_failure(self, mock_fastmcp):
         """Test handling of FastMCP.from_openapi failure"""
@@ -554,8 +501,7 @@ def test_register_service_from_openapi_failure(self, mock_fastmcp):
         result = mcp_service.register_openapi_service(
             "fail_service",
             {"openapi": "3.0.0", "info": {}, "paths": {}},
-            "https://api.example.com",
-            self._headers_template()
+            "https://api.example.com"
         )
 
         assert result is False
@@ -569,8 +515,7 @@ def test_register_service_returns_none(self, mock_fastmcp):
         result = mcp_service.register_openapi_service(
             "none_service",
             {"openapi": "3.0.0", "info": {}, "paths": {}},
-            "https://api.example.com",
-            self._headers_template()
+            "https://api.example.com"
         )
 
         assert result is False
@@ -707,38 +652,6 @@ def test_refresh_clears_existing_services(self):
         assert "old_service" not in mcp_service._openapi_mcp_services
         assert "new_service" in mcp_service._openapi_mcp_services
 
-    @patch.object(mcp_service, 'register_openapi_service')
-    def test_refresh_passes_headers_template_to_register(self, mock_register):
-        """Test refresh passes headers_template to register_openapi_service."""
-        services_data = [
-            {
-                "mcp_service_name": "api_service_1",
-                "openapi_json": {"openapi": "3.0.0", "info": {}, "paths": {}},
-                "server_url": "https://api1.example.com",
-                "headers_template": {
-                    "Authorization": "Bearer {{token}}",
-                    "X-Tenant-ID": "{{tenant_id}}"
-                }
-            }
-        ]
-        mcp_service.query_available_openapi_services.return_value = services_data
-        mock_register.return_value = True
-
-        result = mcp_service.refresh_openapi_services_by_tenant("tenant1")
-
-        assert result["registered"] == 1
-        assert result["skipped"] == 0
-        assert result["total"] == 1
-        mock_register.assert_called_once_with(
-            "api_service_1",
-            {"openapi": "3.0.0", "info": {}, "paths": {}},
-            "https://api1.example.com",
-            {
-                "Authorization": "Bearer {{token}}",
-                "X-Tenant-ID": "{{tenant_id}}"
-            }
-        )
-
     def test_refresh_remounts_local_service(self):
         """Test that refresh re-mounts local MCP service"""
         mcp_service.query_available_openapi_services.return_value = []
@@ -759,21 +672,13 @@ def test_refresh_remounts_local_service(self):
 class TestRefreshSingleOpenapiService:
     """Test refresh_single_openapi_service function"""
 
-    @staticmethod
-    def _headers_template():
-        return {
-            "Authorization": "Bearer {{token}}",
-            "X-Tenant-ID": "{{tenant_id}}"
-        }
-
     def test_refresh_existing_service(self):
         """Test refreshing an existing service"""
         services_data = [
             {
                 "mcp_service_name": "target_service",
                 "openapi_json": {"openapi": "3.0.0", "info": {}, "paths": {}},
-                "server_url": "https://api.example.com",
-                "headers_template": self._headers_template()
+                "server_url": "https://api.example.com"
             }
         ]
         mcp_service.query_available_openapi_services.return_value = services_data
@@ -832,8 +737,7 @@ def test_refresh_removes_old_instance(self):
             {
                 "mcp_service_name": "old_service",
                 "openapi_json": {"openapi": "3.0.0", "info": {}, "paths": {}},
-                "server_url": "https://api.example.com",
-                "headers_template": self._headers_template()
+                "server_url": "https://api.example.com"
             }
         ]
         mcp_service.query_available_openapi_services.return_value = services_data
@@ -842,30 +746,6 @@ def test_refresh_removes_old_instance(self):
 
         assert result["status"] == "refreshed"
 
-    @patch.object(mcp_service, 'register_openapi_service')
-    def test_refresh_existing_service_passes_headers_template(self, mock_register):
-        """Test refreshing a service passes headers_template to register_openapi_service."""
-        services_data = [
-            {
-                "mcp_service_name": "target_service",
-                "openapi_json": {"openapi": "3.0.0", "info": {}, "paths": {}},
-                "server_url": "https://api.example.com",
-                "headers_template": self._headers_template()
-            }
-        ]
-        mcp_service.query_available_openapi_services.return_value = services_data
-        mock_register.return_value = True
-
-        result = mcp_service.refresh_single_openapi_service("target_service", "tenant1")
-
-        assert result["status"] == "refreshed"
-        mock_register.assert_called_once_with(
-            "target_service",
-            {"openapi": "3.0.0", "info": {}, "paths": {}},
-            "https://api.example.com",
-            self._headers_template()
-        )
-
     def test_refresh_deleted_service_removes_from_mounted_servers(self):
         """Test that deleting a service removes it from mounted_servers"""
         service_name = "mounted_delete_test"
@@ -954,13 +834,14 @@ def test_app_creates_once(self):
     def test_app_has_routes(self):
         """Test that app has expected routes"""
         app = mcp_service.get_mcp_management_app()
-        paths = app.openapi()["paths"]
 
-        assert "/tools/outer_api/refresh" in paths
-        assert "/tools/openapi_service/refresh" in paths
-        assert "/tools/openapi_service" in paths
-        assert "/tools/openapi_service/{service_name}/refresh" in paths
-        assert "/tools/outer_api" in paths
+        routes = [route.path for route in app.routes]
+
+        assert "/tools/outer_api/refresh" in routes
+        assert "/tools/openapi_service/refresh" in routes
+        assert "/tools/openapi_service" in routes
+        assert "/tools/openapi_service/{service_name}/refresh" in routes
+        assert "/tools/outer_api" in routes
 
 
 # ---------------------------------------------------------------------------
@@ -1125,11 +1006,7 @@ async def test_refresh_single_service_success(self):
             {
                 "mcp_service_name": "target_service",
                 "openapi_json": {"openapi": "3.0.0", "info": {}, "paths": {}},
-                "server_url": "https://api.example.com",
-                "headers_template": {
-                    "Authorization": "Bearer {{token}}",
-                    "X-Tenant-ID": "{{tenant_id}}"
-                }
+                "server_url": "https://api.example.com"
             }
         ]
 
diff --git a/test/backend/services/test_northbound_service.py b/test/backend/services/test_northbound_service.py
index e98fc4ca1..0d658e198 100644
--- a/test/backend/services/test_northbound_service.py
+++ b/test/backend/services/test_northbound_service.py
@@ -1,148 +1,93 @@
-"""
-Tests for backend.services.northbound_service module.
-
-This module tests the northbound-facing service layer functions including:
-- Streaming chat (start/stop)
-- Conversation management (list, history, title update)
-- Agent info listing
-- Rate limiting and idempotency
-"""
 import sys
 import os
-import types
-from unittest.mock import MagicMock, AsyncMock, patch
+sys.path.insert(0, os.path.join(os.path.dirname(__file__), "../../.."))
 
 import pytest
+from unittest.mock import MagicMock, AsyncMock, patch
 
-# Add project root to path
-sys.path.insert(0, os.path.join(os.path.dirname(__file__), "../../.."))
-
-# =============================================================================
-# Mock all required modules BEFORE importing northbound_service
-# =============================================================================
 
-# Mock consts.exceptions
+# First mock the consts module to avoid ModuleNotFoundError
+consts_mock = MagicMock()
+consts_mock.const = MagicMock()
+consts_mock.const.MINIO_ENDPOINT = "http://localhost:9000"
+consts_mock.const.MINIO_ACCESS_KEY = "test_access_key"
+consts_mock.const.MINIO_SECRET_KEY = "test_secret_key"
+consts_mock.const.MINIO_REGION = "us-east-1"
+consts_mock.const.MINIO_DEFAULT_BUCKET = "test-bucket"
+consts_mock.const.POSTGRES_HOST = "localhost"
+consts_mock.const.POSTGRES_USER = "test_user"
+consts_mock.const.NEXENT_POSTGRES_PASSWORD = "test_password"
+consts_mock.const.POSTGRES_DB = "test_db"
+consts_mock.const.POSTGRES_PORT = 5432
+consts_mock.const.DEFAULT_TENANT_ID = "default_tenant"
+
+sys.modules['consts'] = consts_mock
+sys.modules['consts.const'] = consts_mock.const
+
+# Mock exceptions module
 class LimitExceededError(Exception):
     pass
 
 class UnauthorizedError(Exception):
     pass
 
-class ConversationNotFoundError(Exception):
-    pass
-
-consts_exceptions_mod = types.ModuleType("consts.exceptions")
-consts_exceptions_mod.LimitExceededError = LimitExceededError
-consts_exceptions_mod.UnauthorizedError = UnauthorizedError
-consts_exceptions_mod.ConversationNotFoundError = ConversationNotFoundError
-sys.modules["consts.exceptions"] = consts_exceptions_mod
-sys.modules["backend.consts.exceptions"] = consts_exceptions_mod
-
-# Mock consts.const
-consts_const_mod = types.ModuleType("consts.const")
-consts_const_mod.ASSET_OWNER_TENANT_ID = "asset-owner-tenant"
-sys.modules["consts.const"] = consts_const_mod
-
-# Mock consts package
-consts_package = types.ModuleType("consts")
-consts_package.exceptions = consts_exceptions_mod
-consts_package.const = consts_const_mod
-sys.modules["consts"] = consts_package
-
-# Mock database modules
-db_client_mod = types.ModuleType("database.client")
-db_client_mod.get_db_session = MagicMock()
-db_client_mod.as_dict = MagicMock()
-sys.modules["database.client"] = db_client_mod
-sys.modules["backend.database.client"] = db_client_mod
-
-db_package = types.ModuleType("database")
-db_package.client = db_client_mod
-sys.modules["database"] = db_package
-
-# Mock token_db
-token_db_mod = types.ModuleType("database.token_db")
-token_db_mod.log_token_usage = MagicMock(return_value=1)
-token_db_mod.get_latest_usage_metadata = MagicMock(return_value={"query": "test"})
-sys.modules["database.token_db"] = token_db_mod
-
-# Mock conversation_db
-conversation_db_mod = types.ModuleType("database.conversation_db")
-conversation_db_mod.get_conversation_messages = MagicMock(return_value=[
+exceptions_mock = MagicMock()
+exceptions_mock.LimitExceededError = LimitExceededError
+exceptions_mock.UnauthorizedError = UnauthorizedError
+sys.modules['consts.exceptions'] = exceptions_mock
+sys.modules['backend.consts.exceptions'] = exceptions_mock
+
+# Mock database client
+client_mock = MagicMock()
+client_mock.MinioClient = MagicMock()
+client_mock.get_db_session = MagicMock()
+sys.modules['database.client'] = client_mock
+sys.modules['backend.database.client'] = client_mock
+
+# Mock token_db module
+token_db_mock = MagicMock()
+token_db_mock.log_token_usage = MagicMock(return_value=1)
+token_db_mock.get_latest_usage_metadata = MagicMock(return_value={"query": "test"})
+sys.modules['database.token_db'] = token_db_mock
+sys.modules['backend.database.token_db'] = token_db_mock
+
+# Mock conversation_db module
+conversation_db_mock = MagicMock()
+conversation_db_mock.get_conversation_messages = MagicMock(return_value=[
     {"message_role": "user", "message_content": "Hello"}
 ])
-conversation_db_mod.get_source_searches_by_message = MagicMock(return_value=[])
-sys.modules["database.conversation_db"] = conversation_db_mod
-
-# Mock attachment_db
-attachment_db_mod = types.ModuleType("database.attachment_db")
-attachment_db_mod.build_s3_url = MagicMock(return_value="s3://bucket/file")
-attachment_db_mod.get_file_url = MagicMock(return_value={"success": True, "url": "https://proxy.example/file"})
-attachment_db_mod.get_file_size_from_minio = MagicMock(return_value=0)
-attachment_db_mod._build_mcp_presigned_url = MagicMock(side_effect=lambda url: url)
-sys.modules["database.attachment_db"] = attachment_db_mod
-
-# Mock nexent.multi_modal.utils
-nexent_utils_mod = types.ModuleType("nexent.multi_modal.utils")
-nexent_utils_mod.parse_s3_url = MagicMock(return_value=("bucket", "path/file.txt"))
-sys.modules["nexent"] = types.ModuleType("nexent")
-sys.modules["nexent.multi_modal"] = types.ModuleType("nexent.multi_modal")
-sys.modules["nexent.multi_modal.utils"] = nexent_utils_mod
-
-# Mock services modules
-services_package = types.ModuleType("services")
-
-# Mock agent_service
-agent_service_mod = types.ModuleType("services.agent_service")
-agent_service_mod.run_agent_stream = AsyncMock()
-agent_service_mod.stop_agent_tasks = MagicMock(return_value={"message": "stopped"})
-agent_service_mod.get_agent_id_by_name = AsyncMock(return_value=1)
-sys.modules["services.agent_service"] = agent_service_mod
-
-# Mock conversation_management_service
-conv_mgmt_mod = types.ModuleType("services.conversation_management_service")
-conv_mgmt_mod.save_conversation_user = MagicMock()
-conv_mgmt_mod.get_conversation_list_service = MagicMock(return_value=[
+sys.modules['database.conversation_db'] = conversation_db_mock
+sys.modules['backend.database.conversation_db'] = conversation_db_mock
+
+# Mock agent_service module
+agent_service_mock = MagicMock()
+agent_service_mock.run_agent_stream = AsyncMock()
+agent_service_mock.stop_agent_tasks = MagicMock(return_value={"message": "stopped"})
+agent_service_mock.list_all_agent_info_impl = AsyncMock(return_value=[{"agent_id": 1, "name": "test_agent"}])
+agent_service_mock.get_agent_id_by_name = AsyncMock(return_value=1)
+sys.modules['services.agent_service'] = agent_service_mock
+sys.modules['backend.services.agent_service'] = agent_service_mock
+
+# Mock conversation_management_service module
+conv_mgmt_mock = MagicMock()
+conv_mgmt_mock.save_conversation_user = MagicMock()
+conv_mgmt_mock.get_conversation_list_service = MagicMock(return_value=[
     {"conversation_id": "1", "title": "Test"}
 ])
-conv_mgmt_mod.create_new_conversation = MagicMock(return_value={"conversation_id": 123})
-conv_mgmt_mod.update_conversation_title = MagicMock()
-sys.modules["services.conversation_management_service"] = conv_mgmt_mod
-
-# Mock agent_version_service
-agent_version_mod = types.ModuleType("services.agent_version_service")
-agent_version_mod.list_published_agents_impl = AsyncMock(return_value=[
-    {"agent_id": 1, "name": "test_agent", "description": "Test agent"}
-])
-sys.modules["services.agent_version_service"] = agent_version_mod
-
-# Mock file_management_service
-file_mgmt_mod = types.ModuleType("services.file_management_service")
-file_mgmt_mod.upload_to_minio = AsyncMock(return_value=[])
-file_mgmt_mod.resolve_minio_upload_folder = MagicMock(return_value="attachments/user")
-file_mgmt_mod.validate_urls_access = MagicMock()
-sys.modules["services.file_management_service"] = file_mgmt_mod
-
-# Add to services package
-services_package.agent_service = agent_service_mod
-services_package.agent_version_service = agent_version_mod
-services_package.conversation_management_service = conv_mgmt_mod
-services_package.file_management_service = file_mgmt_mod
-sys.modules["services"] = services_package
-
-# Mock consts.model - create stub classes
-class AgentRequestStub:
-    def __init__(self, **kwargs):
-        for k, v in kwargs.items():
-            setattr(self, k, v)
-
-class ToolParamsRequestStub:
-    pass
+conv_mgmt_mock.create_new_conversation = MagicMock(return_value={"conversation_id": 123})
+conv_mgmt_mock.update_conversation_title_service = MagicMock()
+sys.modules['services.conversation_management_service'] = conv_mgmt_mock
+sys.modules['backend.services.conversation_management_service'] = conv_mgmt_mock
 
-consts_model_mod = types.ModuleType("consts.model")
-consts_model_mod.AgentRequest = AgentRequestStub
-consts_model_mod.ToolParamsRequest = ToolParamsRequestStub
-sys.modules["consts.model"] = consts_model_mod
+# Mock consts.model
+consts_model_mock = MagicMock()
+AgentRequest_mock = MagicMock()
+consts_model_mock.AgentRequest = AgentRequest_mock
+sys.modules['consts.model'] = consts_model_mock
+
+# Mock database.db_models
+db_models_mock = MagicMock()
+sys.modules['database.db_models'] = db_models_mock
 
 # Now import the module under test
 from backend.services import northbound_service as ns
@@ -162,12 +107,13 @@ def __init__(self, request_id="req-123", tenant_id="tenant-1", user_id="user-1",
 @pytest.fixture(autouse=True)
 def reset_test_isolation():
     """Reset test isolation state before each test."""
+    # Clear idempotency state
     ns._IDEMPOTENCY_RUNNING.clear()
-    ns._RATE_STATE.clear()
-    token_db_mod.log_token_usage.reset_mock()
+    # Reset mock call counts
+    token_db_mock.log_token_usage.reset_mock()
     yield
+    # Cleanup after test
     ns._IDEMPOTENCY_RUNNING.clear()
-    ns._RATE_STATE.clear()
 
 
 class TestNorthboundContext:
@@ -203,155 +149,23 @@ def test_build_idempotency_key_normal(self):
         key = ns._build_idempotency_key("tenant1", "123", "agent1", "query")
         assert "tenant1" in key
         assert "123" in key
-        assert key.count(":") == 3
 
     def test_build_idempotency_key_with_none(self):
-        """Test with None values are converted to empty string."""
+        """Test with None values."""
         key = ns._build_idempotency_key("tenant1", None, "query")
         assert "tenant1" in key
+        # None values are converted to empty string
         assert "None" not in key
+        # Should contain the empty string from None conversion
+        assert "tenant1::" in key or ":query" in key
 
-    def test_build_idempotency_key_long_string_hashed(self):
+    def test_build_idempotency_key_long_string(self):
         """Test with long string gets hashed."""
         long_string = "a" * 100
         key = ns._build_idempotency_key(long_string)
+        # Should be hashed (not the full string)
         assert len(key) < 100
 
-    def test_build_idempotency_key_mixed_long_short(self):
-        """Test with mixed long and short values."""
-        long_val = "x" * 100
-        key = ns._build_idempotency_key("short", long_val, "another_short")
-        assert len(key) < 200
-
-    def test_build_idempotency_key_empty(self):
-        """Test with all empty values."""
-        key = ns._build_idempotency_key()
-        assert key == ""
-
-    def test_build_idempotency_key_single_value(self):
-        """Test with single value."""
-        key = ns._build_idempotency_key("only")
-        assert key == "only"
-
-
-class TestBuildTitleUpdateIdempotencyKey:
-    """Tests for _build_title_update_idempotency_key function."""
-
-    def test_title_update_key_format(self):
-        """Test that title is hashed in the key."""
-        key = ns._build_title_update_idempotency_key("tenant1", 123, "My Title")
-        assert "tenant1" in key
-        assert "123" in key
-        # Title should be hashed (SHA256 hex = 64 chars)
-        parts = key.split(":")
-        assert len(parts) == 3
-        assert len(parts[2]) == 64  # SHA256 hex digest
-
-    def test_title_update_key_different_titles_different_keys(self):
-        """Test that different titles produce different keys."""
-        key1 = ns._build_title_update_idempotency_key("tenant", 1, "Title A")
-        key2 = ns._build_title_update_idempotency_key("tenant", 1, "Title B")
-        assert key1 != key2
-
-    def test_title_update_key_same_inputs_same_key(self):
-        """Test that same inputs produce same key."""
-        key1 = ns._build_title_update_idempotency_key("tenant", 1, "Same Title")
-        key2 = ns._build_title_update_idempotency_key("tenant", 1, "Same Title")
-        assert key1 == key2
-
-
-class TestIdempotencyStartEnd:
-    """Tests for idempotency_start and idempotency_end functions."""
-
-    @pytest.mark.asyncio
-    async def test_idempotency_start_new_key(self):
-        """Test starting idempotency with new key succeeds."""
-        await ns.idempotency_start("new-key")
-        assert "new-key" in ns._IDEMPOTENCY_RUNNING
-
-    @pytest.mark.asyncio
-    async def test_idempotency_start_duplicate_key_raises(self):
-        """Test that duplicate key raises LimitExceededError."""
-        await ns.idempotency_start("duplicate-key")
-        with pytest.raises(LimitExceededError):
-            await ns.idempotency_start("duplicate-key")
-
-    @pytest.mark.asyncio
-    async def test_idempotency_end_removes_key(self):
-        """Test that idempotency_end removes the key."""
-        await ns.idempotency_start("end-key")
-        assert "end-key" in ns._IDEMPOTENCY_RUNNING
-        await ns.idempotency_end("end-key")
-        assert "end-key" not in ns._IDEMPOTENCY_RUNNING
-
-    @pytest.mark.asyncio
-    async def test_idempotency_end_nonexistent_key(self):
-        """Test that ending nonexistent key does not raise."""
-        await ns.idempotency_end("nonexistent-key")  # Should not raise
-
-    @pytest.mark.asyncio
-    async def test_idempotency_expired_key_can_be_reused(self, reset_test_isolation):
-        """Test that expired keys can be reused after TTL."""
-        # Use a very short TTL
-        await ns.idempotency_start("expire-key", ttl_seconds=1)
-        assert "expire-key" in ns._IDEMPOTENCY_RUNNING
-        # Wait for expiration
-        import asyncio
-        await asyncio.sleep(1.1)
-        # Should be able to start again with same key
-        await ns.idempotency_start("expire-key", ttl_seconds=1)
-
-
-class TestRateLimiting:
-    """Tests for rate limiting functionality."""
-
-    @pytest.mark.asyncio
-    async def test_rate_limit_first_request_allowed(self):
-        """Test first request under limit is allowed."""
-        await ns.check_and_consume_rate_limit("tenant-rate")
-        assert ns._RATE_STATE["tenant-rate"].get(ns._minute_bucket(), 0) == 1
-
-    @pytest.mark.asyncio
-    async def test_rate_limit_multiple_requests(self):
-        """Test multiple requests increment counter."""
-        for _ in range(5):
-            await ns.check_and_consume_rate_limit("tenant-multi")
-        assert ns._RATE_STATE["tenant-multi"].get(ns._minute_bucket(), 0) == 5
-
-    @pytest.mark.asyncio
-    async def test_rate_limit_exceeded_raises(self):
-        """Test that exceeding limit raises LimitExceededError."""
-        # Fill up to limit
-        for _ in range(ns._RATE_LIMIT_PER_MINUTE):
-            await ns.check_and_consume_rate_limit("tenant-limit")
-        with pytest.raises(LimitExceededError):
-            await ns.check_and_consume_rate_limit("tenant-limit")
-
-    @pytest.mark.asyncio
-    async def test_rate_limit_different_tenants(self):
-        """Test that different tenants have separate limits."""
-        for _ in range(10):
-            await ns.check_and_consume_rate_limit("tenant-a")
-        for _ in range(5):
-            await ns.check_and_consume_rate_limit("tenant-b")
-        assert ns._RATE_STATE["tenant-a"].get(ns._minute_bucket(), 0) == 10
-        assert ns._RATE_STATE["tenant-b"].get(ns._minute_bucket(), 0) == 5
-
-    @pytest.mark.asyncio
-    async def test_rate_limit_cleanup_old_buckets(self):
-        """Test that old minute buckets are cleaned up."""
-        # First, add a request to create an old bucket
-        old_bucket = str(int(ns._now_seconds() // 60) - 1)
-        ns._RATE_STATE["tenant-cleanup"] = {old_bucket: 50}
-        
-        # Make a new request - should trigger cleanup of old bucket
-        await ns.check_and_consume_rate_limit("tenant-cleanup")
-        
-        # Old bucket should be cleaned up, new bucket should have 1 request
-        current_bucket = ns._minute_bucket()
-        assert old_bucket not in ns._RATE_STATE["tenant-cleanup"]
-        assert ns._RATE_STATE["tenant-cleanup"].get(current_bucket, 0) == 1
-
 
 @pytest.mark.asyncio
 class TestStartStreamingChat:
@@ -359,25 +173,30 @@ class TestStartStreamingChat:
 
     async def test_start_streaming_chat_creates_conversation(self):
         """Test that new conversation is created when conversation_id is None."""
-        ctx = MockNorthboundContext(token_id=0)
+        ctx = MockNorthboundContext(token_id=1)
 
+        # Mock response
         mock_response = MagicMock()
         mock_response.headers = {}
-        agent_service_mod.run_agent_stream.return_value = mock_response
-
-        with patch.object(ns, 'check_and_consume_rate_limit', new_callable=AsyncMock), \
-                patch.object(ns, 'idempotency_start', new_callable=AsyncMock), \
-                patch.object(ns, 'get_conversation_history_internal', new_callable=AsyncMock) as mock_history:
-            mock_history.return_value = {"data": {"history": []}}
-
-            await ns.start_streaming_chat(
-                ctx=ctx,
-                conversation_id=None,
-                agent_name="test_agent",
-                query="test query"
-            )
-
-            conv_mgmt_mod.create_new_conversation.assert_called()
+        agent_service_mock.run_agent_stream.return_value = mock_response
+
+        with patch.object(ns, 'check_and_consume_rate_limit', new_callable=AsyncMock):
+            with patch.object(ns, 'idempotency_start', new_callable=AsyncMock):
+                with patch.object(ns, 'get_conversation_history_internal', new_callable=AsyncMock) as mock_history:
+                    mock_history.return_value = {"data": {"history": []}}
+
+                    try:
+                        result = await ns.start_streaming_chat(
+                            ctx=ctx,
+                            conversation_id=None,
+                            agent_name="test_agent",
+                            query="test query"
+                        )
+                    except Exception:
+                        pass  # May fail due to other mocks
+
+                    # Verify create_new_conversation was called
+                    conv_mgmt_mock.create_new_conversation.assert_called()
 
     async def test_start_streaming_chat_logs_token_usage(self):
         """Test that token usage is logged when token_id > 0."""
@@ -385,113 +204,27 @@ async def test_start_streaming_chat_logs_token_usage(self):
 
         mock_response = MagicMock()
         mock_response.headers = {}
-        agent_service_mod.run_agent_stream.return_value = mock_response
-
-        with patch.object(ns, 'check_and_consume_rate_limit', new_callable=AsyncMock), \
-                patch.object(ns, 'idempotency_start', new_callable=AsyncMock), \
-                patch.object(ns, 'idempotency_end', new_callable=AsyncMock), \
-                patch.object(ns, 'get_conversation_history_internal', new_callable=AsyncMock) as mock_history:
-            mock_history.return_value = {"data": {"history": []}}
-
-            await ns.start_streaming_chat(
-                ctx=ctx,
-                conversation_id=123,
-                agent_name="test_agent",
-                query="test query",
-                meta_data={"key": "value"}
-            )
-
-            token_db_mod.log_token_usage.assert_called()
-
-    async def test_start_streaming_chat_rate_limit_exceeded(self):
-        """Test that rate limit exceeded is properly propagated."""
-        ctx = MockNorthboundContext(token_id=0)
-
-        with patch.object(ns, 'check_and_consume_rate_limit', new_callable=AsyncMock) as mock_limit:
-            mock_limit.side_effect = LimitExceededError("Rate exceeded")
-            with pytest.raises(LimitExceededError):
-                await ns.start_streaming_chat(
-                    ctx=ctx,
-                    conversation_id=123,
-                    agent_name="test_agent",
-                    query="test query"
-                )
-
-    async def test_start_streaming_chat_uses_existing_conversation(self):
-        """Test that existing conversation_id is used without creating new one."""
-        ctx = MockNorthboundContext(token_id=0)
-        conv_mgmt_mod.create_new_conversation.reset_mock()
-
-        mock_response = MagicMock()
-        mock_response.headers = {}
-        agent_service_mod.run_agent_stream.return_value = mock_response
-
-        async def mock_get_history(*args, **kwargs):
-            return {"data": {"history": []}}
-
-        with patch.object(ns, 'check_and_consume_rate_limit', new_callable=AsyncMock), \
-                patch.object(ns, 'idempotency_start', new_callable=AsyncMock), \
-                patch.object(ns, 'idempotency_end', new_callable=AsyncMock), \
-                patch.object(ns, 'get_conversation_history_internal', side_effect=mock_get_history):
-            await ns.start_streaming_chat(
-                ctx=ctx,
-                conversation_id=456,
-                agent_name="test_agent",
-                query="test query"
-            )
-
-            conv_mgmt_mod.create_new_conversation.assert_not_called()
-
-    async def test_start_streaming_chat_no_token_id_no_logging(self):
-        """Test that token usage is not logged when token_id is 0."""
-        ctx = MockNorthboundContext(token_id=0)
-        token_db_mod.log_token_usage.reset_mock()
-
-        mock_response = MagicMock()
-        mock_response.headers = {}
-        agent_service_mod.run_agent_stream.return_value = mock_response
-
-        async def mock_get_history(*args, **kwargs):
-            return {"data": {"history": []}}
-
-        with patch.object(ns, 'check_and_consume_rate_limit', new_callable=AsyncMock), \
-                patch.object(ns, 'idempotency_start', new_callable=AsyncMock), \
-                patch.object(ns, 'idempotency_end', new_callable=AsyncMock), \
-                patch.object(ns, 'get_conversation_history_internal', side_effect=mock_get_history):
-            await ns.start_streaming_chat(
-                ctx=ctx,
-                conversation_id=123,
-                agent_name="test_agent",
-                query="test query"
-            )
-
-            token_db_mod.log_token_usage.assert_not_called()
-
-    async def test_start_streaming_chat_with_attachments(self):
-        """Test streaming chat with attachment normalization."""
-        ctx = MockNorthboundContext(token_id=0)
-        attachments = ["s3://bucket/file.txt"]
-
-        mock_response = MagicMock()
-        mock_response.headers = {}
-        agent_service_mod.run_agent_stream.return_value = mock_response
+        agent_service_mock.run_agent_stream.return_value = mock_response
 
-        with patch.object(ns, 'check_and_consume_rate_limit', new_callable=AsyncMock), \
-                patch.object(ns, 'idempotency_start', new_callable=AsyncMock), \
-                patch.object(ns, 'idempotency_end', new_callable=AsyncMock), \
-                patch.object(ns, 'get_conversation_history_internal', new_callable=AsyncMock) as mock_history, \
-                patch.object(ns, '_normalize_northbound_attachments', return_value=[{"name": "file.txt"}]) as mock_norm:
-            mock_history.return_value = {"data": {"history": []}}
+        with patch.object(ns, 'check_and_consume_rate_limit', new_callable=AsyncMock):
+            with patch.object(ns, 'idempotency_start', new_callable=AsyncMock):
+                with patch.object(ns, 'idempotency_end', new_callable=AsyncMock):
+                    with patch.object(ns, 'get_conversation_history_internal', new_callable=AsyncMock) as mock_history:
+                        mock_history.return_value = {"data": {"history": []}}
 
-            await ns.start_streaming_chat(
-                ctx=ctx,
-                conversation_id=123,
-                agent_name="test_agent",
-                query="test query",
-                attachments=attachments
-            )
+                        try:
+                            await ns.start_streaming_chat(
+                                ctx=ctx,
+                                conversation_id=123,
+                                agent_name="test_agent",
+                                query="test query",
+                                meta_data={"key": "value"}
+                            )
+                        except Exception:
+                            pass
 
-            mock_norm.assert_called_once()
+                        # Verify log_token_usage was called
+                        token_db_mock.log_token_usage.assert_called()
 
 
 @pytest.mark.asyncio
@@ -501,7 +234,7 @@ class TestStopChat:
     async def test_stop_chat_success(self):
         """Test successful stop chat."""
         ctx = MockNorthboundContext(token_id=1)
-        agent_service_mod.stop_agent_tasks.return_value = {"message": "stopped"}
+        agent_service_mock.stop_agent_tasks.return_value = {"message": "stopped"}
 
         result = await ns.stop_chat(ctx=ctx, conversation_id=123)
 
@@ -509,22 +242,12 @@ async def test_stop_chat_success(self):
         assert result["data"] == 123
 
     async def test_stop_chat_logs_token_usage(self):
-        """Test that token usage is logged when token_id > 0."""
+        """Test that token usage is logged."""
         ctx = MockNorthboundContext(token_id=1)
-        token_db_mod.log_token_usage.reset_mock()
 
         await ns.stop_chat(ctx=ctx, conversation_id=123, meta_data={"test": "data"})
 
-        token_db_mod.log_token_usage.assert_called()
-
-    async def test_stop_chat_no_token_id_no_logging(self):
-        """Test that token usage is not logged when token_id is 0."""
-        ctx = MockNorthboundContext(token_id=0)
-        token_db_mod.log_token_usage.reset_mock()
-
-        await ns.stop_chat(ctx=ctx, conversation_id=123)
-
-        token_db_mod.log_token_usage.assert_not_called()
+        token_db_mock.log_token_usage.assert_called()
 
 
 @pytest.mark.asyncio
@@ -533,7 +256,7 @@ class TestListConversations:
 
     async def test_list_conversations_success(self):
         """Test successful conversation listing."""
-        ctx = MockNorthboundContext(token_id=0)
+        ctx = MockNorthboundContext(token_id=0)  # No token_id, no metadata lookup
 
         result = await ns.list_conversations(ctx=ctx)
 
@@ -543,11 +266,12 @@ async def test_list_conversations_success(self):
     async def test_list_conversations_with_metadata(self):
         """Test that metadata is added when token_id > 0."""
         ctx = MockNorthboundContext(token_id=1)
-        token_db_mod.get_latest_usage_metadata.return_value = {"query": "test query"}
+        token_db_mock.get_latest_usage_metadata.return_value = {"query": "test query"}
 
         result = await ns.list_conversations(ctx=ctx)
 
-        token_db_mod.get_latest_usage_metadata.assert_called()
+        # Should have called get_latest_usage_metadata
+        token_db_mock.get_latest_usage_metadata.assert_called()
 
 
 @pytest.mark.asyncio
@@ -557,7 +281,7 @@ class TestGetConversationHistory:
     async def test_get_conversation_history_success(self):
         """Test successful history retrieval."""
         ctx = MockNorthboundContext(token_id=1)
-        conversation_db_mod.get_conversation_messages.return_value = [
+        conversation_db_mock.get_conversation_messages.return_value = [
             {"message_role": "user", "message_content": "Hello"},
             {"message_role": "assistant", "message_content": "Hi there"}
         ]
@@ -568,19 +292,6 @@ async def test_get_conversation_history_success(self):
         assert "data" in result
         assert "history" in result["data"]
 
-    async def test_get_conversation_history_fields_transformed(self):
-        """Test that message fields are properly transformed."""
-        ctx = MockNorthboundContext(token_id=0)
-        conversation_db_mod.get_conversation_messages.return_value = [
-            {"message_role": "user", "message_content": "Hello"}
-        ]
-
-        result = await ns.get_conversation_history(ctx=ctx, conversation_id=123)
-
-        history = result["data"]["history"]
-        assert history[0]["role"] == "user"
-        assert history[0]["content"] == "Hello"
-
 
 @pytest.mark.asyncio
 class TestGetConversationHistoryInternal:
@@ -589,7 +300,7 @@ class TestGetConversationHistoryInternal:
     async def test_get_conversation_history_internal_success(self):
         """Test internal history retrieval without logging."""
         ctx = MockNorthboundContext(token_id=0)
-        conversation_db_mod.get_conversation_messages.return_value = [
+        conversation_db_mock.get_conversation_messages.return_value = [
             {"message_role": "user", "message_content": "Hello"}
         ]
 
@@ -602,12 +313,12 @@ async def test_get_conversation_history_internal_success(self):
     async def test_get_conversation_history_internal_no_logging(self):
         """Test that internal function does not log token usage."""
         ctx = MockNorthboundContext(token_id=1)
-        conversation_db_mod.get_conversation_messages.return_value = []
-        token_db_mod.log_token_usage.reset_mock()
+        conversation_db_mock.get_conversation_messages.return_value = []
 
         await ns.get_conversation_history_internal(ctx=ctx, conversation_id=123)
 
-        token_db_mod.log_token_usage.assert_not_called()
+        # Should NOT call log_token_usage
+        token_db_mock.log_token_usage.assert_not_called()
 
 
 @pytest.mark.asyncio
@@ -615,10 +326,9 @@ class TestGetAgentInfoList:
     """Tests for get_agent_info_list function."""
 
     async def test_get_agent_info_list_success(self):
-        """Test successful agent info list retrieval for asset owner tenant."""
-        # Use asset owner tenant to avoid merging asset owner agents
-        ctx = MockNorthboundContext(tenant_id="asset-owner-tenant", token_id=1)
-        agent_version_mod.list_published_agents_impl.return_value = [
+        """Test successful agent info list retrieval."""
+        ctx = MockNorthboundContext(token_id=1)
+        agent_service_mock.list_all_agent_info_impl.return_value = [
             {"agent_id": 1, "name": "test_agent", "description": "Test"}
         ]
 
@@ -626,21 +336,9 @@ async def test_get_agent_info_list_success(self):
 
         assert result["message"] == "success"
         assert len(result["data"]) == 1
+        # agent_id should be removed
         assert "agent_id" not in result["data"][0]
 
-    async def test_get_agent_info_list_includes_asset_owner_agents(self):
-        """Test that asset owner agents are included for non-asset-owner tenants."""
-        ctx = MockNorthboundContext(tenant_id="other-tenant", token_id=0)
-        agent_version_mod.list_published_agents_impl.side_effect = [
-            [{"agent_id": 1, "name": "local_agent"}],
-            [{"agent_id": 2, "name": "asset_agent"}]
-        ]
-
-        result = await ns.get_agent_info_list(ctx=ctx)
-
-        assert len(result["data"]) == 2
-        agent_version_mod.list_published_agents_impl.assert_called()
-
 
 @pytest.mark.asyncio
 class TestUpdateConversationTitle:
@@ -661,9 +359,8 @@ async def test_update_conversation_title_success(self):
         assert "idempotency_key" in result
 
     async def test_update_conversation_title_logs_token_usage(self):
-        """Test that token usage is logged when token_id > 0."""
+        """Test that token usage is logged."""
         ctx = MockNorthboundContext(token_id=1)
-        token_db_mod.log_token_usage.reset_mock()
 
         await ns.update_conversation_title(
             ctx=ctx,
@@ -672,10 +369,10 @@ async def test_update_conversation_title_logs_token_usage(self):
             meta_data={"source": "api"}
         )
 
-        token_db_mod.log_token_usage.assert_called()
+        token_db_mock.log_token_usage.assert_called()
 
-    async def test_update_conversation_title_custom_idempotency_key(self):
-        """Test that custom idempotency key is used when provided."""
+    async def test_update_conversation_title_idempotency_key(self):
+        """Test that idempotency key is properly built."""
         ctx = MockNorthboundContext(tenant_id="tenant-1", token_id=1)
 
         result = await ns.update_conversation_title(
@@ -686,726 +383,3 @@ async def test_update_conversation_title_custom_idempotency_key(self):
         )
 
         assert result["idempotency_key"] == "custom-key"
-
-    async def test_update_conversation_title_idempotency_prevents_duplicate(self):
-        """Test that duplicate requests within TTL are prevented."""
-        ctx = MockNorthboundContext(tenant_id="tenant-1", token_id=0)
-
-        # First call should succeed
-        await ns.update_conversation_title(
-            ctx=ctx,
-            conversation_id=123,
-            title="New Title"
-        )
-
-        # Second call with same params should raise LimitExceededError
-        with pytest.raises(LimitExceededError):
-            await ns.update_conversation_title(
-                ctx=ctx,
-                conversation_id=123,
-                title="New Title"
-            )
-
-
-class TestReleaseIdempotencyAfterDelay:
-    """Tests for _release_idempotency_after_delay function."""
-
-    @pytest.mark.asyncio
-    async def test_release_after_delay(self):
-        """Test that idempotency key is released after delay."""
-        import asyncio
-
-        await ns.idempotency_start("delayed-key")
-        assert "delayed-key" in ns._IDEMPOTENCY_RUNNING
-
-        asyncio.create_task(ns._release_idempotency_after_delay("delayed-key", seconds=0.1))
-        await asyncio.sleep(0.2)
-
-        assert "delayed-key" not in ns._IDEMPOTENCY_RUNNING
-
-
-class TestMinuteBucket:
-    """Tests for _minute_bucket helper function."""
-
-    def test_minute_bucket_returns_string(self):
-        """Test that minute bucket is a string."""
-        bucket = ns._minute_bucket()
-        assert isinstance(bucket, str)
-
-    def test_minute_bucket_consistent_for_same_time(self):
-        """Test that same time produces same bucket."""
-        ts = 1234567890.0
-        bucket1 = ns._minute_bucket(ts)
-        bucket2 = ns._minute_bucket(ts)
-        assert bucket1 == bucket2
-
-    def test_minute_bucket_different_for_different_minutes(self):
-        """Test that different minutes produce different buckets."""
-        ts1 = 1000000.0
-        ts2 = ts1 + 60
-        bucket1 = ns._minute_bucket(ts1)
-        bucket2 = ns._minute_bucket(ts2)
-        assert bucket1 != bucket2
-
-
-class TestStartStreamingChatErrorHandling:
-    """Tests for error handling in start_streaming_chat function."""
-
-    async def test_start_streaming_chat_unauthorized_error(self):
-        """Test that UnauthorizedError is properly propagated."""
-        ctx = MockNorthboundContext(token_id=0)
-
-        with patch.object(ns, 'check_and_consume_rate_limit', new_callable=AsyncMock) as mock_limit:
-            mock_limit.side_effect = UnauthorizedError("Unauthorized")
-            with pytest.raises(UnauthorizedError):
-                await ns.start_streaming_chat(
-                    ctx=ctx,
-                    conversation_id=123,
-                    agent_name="test_agent",
-                    query="test query"
-                )
-
-    async def test_start_streaming_chat_get_agent_id_error(self):
-        """Test that get_agent_id_by_name error is wrapped properly."""
-        ctx = MockNorthboundContext(token_id=0)
-
-        with patch.object(ns, 'check_and_consume_rate_limit', new_callable=AsyncMock), \
-                patch.object(ns, 'get_conversation_history_internal', new_callable=AsyncMock) as mock_history, \
-                patch.object(ns, 'get_agent_id_by_name', new_callable=AsyncMock) as mock_get_id:
-            mock_history.return_value = {"data": {"history": []}}
-            mock_get_id.side_effect = Exception("Agent not found")
-
-            with pytest.raises(Exception) as exc_info:
-                await ns.start_streaming_chat(
-                    ctx=ctx,
-                    conversation_id=123,
-                    agent_name="nonexistent_agent",
-                    query="test query"
-                )
-            # The exception is wrapped in the outer try/except block
-            assert "Agent not found" in str(exc_info.value)
-
-    async def test_start_streaming_chat_save_message_error(self):
-        """Test that save_conversation_user error is wrapped properly."""
-        ctx = MockNorthboundContext(token_id=0)
-
-        mock_response = MagicMock()
-        mock_response.headers = {}
-        agent_service_mod.run_agent_stream.return_value = mock_response
-
-        async def mock_get_history(*args, **kwargs):
-            return {"data": {"history": []}}
-
-        with patch.object(ns, 'check_and_consume_rate_limit', new_callable=AsyncMock), \
-                patch.object(ns, 'idempotency_start', new_callable=AsyncMock), \
-                patch.object(ns, 'idempotency_end', new_callable=AsyncMock), \
-                patch.object(ns, 'get_conversation_history_internal', side_effect=mock_get_history), \
-                patch.object(ns, 'save_conversation_user', side_effect=Exception("DB error")):
-            with pytest.raises(Exception) as exc_info:
-                await ns.start_streaming_chat(
-                    ctx=ctx,
-                    conversation_id=123,
-                    agent_name="test_agent",
-                    query="test query"
-                )
-            assert "Failed to persist user message" in str(exc_info.value)
-
-    async def test_start_streaming_chat_token_logging_failure(self):
-        """Test that token logging failure is handled gracefully."""
-        ctx = MockNorthboundContext(token_id=1)
-
-        mock_response = MagicMock()
-        mock_response.headers = {}
-        agent_service_mod.run_agent_stream.return_value = mock_response
-        token_db_mod.log_token_usage.side_effect = Exception("Logging failed")
-
-        async def mock_get_history(*args, **kwargs):
-            return {"data": {"history": []}}
-
-        with patch.object(ns, 'check_and_consume_rate_limit', new_callable=AsyncMock), \
-                patch.object(ns, 'idempotency_start', new_callable=AsyncMock), \
-                patch.object(ns, 'idempotency_end', new_callable=AsyncMock), \
-                patch.object(ns, 'get_conversation_history_internal', side_effect=mock_get_history):
-            # Should not raise even if token logging fails
-            result = await ns.start_streaming_chat(
-                ctx=ctx,
-                conversation_id=123,
-                agent_name="test_agent",
-                query="test query",
-                meta_data={"key": "value"}
-            )
-            assert result is not None
-
-
-class TestStopChatErrorHandling:
-    """Tests for error handling in stop_chat function."""
-
-    async def test_stop_chat_error(self):
-        """Test that errors in stop_chat are wrapped properly."""
-        ctx = MockNorthboundContext(token_id=0)
-        agent_service_mod.stop_agent_tasks.side_effect = Exception("Stop failed")
-
-        with pytest.raises(Exception) as exc_info:
-            await ns.stop_chat(ctx=ctx, conversation_id=123)
-        assert "Failed to stop chat" in str(exc_info.value)
-
-    async def test_stop_chat_token_logging_failure(self):
-        """Test that token logging failure is handled gracefully."""
-        ctx = MockNorthboundContext(token_id=1)
-        token_db_mod.log_token_usage.side_effect = Exception("Logging failed")
-
-        with patch("backend.services.northbound_service.stop_agent_tasks", return_value={"message": "stopped"}):
-            # Should not raise even if token logging fails
-            result = await ns.stop_chat(ctx=ctx, conversation_id=123, meta_data={"key": "value"})
-            assert result is not None
-
-
-class TestListConversationsErrorHandling:
-    """Tests for error handling in list_conversations function."""
-
-    async def test_list_conversations_with_metadata_error(self):
-        """Test that metadata fetch error is handled gracefully."""
-        ctx = MockNorthboundContext(token_id=1)
-        conv_mgmt_mod.get_conversation_list_service.return_value = [
-            {"conversation_id": "1", "title": "Test"}
-        ]
-        token_db_mod.get_latest_usage_metadata.side_effect = Exception("DB error")
-
-        # Should not raise even if metadata fetch fails
-        result = await ns.list_conversations(ctx=ctx)
-        assert result["message"] == "success"
-
-    async def test_list_conversations_empty_meta_data_removed(self):
-        """Test that empty meta_data keys are removed from items."""
-        ctx = MockNorthboundContext(token_id=1)
-        conv_mgmt_mod.get_conversation_list_service.return_value = [
-            {"conversation_id": "1", "title": "Test", "meta_data": {}}
-        ]
-
-        result = await ns.list_conversations(ctx=ctx)
-        assert "meta_data" not in result["data"][0]
-
-    async def test_list_conversations_meta_data_with_no_usage_record(self):
-        """Test that meta_data is removed when get_latest_usage_metadata returns empty."""
-        ctx = MockNorthboundContext(token_id=1)
-        conv_mgmt_mod.get_conversation_list_service.return_value = [
-            {"conversation_id": "1", "title": "Test"}
-        ]
-        token_db_mod.get_latest_usage_metadata.return_value = None
-
-        result = await ns.list_conversations(ctx=ctx)
-        assert "meta_data" not in result["data"][0]
-
-    async def test_list_conversations_meta_data_set_when_present(self):
-        """Test that meta_data is set on item when get_latest_usage_metadata returns a non-empty value."""
-        ctx = MockNorthboundContext(token_id=1)
-        conv_mgmt_mod.get_conversation_list_service.return_value = [
-            {"conversation_id": "1", "title": "Test"}
-        ]
-        # Reset side_effect and set return_value
-        token_db_mod.get_latest_usage_metadata.side_effect = None
-        token_db_mod.get_latest_usage_metadata.return_value = {"query": "test query"}
-
-        result = await ns.list_conversations(ctx=ctx)
-        assert "meta_data" in result["data"][0]
-        assert result["data"][0]["meta_data"]["query"] == "test query"
-
-    async def test_list_conversations_meta_data_empty_dict_removed(self):
-        """Test that empty meta_data (empty dict) is removed from item."""
-        ctx = MockNorthboundContext(token_id=1)
-        conv_mgmt_mod.get_conversation_list_service.return_value = [
-            {"conversation_id": "1", "title": "Test"}
-        ]
-        # Reset side_effect and set return_value to empty dict (falsy)
-        token_db_mod.get_latest_usage_metadata.side_effect = None
-        token_db_mod.get_latest_usage_metadata.return_value = {}
-
-        result = await ns.list_conversations(ctx=ctx)
-        # Empty dict is falsy, so meta_data should be popped
-        assert "meta_data" not in result["data"][0]
-
-
-class TestGetConversationHistoryErrorHandling:
-    """Tests for error handling in get_conversation_history function."""
-
-    async def test_get_conversation_history_error(self):
-        """Test that errors in get_conversation_history are wrapped properly."""
-        ctx = MockNorthboundContext(token_id=0)
-        # Mock get_conversation_messages to raise an error
-        conversation_db_mod.get_conversation_messages.side_effect = Exception("DB error")
-
-        with pytest.raises(Exception) as exc_info:
-            await ns.get_conversation_history(ctx=ctx, conversation_id=123)
-        assert "Failed to get conversation history" in str(exc_info.value)
-
-
-class TestGetAgentInfoListErrorHandling:
-    """Tests for get_agent_info_list function."""
-
-    @pytest.mark.asyncio
-    async def test_get_agent_info_by_name_success(self):
-        """Test successful agent ID retrieval."""
-        agent_service_mod.get_agent_id_by_name.return_value = 42
-        
-        result = await ns.get_agent_info_by_name("test_agent", "tenant-1")
-        assert result == 42
-
-    @pytest.mark.asyncio
-    async def test_get_agent_info_by_name_error(self):
-        """Test that errors are wrapped properly."""
-        agent_service_mod.get_agent_id_by_name.side_effect = Exception("Agent not found")
-        
-        with pytest.raises(Exception) as exc_info:
-            await ns.get_agent_info_by_name("nonexistent", "tenant-1")
-        assert "Failed to get agent id" in str(exc_info.value)
-        assert "nonexistent" in str(exc_info.value)
-        assert "tenant-1" in str(exc_info.value)
-
-    async def test_get_agent_info_list_error(self):
-        """Test that errors in get_agent_info_list are wrapped properly."""
-        ctx = MockNorthboundContext(tenant_id="asset-owner-tenant", token_id=0)
-        agent_version_mod.list_published_agents_impl.side_effect = Exception("DB error")
-
-        with pytest.raises(Exception) as exc_info:
-            await ns.get_agent_info_list(ctx=ctx)
-        assert "Failed to get agent info list" in str(exc_info.value)
-
-
-class TestUpdateConversationTitleErrorHandling:
-    """Tests for error handling in update_conversation_title function."""
-
-    async def test_update_conversation_title_error(self):
-        """Test that errors in update_conversation_title are wrapped properly."""
-        ctx = MockNorthboundContext(token_id=0)
-        conv_mgmt_mod.update_conversation_title.side_effect = Exception("DB error")
-
-        with pytest.raises(Exception) as exc_info:
-            await ns.update_conversation_title(
-                ctx=ctx,
-                conversation_id=123,
-                title="New Title"
-            )
-        assert "Failed to update conversation title" in str(exc_info.value)
-
-    async def test_update_conversation_title_token_logging_failure(self):
-        """Test that token logging failure is handled gracefully."""
-        ctx = MockNorthboundContext(token_id=1)
-        token_db_mod.log_token_usage.side_effect = Exception("Logging failed")
-        # Ensure update_conversation_title_service succeeds
-        conv_mgmt_mod.update_conversation_title.side_effect = None
-        conv_mgmt_mod.update_conversation_title.return_value = True
-
-        # Should not raise even if token logging fails
-        result = await ns.update_conversation_title(
-            ctx=ctx,
-            conversation_id=123,
-            title="New Title",
-            meta_data={"key": "value"}
-        )
-        assert result["message"] == "success"
-
-    async def test_update_conversation_title_conversation_not_found(self):
-        """Test that ConversationNotFoundError is propagated without wrapping."""
-        ctx = MockNorthboundContext(token_id=0)
-        conv_mgmt_mod.update_conversation_title.side_effect = ConversationNotFoundError("Not found")
-
-        with pytest.raises(ConversationNotFoundError):
-            await ns.update_conversation_title(
-                ctx=ctx,
-                conversation_id=123,
-                title="New Title"
-            )
-
-
-class TestNormalizeAttachmentsErrorHandling:
-    """Tests for error handling in _normalize_northbound_attachments function."""
-
-    def test_normalize_attachments_parse_s3_url_error(self):
-        """Test that parse_s3_url ValueError is converted to ValueError."""
-        with patch("backend.services.northbound_service.parse_s3_url", side_effect=ValueError("Parse error")):
-            with pytest.raises(ValueError) as exc_info:
-                ns._normalize_northbound_attachments(
-                    ["s3://bucket/file.txt"],
-                    "user123",
-                    "tenant123"
-                )
-            assert "Invalid S3 URL format" in str(exc_info.value)
-
-    def test_normalize_attachments_permission_error_invalid_url(self):
-        """Test that PermissionError with invalid URL is converted to ValueError."""
-        with patch("backend.services.northbound_service.parse_s3_url", return_value=("bucket", "path/file.txt")), \
-                patch("backend.services.northbound_service.validate_urls_access",
-                      side_effect=PermissionError("Invalid S3 URL format: bad")):
-            with pytest.raises(ValueError) as exc_info:
-                ns._normalize_northbound_attachments(
-                    ["s3://bucket/path/file.txt"],
-                    "user123",
-                    "tenant123"
-                )
-            assert "Invalid S3 URL format" in str(exc_info.value)
-
-    def test_normalize_attachments_invalid_type(self):
-        """Test that non-list attachments raise ValueError."""
-        with pytest.raises(ValueError) as exc_info:
-            ns._normalize_northbound_attachments("s3://bucket/file.txt", "user123", "tenant123")
-        assert "attachments must be an array" in str(exc_info.value)
-
-    def test_normalize_attachments_empty_list(self):
-        """Test that an empty list returns an empty list."""
-        assert ns._normalize_northbound_attachments([], "user123", "tenant123") == []
-
-    def test_normalize_attachments_invalid_url(self):
-        """Test that an unsupported URL scheme raises ValueError."""
-        with pytest.raises(ValueError) as exc_info:
-            ns._normalize_northbound_attachments(["https://example.com/file.txt"], "user123", "tenant123")
-        assert "Invalid attachment format" in str(exc_info.value) or "Invalid S3 URL format" in str(exc_info.value)
-
-    def test_normalize_attachments_empty_string(self):
-        """Test that an empty-string attachment raises ValueError."""
-        with pytest.raises(ValueError) as exc_info:
-            ns._normalize_northbound_attachments([""], "user123", "tenant123")
-        assert "non-empty" in str(exc_info.value)
-
-    def test_normalize_attachments_whitespace_string(self):
-        """Test that a whitespace-only attachment raises ValueError."""
-        with pytest.raises(ValueError) as exc_info:
-            ns._normalize_northbound_attachments(["  "], "user123", "tenant123")
-        assert "non-empty" in str(exc_info.value)
-
-    def test_normalize_attachments_permission_denied(self):
-        """Test that a generic PermissionError is re-raised as-is."""
-        with patch(
-            "backend.services.northbound_service.validate_urls_access",
-            side_effect=PermissionError("Access denied: You don't have permission to access this file")
-        ):
-            with pytest.raises(PermissionError) as exc_info:
-                ns._normalize_northbound_attachments(["s3://bucket/attachments/other/file.txt"], "user123", "tenant123")
-            assert "Access denied" in str(exc_info.value)
-
-    def test_normalize_attachments_s3_url_success(self):
-        """Test successful normalization of an s3:// URL with assertions on collaborator calls."""
-        with patch("backend.services.northbound_service.validate_urls_access") as mock_validate, \
-                patch("backend.services.northbound_service.get_file_url", return_value={
-                    "success": True,
-                    "url": "https://proxy.example/file"
-                }) as mock_get_url, \
-                patch("backend.services.northbound_service.parse_s3_url", return_value=("nexent", "attachments/user123/report.pdf")):
-            result = ns._normalize_northbound_attachments(
-                ["s3://nexent/attachments/user123/report.pdf"],
-                "user123",
-                "tenant123",
-            )
-
-        mock_validate.assert_called_once_with(
-            ["s3://nexent/attachments/user123/report.pdf"],
-            "user123",
-            "tenant123",
-        )
-        mock_get_url.assert_called_once_with(
-            object_name="attachments/user123/report.pdf",
-            expires=86400,
-        )
-        assert result == [{
-            "name": "report.pdf",
-            "object_name": "attachments/user123/report.pdf",
-            "url": "/nexent/attachments/user123/report.pdf",
-            "type": "file",
-            "size": 0,
-            "description": "",
-            "presigned_url": "https://proxy.example/file",
-        }]
-
-    def test_normalize_attachments_no_presigned_url(self):
-        """Test that presigned_url is omitted when get_file_url returns no url."""
-        with patch("backend.services.northbound_service.validate_urls_access"), \
-                patch("backend.services.northbound_service.get_file_url", return_value={
-                    "success": True,
-                    "url": None
-                }), \
-                patch("backend.services.northbound_service.parse_s3_url", return_value=("nexent", "attachments/user123/report.pdf")):
-            result = ns._normalize_northbound_attachments(
-                ["s3://nexent/attachments/user123/report.pdf"],
-                "user123",
-                "tenant123",
-            )
-        assert "presigned_url" not in result[0]
-
-    def test_normalize_attachments_relative_path(self):
-        """Test support for attachments/xxx.md relative path format."""
-        with patch("backend.services.northbound_service.validate_urls_access") as mock_validate, \
-                patch("backend.services.northbound_service.get_file_url", return_value={
-                    "success": True,
-                    "url": "https://proxy.example/file"
-                }) as mock_get_url:
-            result = ns._normalize_northbound_attachments(
-                ["attachments/user123/report.pdf"],
-                "user123",
-                "tenant123",
-            )
-
-        mock_validate.assert_called_once_with(
-            ["s3://nexent/attachments/user123/report.pdf"],
-            "user123",
-            "tenant123",
-        )
-        mock_get_url.assert_called_once_with(
-            object_name="attachments/user123/report.pdf",
-            expires=86400,
-        )
-        assert result == [{
-            "name": "report.pdf",
-            "object_name": "attachments/user123/report.pdf",
-            "url": "/nexent/attachments/user123/report.pdf",
-            "type": "file",
-            "size": 0,
-            "description": "",
-            "presigned_url": "https://proxy.example/file",
-        }]
-
-    def test_normalize_attachments_nexent_path(self):
-        """Test support for nexent/xxx.md path format."""
-        with patch("backend.services.northbound_service.validate_urls_access") as mock_validate, \
-                patch("backend.services.northbound_service.get_file_url", return_value={
-                    "success": True,
-                    "url": "https://proxy.example/file"
-                }) as mock_get_url:
-            result = ns._normalize_northbound_attachments(
-                ["nexent/attachments/user123/report.pdf"],
-                "user123",
-                "tenant123",
-            )
-
-        mock_validate.assert_called_once_with(
-            ["s3://nexent/nexent/attachments/user123/report.pdf"],
-            "user123",
-            "tenant123",
-        )
-        mock_get_url.assert_called_once_with(
-            object_name="nexent/attachments/user123/report.pdf",
-            expires=86400,
-        )
-        assert result == [{
-            "name": "report.pdf",
-            "object_name": "nexent/attachments/user123/report.pdf",
-            "url": "/nexent/nexent/attachments/user123/report.pdf",
-            "type": "file",
-            "size": 0,
-            "description": "",
-            "presigned_url": "https://proxy.example/file",
-        }]
-
-    def test_normalize_attachments_absolute_path(self):
-        """Test support for /nexent/xxx.md absolute path format."""
-        with patch("backend.services.northbound_service.validate_urls_access") as mock_validate, \
-                patch("backend.services.northbound_service.get_file_url", return_value={
-                    "success": True,
-                    "url": "https://proxy.example/file"
-                }) as mock_get_url:
-            result = ns._normalize_northbound_attachments(
-                ["/nexent/attachments/user123/report.pdf"],
-                "user123",
-                "tenant123",
-            )
-
-        mock_validate.assert_called_once_with(
-            ["s3://nexent/attachments/user123/report.pdf"],
-            "user123",
-            "tenant123",
-        )
-        mock_get_url.assert_called_once_with(
-            object_name="attachments/user123/report.pdf",
-            expires=86400,
-        )
-        assert result == [{
-            "name": "report.pdf",
-            "object_name": "attachments/user123/report.pdf",
-            "url": "/nexent/attachments/user123/report.pdf",
-            "type": "file",
-            "size": 0,
-            "description": "",
-            "presigned_url": "https://proxy.example/file",
-        }]
-
-
-class TestNorthboundFileDescriptorAndUpload:
-    """Tests for _build_northbound_file_descriptor and upload_files_for_northbound."""
-
-    def test_build_file_descriptor_defaults(self):
-        """Test that descriptor uses file_name and includes presigned_url when present."""
-        result = ns._build_northbound_file_descriptor({
-            "file_name": "report.pdf",
-            "object_name": "attachments/user123/report.pdf",
-            "presigned_url": "https://proxy.example/file",
-        })
-
-        assert result["name"] == "report.pdf"
-        assert result["object_name"] == "attachments/user123/report.pdf"
-        assert result["type"] == "file"
-        assert result["size"] == 0
-        assert result["url"] == "/nexent/attachments/user123/report.pdf"
-        assert result["description"] == ""
-        assert result["presigned_url"] == "https://proxy.example/file"
-
-    def test_build_file_descriptor_with_original_filename(self):
-        """Test that original_file_name parameter takes precedence over upload_result file_name."""
-        result = ns._build_northbound_file_descriptor({
-            "file_name": "auto_generated_name.md",
-            "object_name": "attachments/user123/20260101120000_abc123.md",
-            "file_size": 0,
-        }, original_file_name="original-document.pdf", file_size=2048)
-
-        assert result["name"] == "original-document.pdf"
-        assert result["object_name"] == "attachments/user123/20260101120000_abc123.md"
-        assert result["type"] == "file"
-        assert result["size"] == 2048
-        assert result["url"] == "/nexent/attachments/user123/20260101120000_abc123.md"
-        assert result["description"] == ""
-
-    def test_build_file_descriptor_with_type_and_size(self):
-        """Test that explicit file_type and file_size override upload_result values."""
-        result = ns._build_northbound_file_descriptor({
-            "file_name": "image.png",
-            "object_name": "attachments/user123/image.png",
-            "file_size": 1024,
-            "content_type": "image/png",
-        }, file_type="image", file_size=2048)
-
-        assert result["name"] == "image.png"
-        assert result["object_name"] == "attachments/user123/image.png"
-        assert result["type"] == "image"
-        assert result["size"] == 2048
-        assert result["url"] == "/nexent/attachments/user123/image.png"
-        assert result["description"] == ""
-
-    def test_build_file_descriptor_no_filename(self):
-        """Test that basename(object_name) is used when no filename is provided."""
-        result = ns._build_northbound_file_descriptor({
-            "object_name": "attachments/user123/report.pdf",
-        })
-        assert result["name"] == "report.pdf"
-        assert result["object_name"] == "attachments/user123/report.pdf"
-        assert result["type"] == "file"
-
-    def test_build_file_descriptor_no_presigned_url(self):
-        """Test that presigned_url is omitted when not present in upload_result."""
-        result = ns._build_northbound_file_descriptor({
-            "file_name": "report.pdf",
-            "object_name": "attachments/user123/report.pdf",
-        })
-        assert "presigned_url" not in result
-
-    @pytest.mark.asyncio
-    async def test_upload_files_for_northbound_success(self):
-        """Test successful upload returns normalized descriptors and summary counts."""
-        ctx = ns.NorthboundContext(
-            request_id="req-123",
-            tenant_id="tenant123",
-            user_id="user123",
-            authorization="Bearer token",
-            token_id=1,
-        )
-        mock_file = MagicMock()
-        mock_file.filename = "report.pdf"
-
-        with patch(
-            "backend.services.northbound_service.resolve_minio_upload_folder",
-            return_value="attachments/user123"
-        ), patch(
-            "backend.services.northbound_service.upload_to_minio",
-            AsyncMock(return_value=[{
-                "success": True,
-                "file_name": "report.pdf",
-                "object_name": "attachments/user123/report.pdf",
-                "content_type": "application/pdf",
-                "file_size": 1024,
-                "presigned_url": "https://proxy.example/file",
-            }])
-        ):
-            result = await ns.upload_files_for_northbound(ctx, [mock_file])
-
-        assert result["summary"]["uploaded"] == 1
-        assert result["summary"]["failed"] == 0
-        assert result["files"][0]["object_name"] == "attachments/user123/report.pdf"
-        assert result["files"][0]["name"] == "report.pdf"
-        assert result["files"][0]["type"] == "file"
-        assert result["files"][0]["size"] == 1024
-        assert result["files"][0]["url"] == "/nexent/attachments/user123/report.pdf"
-        assert result["files"][0]["description"] == ""
-
-    @pytest.mark.asyncio
-    async def test_upload_files_for_northbound_no_files(self):
-        """Test that uploading with no files raises ValueError."""
-        ctx = ns.NorthboundContext(
-            request_id="req-123",
-            tenant_id="tenant123",
-            user_id="user123",
-            authorization="Bearer token",
-        )
-        with pytest.raises(ValueError) as exc_info:
-            await ns.upload_files_for_northbound(ctx, [])
-        assert "No files in the request" in str(exc_info.value)
-
-    @pytest.mark.asyncio
-    async def test_upload_files_for_northbound_all_failed(self):
-        """Test that all-failed uploads raise ValueError."""
-        ctx = ns.NorthboundContext(
-            request_id="req-123",
-            tenant_id="tenant123",
-            user_id="user123",
-            authorization="Bearer token",
-        )
-        mock_file = MagicMock()
-        mock_file.filename = "report.pdf"
-
-        with patch(
-            "backend.services.northbound_service.resolve_minio_upload_folder",
-            return_value="attachments/user123"
-        ), patch(
-            "backend.services.northbound_service.upload_to_minio",
-            AsyncMock(return_value=[{
-                "success": False,
-                "file_name": "report.pdf",
-                "object_name": None,
-            }])
-        ):
-            with pytest.raises(ValueError) as exc_info:
-                await ns.upload_files_for_northbound(ctx, [mock_file])
-        assert "No valid files uploaded" in str(exc_info.value)
-
-    @pytest.mark.asyncio
-    async def test_upload_files_for_northbound_mixed_results(self):
-        """Test that mixed success/failure results are reflected in the summary counts."""
-        ctx = ns.NorthboundContext(
-            request_id="req-123",
-            tenant_id="tenant123",
-            user_id="user123",
-            authorization="Bearer token",
-        )
-        mock_file1 = MagicMock()
-        mock_file1.filename = "report.pdf"
-        mock_file2 = MagicMock()
-        mock_file2.filename = "image.png"
-
-        with patch(
-            "backend.services.northbound_service.resolve_minio_upload_folder",
-            return_value="attachments/user123"
-        ), patch(
-            "backend.services.northbound_service.upload_to_minio",
-            AsyncMock(return_value=[
-                {
-                    "success": True,
-                    "file_name": "report.pdf",
-                    "object_name": "attachments/user123/report.pdf",
-                },
-                {
-                    "success": False,
-                    "file_name": "image.png",
-                    "object_name": None,
-                },
-            ])
-        ):
-            result = await ns.upload_files_for_northbound(ctx, [mock_file1, mock_file2])
-
-        assert result["summary"]["total"] == 2
-        assert result["summary"]["uploaded"] == 1
-        assert result["summary"]["failed"] == 1
diff --git a/test/backend/services/test_prompt_service.py b/test/backend/services/test_prompt_service.py
index 4d8e4f3f6..51964cef6 100644
--- a/test/backend/services/test_prompt_service.py
+++ b/test/backend/services/test_prompt_service.py
@@ -4,71 +4,12 @@
 import unittest
 import json
 import sys
-import atexit
 from unittest.mock import patch, MagicMock
 
-_MODULE_PATCH_SENTINEL = object()
-_MODULE_PATCH_NAMES = [
-    'boto3',
-    'elasticsearch',
-    'sqlalchemy',
-    'sqlalchemy.create_engine',
-    'sqlalchemy.orm',
-    'sqlalchemy.dialects',
-    'sqlalchemy.dialects.postgresql',
-    'sqlalchemy.sql',
-    'database.agent_db',
-    'database.tool_db',
-    'database.model_management_db',
-    'database.knowledge_db',
-    'database.client',
-    'database.db_models',
-    'utils.llm_utils',
-    'utils.prompt_template_utils',
-    'services.agent_service',
-    'services.prompt_template_service',
-    'nexent',
-    'nexent.core',
-    'nexent.core.agents',
-    'nexent.core.agents.agent_model',
-    'nexent.storage',
-    'nexent.storage.storage_client_factory',
-    'nexent.storage.minio_config',
-    'nexent.vector_database',
-    'nexent.memory',
-    'nexent.monitor',
-]
-_MODULE_PATCH_ORIGINALS = {
-    name: sys.modules.get(name, _MODULE_PATCH_SENTINEL)
-    for name in _MODULE_PATCH_NAMES
-}
-
-
-def _restore_patched_modules() -> None:
-    for name, original in _MODULE_PATCH_ORIGINALS.items():
-        if original is _MODULE_PATCH_SENTINEL:
-            sys.modules.pop(name, None)
-        else:
-            sys.modules[name] = original
-
-
-atexit.register(_restore_patched_modules)
-
-
-class MockToolConfig:
-    def __init__(self, *args, **kwargs):
-        for key, value in kwargs.items():
-            setattr(self, key, value)
-
-    def model_dump(self, **kwargs):
-        return {k: v for k, v in self.__dict__.items() if not k.startswith('_')}
-
 # Mock nexent module hierarchy BEFORE any backend imports that depend on it
 nexent_mock = MagicMock()
 nexent_core_mock = MagicMock()
 nexent_core_agents_mock = MagicMock()
-nexent_agent_model_mock = MagicMock()
-nexent_agent_model_mock.ToolConfig = MockToolConfig
 nexent_storage_mock = MagicMock()
 nexent_storage_storage_client_factory_mock = MagicMock()
 nexent_storage_minio_config_mock = MagicMock()
@@ -79,7 +20,6 @@ def model_dump(self, **kwargs):
 sys.modules['nexent'] = nexent_mock
 sys.modules['nexent.core'] = nexent_core_mock
 sys.modules['nexent.core.agents'] = nexent_core_agents_mock
-sys.modules['nexent.core.agents.agent_model'] = nexent_agent_model_mock
 sys.modules['nexent.storage'] = nexent_storage_mock
 sys.modules['nexent.storage.storage_client_factory'] = nexent_storage_storage_client_factory_mock
 sys.modules['nexent.storage.minio_config'] = nexent_storage_minio_config_mock
@@ -103,7 +43,6 @@ def model_dump(self, **kwargs):
 
 from consts.error_code import ErrorCode
 from consts.exceptions import AppException
-from consts.const import ENABLE_JIUWEN_SDK
 
 # Mock boto3 and minio client before importing the module under test
 import sys
@@ -121,29 +60,39 @@ def model_dump(self, **kwargs):
 # This prevents real AWS/MinIO/Elasticsearch calls during import
 patch('botocore.client.BaseClient._make_api_call', return_value={}).start()
 
+# Patch storage factory and MinIO config validation to avoid errors during initialization
+# These patches must be started before any imports that use MinioClient
+storage_client_mock = MagicMock()
 minio_client_mock = MagicMock()
 minio_client_mock._ensure_bucket_exists = MagicMock()
 minio_client_mock.client = MagicMock()
+patch('nexent.storage.storage_client_factory.create_storage_client_from_config', return_value=storage_client_mock).start()
+patch('nexent.storage.minio_config.MinIOStorageConfig.validate', lambda self: None).start()
+patch('backend.database.client.MinioClient', return_value=minio_client_mock).start()
+patch('database.client.MinioClient', return_value=minio_client_mock).start()
+patch('backend.database.client.minio_client', minio_client_mock).start()
+patch('nexent.vector_database.elasticsearch_core.ElasticSearchCore', return_value=MagicMock()).start()
+patch('nexent.vector_database.elasticsearch_core.Elasticsearch', return_value=MagicMock()).start()
+patch('elasticsearch.Elasticsearch', return_value=MagicMock()).start()
+
+from jinja2 import StrictUndefined
 
 # Mock database submodules BEFORE importing prompt_service
+sys.modules['database'] = MagicMock()
 sys.modules['database.agent_db'] = MagicMock()
 sys.modules['database.tool_db'] = MagicMock()
 sys.modules['database.model_management_db'] = MagicMock()
 sys.modules['database.knowledge_db'] = MagicMock()
-mock_database_client = MagicMock()
-mock_database_client.MinioClient.return_value = minio_client_mock
-mock_database_client.minio_client = minio_client_mock
-sys.modules['database.client'] = mock_database_client
-sys.modules['backend.database.client'] = mock_database_client
+sys.modules['database.client'] = MagicMock()
 sys.modules['database.db_models'] = MagicMock()
 
-from jinja2 import StrictUndefined
-
 # Mock utils
+sys.modules['utils'] = MagicMock()
 sys.modules['utils.llm_utils'] = MagicMock()
 sys.modules['utils.prompt_template_utils'] = MagicMock()
 
 # Mock services
+sys.modules['services'] = MagicMock()
 sys.modules['services.agent_service'] = MagicMock()
 sys.modules['services.prompt_template_service'] = MagicMock()
 
@@ -154,9 +103,6 @@ def model_dump(self, **kwargs):
     join_info_for_generate_system_prompt,
     join_info_for_optimize_prompt_section,
     optimize_prompt_section_impl,
-    PromptOptimizationService,
-    OptimizeRequest,
-    OptimizeResult,
 )
 
 
@@ -2116,128 +2062,6 @@ def mock_llm(model_id, content, sys_prompt, callback, tenant_id):
 
         self.assertGreater(len(result_list), 0)
 
-class TestPromptOptimizationService(unittest.TestCase):
-    """Tests for PromptOptimizationService Jiuwen SDK integration"""
-
-    @patch('backend.services.prompt_service.optimize_prompt_section_impl')
-    @patch('backend.services.prompt_service.ENABLE_JIUWEN_SDK', False)
-    def test_optimize_nexent_fallback_general_mode(self, mock_impl):
-        """nexent 模式: mode=general 应该调用 optimize_prompt_section_impl"""
-        mock_impl.return_value = {
-            "section_type": "duty",
-            "section_title": "智能体角色",
-            "original_content": "old",
-            "optimized_content": "new",
-        }
-
-        service = PromptOptimizationService(model_id=1, tenant_id="t", language="zh")
-        req = OptimizeRequest(
-            agent_id=1, model_id=1, task_description="task",
-            section_type="duty", section_title="智能体角色",
-            current_content="old", feedback="improve",
-            mode="general",
-        )
-        result = service.optimize(req)
-
-        self.assertEqual(result.source, "nexent")
-        self.assertEqual(result.optimized_content, "new")
-        mock_impl.assert_called_once()
-
-    @patch('backend.services.prompt_service.ENABLE_JIUWEN_SDK', False)
-    def test_optimize_nexent_fallback_insert_mode_raises(self):
-        """nexent 模式: mode=insert 应该抛出 NexentCapabilityError"""
-        from adapters.exception import NexentCapabilityError
-
-        service = PromptOptimizationService(model_id=1, tenant_id="t", language="zh")
-        req = OptimizeRequest(
-            agent_id=1, model_id=1, task_description="task",
-            section_type="duty", section_title="title",
-            current_content="old", feedback="improve",
-            mode="insert",
-        )
-        with self.assertRaises(NexentCapabilityError) as ctx:
-            service.optimize(req)
-        self.assertIn("insert", str(ctx.exception))
-
-    @patch('backend.services.prompt_service.ENABLE_JIUWEN_SDK', False)
-    def test_optimize_nexent_fallback_select_mode_raises(self):
-        """nexent 模式: mode=select 应该抛出 NexentCapabilityError"""
-        from adapters.exception import NexentCapabilityError
-
-        service = PromptOptimizationService(model_id=1, tenant_id="t", language="zh")
-        req = OptimizeRequest(
-            agent_id=1, model_id=1, task_description="task",
-            section_type="duty", section_title="title",
-            current_content="old", feedback="improve",
-            mode="select",
-        )
-        with self.assertRaises(NexentCapabilityError):
-            service.optimize(req)
-
-    @patch('backend.services.prompt_service.ENABLE_JIUWEN_SDK', False)
-    def test_optimize_badcase_nexent_raises(self):
-        """nexent 模式: badcase 优化应该抛出 NexentCapabilityError"""
-        from adapters.exception import NexentCapabilityError
-
-        service = PromptOptimizationService(model_id=1, tenant_id="t", language="zh")
-        with self.assertRaises(NexentCapabilityError) as ctx:
-            service.optimize_badcase(
-                current_content="old",
-                bad_cases=[{"question": "Q1", "answer": "A1"}],
-                agent_id=1, section_type="duty", section_title="title",
-            )
-        self.assertIn("badcase", str(ctx.exception))
-
-    @patch('backend.services.prompt_service.ENABLE_JIUWEN_SDK', True)
-    def test_is_jiuwen_mode_available_env_disabled(self):
-        """开关关闭时 Jiuwen SDK 不可用"""
-        from consts.const import ENABLE_JIUWEN_SDK
-
-        # Patch ENABLE_JIUWEN_SDK to False
-        with patch('backend.services.prompt_service.ENABLE_JIUWEN_SDK', False):
-            service = PromptOptimizationService(model_id=1, tenant_id="t", language="zh")
-            self.assertFalse(service.is_jiuwen_mode_available())
-
-    @patch('backend.services.prompt_service.ENABLE_JIUWEN_SDK', True)
-    def test_is_jiuwen_mode_available_openjiuwen_missing(self):
-        """openjiuwen 未安装时 Jiuwen SDK 不可用"""
-        service = PromptOptimizationService(model_id=1, tenant_id="t", language="zh")
-        with patch('builtins.__import__', side_effect=ModuleNotFoundError("No module named 'openjiuwen'")):
-            self.assertFalse(service.is_jiuwen_mode_available())
-
-    def test_optimize_request_dataclass_fields(self):
-        """OptimizeRequest dataclass 所有字段正确"""
-        req = OptimizeRequest(
-            agent_id=1, model_id=2, task_description="task",
-            section_type="duty", section_title="title",
-            current_content="old", feedback="improve",
-            mode="insert", start_pos=5, end_pos=10,
-            tool_ids=[1, 2], sub_agent_ids=[3],
-            knowledge_base_display_names=["kb1"],
-        )
-        self.assertEqual(req.agent_id, 1)
-        self.assertEqual(req.model_id, 2)
-        self.assertEqual(req.mode, "insert")
-        self.assertEqual(req.start_pos, 5)
-        self.assertEqual(req.end_pos, 10)
-        self.assertEqual(req.tool_ids, [1, 2])
-        self.assertEqual(req.sub_agent_ids, [3])
-        self.assertEqual(req.knowledge_base_display_names, ["kb1"])
-
-    def test_optimize_result_dataclass_fields(self):
-        """OptimizeResult dataclass 所有字段正确"""
-        res = OptimizeResult(
-            optimized_content="new",
-            source="jiuwen",
-            section_type="duty",
-            section_title="title",
-            original_content="old",
-        )
-        self.assertEqual(res.optimized_content, "new")
-        self.assertEqual(res.source, "jiuwen")
-        self.assertEqual(res.section_type, "duty")
-        self.assertEqual(res.section_title, "title")
-        self.assertEqual(res.original_content, "old")
     @patch('backend.services.prompt_service.get_enabled_sub_agent_description_for_generate_prompt')
     @patch('backend.services.prompt_service.get_enabled_tool_description_for_generate_prompt')
     def test_generate_and_save_system_prompt_impl_auto_detect_no_resources(
diff --git a/test/backend/services/test_prompt_template_service.py b/test/backend/services/test_prompt_template_service.py
index 48b27cd4c..34415b203 100644
--- a/test/backend/services/test_prompt_template_service.py
+++ b/test/backend/services/test_prompt_template_service.py
@@ -16,7 +16,6 @@ def _reset_prompt_template_service_modules():
     yield
     sys.modules.pop("services.prompt_template_service", None)
     sys.modules.pop("database.prompt_template_db", None)
-    sys.modules.pop("consts.model", None)
 
 
 @pytest.fixture
@@ -24,30 +23,20 @@ def prompt_template_models(monkeypatch):
     if BACKEND_PATH not in sys.path:
         sys.path.insert(0, BACKEND_PATH)
 
-    consts_model_module = types.ModuleType("consts.model")
+    nexent_module = types.ModuleType("nexent")
+    nexent_core_module = types.ModuleType("nexent.core")
+    nexent_agents_module = types.ModuleType("nexent.core.agents")
+    agent_model_module = types.ModuleType("nexent.core.agents.agent_model")
+    agent_model_module.ToolConfig = type("ToolConfig", (), {})
 
-    class PromptTemplateContentRequest:
-        def __init__(self, **kwargs):
-            for key, value in kwargs.items():
-                setattr(self, key, value)
-
-        def model_dump(self):
-            return dict(self.__dict__)
-
-    class PromptTemplateRequest:
-        def __init__(self, template_name, description, template_type, template_content_zh, template_content_en=None):
-            self.template_name = template_name
-            self.description = description
-            self.template_type = template_type
-            self.template_content_zh = template_content_zh
-            self.template_content_en = template_content_en
-
-    consts_model_module.PromptTemplateRequest = PromptTemplateRequest
-    consts_model_module.PromptTemplateContentRequest = PromptTemplateContentRequest
-    monkeypatch.setitem(sys.modules, "consts.model", consts_model_module)
+    monkeypatch.setitem(sys.modules, "nexent", nexent_module)
+    monkeypatch.setitem(sys.modules, "nexent.core", nexent_core_module)
+    monkeypatch.setitem(sys.modules, "nexent.core.agents", nexent_agents_module)
+    monkeypatch.setitem(sys.modules, "nexent.core.agents.agent_model", agent_model_module)
 
+    consts_model = importlib.import_module("consts.model")
     consts_exceptions = importlib.import_module("consts.exceptions")
-    return consts_model_module, consts_exceptions
+    return consts_model, consts_exceptions
 
 
 @pytest.fixture
diff --git a/test/backend/services/test_tool_configuration_service.py b/test/backend/services/test_tool_configuration_service.py
index 37035b839..29d2f75f6 100644
--- a/test/backend/services/test_tool_configuration_service.py
+++ b/test/backend/services/test_tool_configuration_service.py
@@ -4720,37 +4720,6 @@ def test_import_openapi_service_extract_title_as_fallback(self, mock_logger, moc
         call_kwargs = mock_upsert.call_args.kwargs
         assert call_kwargs["description"] == "API Title Only"
 
-    @patch('backend.services.tool_configuration_service.upsert_openapi_service')
-    @patch('backend.services.tool_configuration_service.logger')
-    def test_import_openapi_service_with_headers_template(self, mock_logger, mock_upsert):
-        """Test import_openapi_service passes headers_template to upsert."""
-        mock_upsert.return_value = {"service_name": "test_service"}
-        headers_template = {
-            "Authorization": "Bearer {{token}}",
-            "X-Tenant-ID": "{{tenant_id}}"
-        }
-
-        openapi_json = {
-            "info": {"description": "Test API"},
-            "paths": {}
-        }
-
-        from backend.services.tool_configuration_service import import_openapi_service
-        result = import_openapi_service(
-            service_name="test_service",
-            openapi_json=openapi_json,
-            server_url="http://api.example.com",
-            tenant_id="tenant1",
-            user_id="user1",
-            headers_template=headers_template
-        )
-
-        assert result["service_name"] == "test_service"
-        call_kwargs = mock_upsert.call_args.kwargs
-        assert call_kwargs["headers_template"] == headers_template
-        assert call_kwargs["description"] == "Test API"
-        mock_logger.info.assert_called_once()
-
     @patch('backend.services.tool_configuration_service.upsert_openapi_service')
     @patch('backend.services.tool_configuration_service.logger')
     def test_import_openapi_service_overrides_servers_url(self, mock_logger, mock_upsert):
diff --git a/test/backend/services/test_vectordatabase_service.py b/test/backend/services/test_vectordatabase_service.py
index 0fcb851c4..952aaad79 100644
--- a/test/backend/services/test_vectordatabase_service.py
+++ b/test/backend/services/test_vectordatabase_service.py
@@ -1050,7 +1050,7 @@ def test_list_indices_with_stats(self, mock_get_knowledge, mock_get_user_tenant,
         mock_get_knowledge.return_value = [
             {"index_name": "index1",
              "embedding_model_name": "test-model", "group_ids": "1,2", "knowledge_sources": "elasticsearch",
-             "ingroup_permission": "EDIT", "tenant_id": "test_tenant", "preserve_source_file": False},
+             "ingroup_permission": "EDIT", "tenant_id": "test_tenant"},
             {"index_name": "index2", "embedding_model_name": "test-model",
              "group_ids": "", "knowledge_sources": "elasticsearch", "ingroup_permission": "READ_ONLY",
              "tenant_id": "test_tenant"}
@@ -1078,10 +1078,6 @@ def test_list_indices_with_stats(self, mock_get_knowledge, mock_get_user_tenant,
         # index2 has empty group_ids, so it gets the tenant default group [1]
         self.assertEqual(result["indices_info"][1]["group_ids"], [1])
 
-        # Verify preserve_source_file is included in indices_info
-        self.assertFalse(result["indices_info"][0]["preserve_source_file"])
-        self.assertTrue(result["indices_info"][1]["preserve_source_file"])
-
         self.mock_vdb_core.get_user_indices.assert_called_once_with("*")
         self.mock_vdb_core.get_indices_detail.assert_called_once_with(
             ["index1", "index2"])
@@ -2273,78 +2269,6 @@ def test_delete_documents(self, mock_delete_file, mock_update_last_doc):
         # Verify that delete_file was called with the correct path
         mock_delete_file.assert_called_once_with("test_path")
 
-    @patch('backend.services.vectordatabase_service.delete_file')
-    @patch('backend.services.vectordatabase_service.file_exists', return_value=False)
-    def test_delete_source_file(self, mock_file_exists, mock_delete_file):
-        mock_delete_file.return_value = {"success": True}
-        result = ElasticSearchService.delete_source_file(
-            "knowledge_base/doc.pdf"
-        )
-        self.assertTrue(result["deleted_minio"])
-        mock_delete_file.assert_called()
-
-    @patch(
-        'backend.services.vectordatabase_service.get_all_files_status',
-        new_callable=AsyncMock,
-    )
-    @patch('backend.services.vectordatabase_service.delete_file')
-    def test_delete_document_by_scope_source_only(
-        self, mock_delete_file, mock_get_status
-    ):
-        mock_get_status.return_value = {
-            "knowledge_base/doc.pdf": {"state": "COMPLETED"}
-        }
-        mock_delete_file.return_value = {"success": True}
-
-        result = asyncio.run(
-            ElasticSearchService.delete_document_by_scope(
-                "test_index",
-                "knowledge_base/doc.pdf",
-                "source_only",
-                self.mock_vdb_core,
-            )
-        )
-
-        self.assertEqual(result["scope"], "source_only")
-        self.assertEqual(result["deleted_es_count"], 0)
-        self.mock_vdb_core.delete_documents.assert_not_called()
-
-    @patch(
-        'backend.services.vectordatabase_service.get_all_files_status',
-        new_callable=AsyncMock,
-    )
-    def test_delete_document_by_scope_rejects_processing(
-        self, mock_get_status
-    ):
-        mock_get_status.return_value = {
-            "knowledge_base/doc.pdf": {"state": "PROCESSING"}
-        }
-
-        with self.assertRaises(ValueError):
-            asyncio.run(
-                ElasticSearchService.delete_document_by_scope(
-                    "test_index",
-                    "knowledge_base/doc.pdf",
-                    "source_only",
-                    self.mock_vdb_core,
-                )
-            )
-
-    @patch('backend.services.vectordatabase_service.file_exists', return_value=False)
-    def test_compute_source_available_completed_missing_minio(self, _mock_exists):
-        available = ElasticSearchService._compute_source_available({
-            "path_or_url": "knowledge_base/doc.pdf",
-            "status": "COMPLETED",
-        })
-        self.assertFalse(available)
-
-    def test_compute_source_available_processing_defaults_true(self):
-        available = ElasticSearchService._compute_source_available({
-            "path_or_url": "knowledge_base/doc.pdf",
-            "status": "PROCESSING",
-        })
-        self.assertTrue(available)
-
     @patch('backend.services.vectordatabase_service.update_last_doc_update_time')
     @patch('backend.services.vectordatabase_service.get_redis_service')
     def test_index_documents_respects_cancellation_flag(self, mock_get_redis_service, mock_update_last_doc):
@@ -4253,172 +4177,73 @@ def test_get_embedding_model_multi_embedding_type(self, mock_get_model_by_displa
             # Restart the mock for other tests
             self.get_embedding_model_patcher.start()
 
-    @patch('backend.services.vectordatabase_service.get_model_records')
-    def test_get_embedding_model_no_model_name_no_records(self, mock_get_model_records):
+    def test_get_embedding_model_unknown_type(self):
         """
-        Test get_embedding_model when no model_name is provided and no records exist.
+        Test get_embedding_model when no model_name is provided.
 
         This test verifies that:
-        1. When no model_name is provided and no model records exist, returns (None, None)
-        2. Embedding models are queried before multi_embedding models
+        1. When no model_name is provided, the function returns (None, None)
+        2. The function handles missing model_name gracefully
         """
-        mock_get_model_records.side_effect = [
-            [],
-            [],
-        ]
-
+        # Stop the mock from setUp to test the real function
         self.get_embedding_model_patcher.stop()
 
         try:
+            # Execute - now we can call the real function
             from backend.services.vectordatabase_service import get_embedding_model
             result, model_id = get_embedding_model("test_tenant")
 
+            # Assert
             self.assertIsNone(result)
             self.assertIsNone(model_id)
-            mock_get_model_records.assert_any_call({"model_type": "embedding"}, "test_tenant")
-            mock_get_model_records.assert_any_call({"model_type": "multi_embedding"}, "test_tenant")
         finally:
+            # Restart the mock for other tests
             self.get_embedding_model_patcher.start()
 
-    @patch('backend.services.vectordatabase_service.get_model_records')
-    def test_get_embedding_model_default_embedding_record(self, mock_get_model_records):
-        """
-        Test get_embedding_model falls back to the newest embedding model when model_name is omitted.
+    def test_get_embedding_model_empty_type(self):
         """
-        mock_get_model_records.return_value = [{
-            "model_id": 101,
-            "model_type": "embedding",
-            "model_name": "default-embedding",
-            "model_repo": "openai",
-            "api_key": "test_api_key",
-            "base_url": "https://test.api.com",
-            "max_tokens": 1024,
-            "ssl_verify": True,
-        }]
-
-        self.get_embedding_model_patcher.stop()
-
-        try:
-            with patch('backend.services.vectordatabase_service.OpenAICompatibleEmbedding') as mock_embedding_class, \
-                    patch('backend.services.vectordatabase_service.get_model_name_from_config') as mock_get_model_name:
-                mock_embedding_instance = MagicMock()
-                mock_embedding_class.return_value = mock_embedding_instance
-                mock_get_model_name.return_value = "default-embedding"
-
-                from backend.services.vectordatabase_service import get_embedding_model
-                result, model_id = get_embedding_model("test_tenant")
-
-                self.assertEqual(result, mock_embedding_instance)
-                self.assertEqual(model_id, 101)
-                mock_get_model_records.assert_called_once_with({"model_type": "embedding"}, "test_tenant")
-        finally:
-            self.get_embedding_model_patcher.start()
+        Test get_embedding_model when no model_name is provided.
 
-    @patch('backend.services.vectordatabase_service.get_model_records')
-    def test_get_embedding_model_fallback_to_multi_embedding(self, mock_get_model_records):
-        """
-        Test get_embedding_model falls back to multi_embedding when no embedding model exists.
+        This test verifies that:
+        1. When no model_name is provided, the function returns (None, None)
+        2. The function handles missing model_name gracefully
         """
-        mock_get_model_records.side_effect = [
-            [],
-            [{
-                "model_id": 202,
-                "model_type": "multi_embedding",
-                "model_name": "default-multi-embedding",
-                "model_repo": "jina",
-                "api_key": "test_api_key",
-                "base_url": "https://test.api.com",
-                "max_tokens": 2048,
-                "ssl_verify": True,
-            }],
-        ]
-
+        # Stop the setUp mock; NOTE(review): body duplicates test_get_embedding_model_unknown_type
         self.get_embedding_model_patcher.stop()
 
         try:
-            with patch('backend.services.vectordatabase_service.JinaEmbedding') as mock_embedding_class, \
-                    patch('backend.services.vectordatabase_service.get_model_name_from_config') as mock_get_model_name:
-                mock_embedding_instance = MagicMock()
-                mock_embedding_class.return_value = mock_embedding_instance
-                mock_get_model_name.return_value = "default-multi-embedding"
-
-                from backend.services.vectordatabase_service import get_embedding_model
-                result, model_id = get_embedding_model("test_tenant")
+            # Execute - now we can call the real function
+            from backend.services.vectordatabase_service import get_embedding_model
+            result, model_id = get_embedding_model("test_tenant")
 
-                self.assertEqual(result, mock_embedding_instance)
-                self.assertEqual(model_id, 202)
-                self.assertEqual(mock_get_model_records.call_count, 2)
+            # Assert
+            self.assertIsNone(result)
+            self.assertIsNone(model_id)
         finally:
+            # Restart the mock for other tests
             self.get_embedding_model_patcher.start()
 
-    @patch('backend.services.vectordatabase_service.get_model_records')
-    def test_get_embedding_model_default_with_model_type_embedding(self, mock_get_model_records):
-        """
-        Test get_embedding_model queries by the provided model_type when model_name is omitted.
+    def test_get_embedding_model_missing_type(self):
         """
-        mock_get_model_records.return_value = [{
-            "model_id": 303,
-            "model_type": "embedding",
-            "model_name": "typed-embedding",
-            "model_repo": "openai",
-            "api_key": "test_api_key",
-            "base_url": "https://test.api.com",
-            "max_tokens": 1024,
-            "ssl_verify": True,
-        }]
-
-        self.get_embedding_model_patcher.stop()
-
-        try:
-            with patch('backend.services.vectordatabase_service.OpenAICompatibleEmbedding') as mock_embedding_class, \
-                    patch('backend.services.vectordatabase_service.get_model_name_from_config') as mock_get_model_name:
-                mock_embedding_instance = MagicMock()
-                mock_embedding_class.return_value = mock_embedding_instance
-                mock_get_model_name.return_value = "typed-embedding"
-
-                from backend.services.vectordatabase_service import get_embedding_model
-                result, model_id = get_embedding_model("test_tenant", model_type="embedding")
-
-                self.assertEqual(result, mock_embedding_instance)
-                self.assertEqual(model_id, 303)
-                mock_get_model_records.assert_called_once_with({"model_type": "embedding"}, "test_tenant")
-        finally:
-            self.get_embedding_model_patcher.start()
+        Test get_embedding_model when no model_name is provided.
 
-    @patch('backend.services.vectordatabase_service.get_model_records')
-    def test_get_embedding_model_default_with_model_type_multi_embedding(self, mock_get_model_records):
-        """
-        Test get_embedding_model queries multi_embedding records when model_type is specified.
+        This test verifies that:
+        1. When no model_name is provided, the function returns (None, None)
+        2. The function handles missing model_name gracefully
         """
-        mock_get_model_records.return_value = [{
-            "model_id": 404,
-            "model_type": "multi_embedding",
-            "model_name": "typed-multi-embedding",
-            "model_repo": "jina",
-            "api_key": "test_api_key",
-            "base_url": "https://test.api.com",
-            "max_tokens": 2048,
-            "ssl_verify": True,
-        }]
-
+        # Stop the setUp mock; NOTE(review): body duplicates test_get_embedding_model_unknown_type
         self.get_embedding_model_patcher.stop()
 
         try:
-            with patch('backend.services.vectordatabase_service.JinaEmbedding') as mock_embedding_class, \
-                    patch('backend.services.vectordatabase_service.get_model_name_from_config') as mock_get_model_name:
-                mock_embedding_instance = MagicMock()
-                mock_embedding_class.return_value = mock_embedding_instance
-                mock_get_model_name.return_value = "typed-multi-embedding"
-
-                from backend.services.vectordatabase_service import get_embedding_model
-                result, model_id = get_embedding_model("test_tenant", model_type="multi_embedding")
+            # Execute - now we can call the real function
+            from backend.services.vectordatabase_service import get_embedding_model
+            result, model_id = get_embedding_model("test_tenant")
 
-                self.assertEqual(result, mock_embedding_instance)
-                self.assertEqual(model_id, 404)
-                mock_get_model_records.assert_called_once_with(
-                    {"model_type": "multi_embedding"}, "test_tenant"
-                )
+            # Assert
+            self.assertIsNone(result)
+            self.assertIsNone(model_id)
         finally:
+            # Restart the mock for other tests
             self.get_embedding_model_patcher.start()
 
     @patch('backend.services.vectordatabase_service.get_model_by_display_name')
diff --git a/test/backend/utils/test_auth_utils.py b/test/backend/utils/test_auth_utils.py
index 83b31a6ee..af7fe0e1c 100644
--- a/test/backend/utils/test_auth_utils.py
+++ b/test/backend/utils/test_auth_utils.py
@@ -323,22 +323,6 @@ def test_get_current_user_id_with_mapping(monkeypatch):
     assert uid == "user-a" and tid == "tenant-a"
 
 
-def test_get_current_user_id_rejects_revoked_cas_session(monkeypatch):
-    monkeypatch.setattr(au, "IS_SPEED_MODE", False)
-    monkeypatch.setattr(au, "SUPABASE_JWT_SECRET", au.MOCK_JWT_SECRET_KEY)
-    monkeypatch.setattr(au, "SUPABASE_URL", "http://localhost:54321")
-    monkeypatch.setattr(au, "get_user_tenant_by_user_id",
-                        lambda u: {"tenant_id": "tenant-a"})
-    sys.modules["database.cas_session_db"] = MagicMock(
-        is_cas_session_active=MagicMock(return_value=False)
-    )
-
-    token = au.generate_session_jwt("user-a", 1000, session_id="cas-session-1")
-
-    with pytest.raises(UnauthorizedError, match="CAS session"):
-        au.get_current_user_id(token)
-
-
 def test_get_user_language_from_cookie():
     class Req:
         cookies = {"NEXT_LOCALE": "en"}
diff --git a/test/backend/utils/test_context_utils.py b/test/backend/utils/test_context_utils.py
index b58c46040..66e789477 100644
--- a/test/backend/utils/test_context_utils.py
+++ b/test/backend/utils/test_context_utils.py
@@ -162,6 +162,7 @@ def test_empty_inputs_produces_skeleton(self):
             few_shots="Q: hi?\nA: Hello!",
             app_name="Test",
             app_description="Test",
+            time_str="2026-01-01",
             user_id="test",
             language="zh",
             is_manager=False,
@@ -183,6 +184,7 @@ class MockTool:
             few_shots="Q?",
             app_name="Test",
             app_description="Test",
+            time_str="2026-01-01",
             user_id="test",
             language="zh",
             is_manager=False,
@@ -205,6 +207,7 @@ class MockTool:
             few_shots="Q?",
             app_name="Test",
             app_description="Test",
+            time_str="2026-01-01",
             user_id="test",
             language="zh",
             is_manager=False,
diff --git a/test/backend/utils/test_memory_utils.py b/test/backend/utils/test_memory_utils.py
index b887ab79f..134c38923 100644
--- a/test/backend/utils/test_memory_utils.py
+++ b/test/backend/utils/test_memory_utils.py
@@ -1,352 +1,415 @@
-import sys
-from types import SimpleNamespace
-from unittest.mock import MagicMock
-
 import pytest
+import sys
+from unittest.mock import patch, MagicMock
 
 # Setup common mocks
-from test.common.test_mocks import patch_minio_client_initialization, setup_common_mocks
+from test.common.test_mocks import setup_common_mocks, patch_minio_client_initialization, mock_constants
 
 # Initialize common mocks
 mocks = setup_common_mocks()
 
 # Patch storage factory before importing
 with patch_minio_client_initialization():
-    from backend.utils.memory_utils import _sanitize_index_component, build_memory_config
+    from backend.utils.memory_utils import build_memory_config
 
 
 @pytest.fixture
 def mock_model_configs():
-    """Fixture to provide mock model configurations."""
+    """Fixture to provide mock model configurations"""
     llm_config = {
         "model_name": "gpt-4",
         "model_repo": "openai",
         "base_url": "https://api.openai.com/v1",
-        "api_key": "test-llm-key",
+        "api_key": "test-llm-key"
     }
     embedding_config = {
         "model_name": "text-embedding-ada-002",
         "model_repo": "openai",
         "base_url": "https://api.openai.com/v1",
         "api_key": "test-embed-key",
-        "max_tokens": 1536,
+        "max_tokens": 1536
     }
     return {
         "llm_config": llm_config,
-        "embedding_config": embedding_config,
+        "embedding_config": embedding_config
     }
 
 
 @pytest.fixture
 def mock_tenant_config_manager():
-    """Fixture to provide mock tenant config manager."""
+    """Fixture to provide mock tenant config manager"""
     return MagicMock()
 
 
-@pytest.fixture
-def model_mapping():
-    """Fixture to provide deterministic model config mapping."""
-    return {"llm": "llm", "embedding": "embedding"}
-
+class TestMemoryUtils:
+    """Tests for backend.utils.memory_utils functions"""
 
-@pytest.fixture
-def mock_constants():
-    """Fixture to provide Elasticsearch-related constants."""
-    return SimpleNamespace(
-        ES_HOST="http://localhost:9200",
-        ES_API_KEY="test-es-key",
-        ES_USERNAME="elastic",
-        ES_PASSWORD="test-password",
-    )
+    def test_build_memory_config_success(self, mocker, mock_constants, mock_model_configs, mock_tenant_config_manager):
+        """Builds a complete configuration successfully"""
+        # Use global fixtures for common mocks
+        mock_llm_config = mock_model_configs['llm_config']
+        mock_embed_config = mock_model_configs['embedding_config']
 
+        # Mock get_model_config return sequence
+        mock_tenant_config_manager.get_model_config.side_effect = [
+            mock_llm_config,  # LLM
+            mock_embed_config  # embedding
+        ]
 
-@pytest.fixture
-def patch_memory_dependencies(mocker, mock_tenant_config_manager, mock_constants, model_mapping):
-    """Patch shared dependencies used by build_memory_config."""
-    mocker.patch("backend.utils.memory_utils.tenant_config_manager", mock_tenant_config_manager)
-    mocker.patch("backend.utils.memory_utils._c", mock_constants)
-    mocker.patch("backend.utils.memory_utils.MODEL_CONFIG_MAPPING", model_mapping)
-    return mock_tenant_config_manager, mock_constants
-
-
-class TestSanitizeIndexComponent:
-    """Tests for the index component sanitizer."""
-
-    @pytest.mark.parametrize(
-        ("value", "expected"),
-        [
-            ("OpenAI", "openai"),
-            ("azure/openai", "azure_openai"),
-            ("Model Name", "model_name"),
-            ("repo.name-1", "repo.name-1"),
-            ("MIXED/Chars@Here", "mixed_chars_here"),
-            ("", ""),
-        ],
-    )
-    def test_sanitize_index_component(self, value, expected):
-        """Sanitizer lowercases input and replaces unsupported characters."""
-        assert _sanitize_index_component(value) == expected
+        # Mock get_model_name_from_config
+        mock_get_model_name = MagicMock()
+        mock_get_model_name.side_effect = [
+            "openai/gpt-4", "openai/text-embedding-ada-002"]
 
+        # Provide deterministic mapping for model config keys
+        model_mapping = {"llm": "llm", "embedding": "embedding"}
 
-class TestMemoryUtils:
-    """Tests for backend.utils.memory_utils functions."""
-
-    def test_build_memory_config_success(
-        self,
-        mocker,
-        mock_model_configs,
-        patch_memory_dependencies,
-        mock_tenant_config_manager,
-        mock_constants,
-    ):
-        """Builds a complete configuration successfully."""
-        mock_llm_config = mock_model_configs["llm_config"]
-        mock_embed_config = mock_model_configs["embedding_config"]
-        mock_tenant_config_manager.get_model_config.side_effect = [mock_llm_config, mock_embed_config]
-
-        mock_get_model_name = mocker.patch(
-            "backend.utils.memory_utils.get_model_name_from_config",
-            side_effect=["openai/gpt-4", "openai/text-embedding-ada-002"],
-        )
+        mocker.patch('backend.utils.memory_utils.tenant_config_manager',
+                     mock_tenant_config_manager)
+        mocker.patch('backend.utils.memory_utils._c', mock_constants)
+        mocker.patch(
+            'backend.utils.memory_utils.get_model_name_from_config', mock_get_model_name)
+        mocker.patch(
+            'backend.utils.memory_utils.MODEL_CONFIG_MAPPING', model_mapping)
 
+        # Execute
         result = build_memory_config("test-tenant-id")
 
+        # Structure
         assert isinstance(result, dict)
-        assert result["llm"] == {
-            "provider": "openai",
-            "config": {
-                "model": "openai/gpt-4",
-                "openai_base_url": "https://api.openai.com/v1",
-                "api_key": "test-llm-key",
-            },
-        }
-        assert result["embedder"] == {
-            "provider": "openai",
-            "config": {
-                "model": "openai/text-embedding-ada-002",
-                "openai_base_url": "https://api.openai.com/v1",
-                "embedding_dims": 1536,
-                "api_key": "test-embed-key",
-            },
-        }
-        assert result["vector_store"] == {
-            "provider": "elasticsearch",
-            "config": {
-                "collection_name": "mem0_openai_text-embedding-ada-002_1536",
-                "host": "http://localhost",
-                "port": 9200,
-                "embedding_model_dims": 1536,
-                "verify_certs": False,
-                "api_key": mock_constants.ES_API_KEY,
-                "user": mock_constants.ES_USERNAME,
-                "password": mock_constants.ES_PASSWORD,
-            },
-        }
-        assert result["telemetry"] == {"enabled": False}
+        assert "llm" in result
+        assert "embedder" in result
+        assert "vector_store" in result
+        assert "telemetry" in result
+
+        # LLM
+        assert result["llm"]["provider"] == "openai"
+        assert result["llm"]["config"]["model"] == "openai/gpt-4"
+        assert result["llm"]["config"]["openai_base_url"] == "https://api.openai.com/v1"
+        assert result["llm"]["config"]["api_key"] == "test-llm-key"
+
+        # Embedder
+        assert result["embedder"]["provider"] == "openai"
+        assert result["embedder"]["config"]["model"] == "openai/text-embedding-ada-002"
+        assert result["embedder"]["config"]["openai_base_url"] == "https://api.openai.com/v1"
+        assert result["embedder"]["config"]["embedding_dims"] == 1536
+        assert result["embedder"]["config"]["api_key"] == "test-embed-key"
+
+        # Vector store
+        assert result["vector_store"]["provider"] == "elasticsearch"
+        assert result["vector_store"]["config"]["collection_name"] == "mem0_openai_text-embedding-ada-002_1536"
+        assert result["vector_store"]["config"]["host"] == "http://localhost"
+        assert result["vector_store"]["config"]["port"] == 9200
+        assert result["vector_store"]["config"]["embedding_model_dims"] == 1536
+        assert result["vector_store"]["config"]["verify_certs"] is False
+        assert result["vector_store"]["config"]["api_key"] == "test-es-key"
+        assert result["vector_store"]["config"]["user"] == "elastic"
+        assert result["vector_store"]["config"]["password"] == "test-password"
 
+        # Telemetry
+        assert result["telemetry"]["enabled"] is False
+
+        # get_model_name_from_config is called once per model config (LLM and embedding)
         assert mock_get_model_name.call_count == 2
         mock_get_model_name.assert_any_call(mock_llm_config)
         mock_get_model_name.assert_any_call(mock_embed_config)
-        assert mock_tenant_config_manager.get_model_config.call_count == 2
-
-    @pytest.mark.parametrize(
-        "llm_raw",
-        [None, {}, {"api_key": "test-key"}, {"model_name": ""}],
-    )
-    def test_build_memory_config_missing_llm_config(self, llm_raw, patch_memory_dependencies, mock_tenant_config_manager):
-        """Raises when LLM config is missing or incomplete."""
+
+    def test_build_memory_config_missing_llm_config(self, mocker, mock_tenant_config_manager):
+        """Raises when LLM config is missing"""
+        mock_tenant_config_manager.get_model_config.side_effect = [
+            None,  # LLM is None
+            {"model_name": "test-embed", "max_tokens": 1536}  # embedding present
+        ]
+
+        mocker.patch('backend.utils.memory_utils.tenant_config_manager',
+                     mock_tenant_config_manager)
+
+        # Should raise
+        with pytest.raises(ValueError) as exc_info:
+            build_memory_config("test-tenant-id")
+
+        assert "Missing LLM configuration for tenant" in str(exc_info.value)
+
+    def test_build_memory_config_llm_config_missing_model_name(self, mocker):
+        """Raises when LLM config lacks model_name"""
+        mock_tenant_config_manager = MagicMock()
+        mock_tenant_config_manager.get_model_config.side_effect = [
+            {"api_key": "test-key"},  # LLM missing model_name
+            {"model_name": "test-embed", "max_tokens": 1536}  # embedding present
+        ]
+
+        mocker.patch('backend.utils.memory_utils.tenant_config_manager',
+                     mock_tenant_config_manager)
+
+        # Should raise
+        with pytest.raises(ValueError) as exc_info:
+            build_memory_config("test-tenant-id")
+
+        assert "Missing LLM configuration for tenant" in str(exc_info.value)
+
+    def test_build_memory_config_missing_embedding_config(self, mocker, mock_tenant_config_manager):
+        """Raises when embedding config is missing"""
+        mock_tenant_config_manager.get_model_config.side_effect = [
+            {"model_name": "test-llm"},  # LLM present
+            None  # embedding is None
+        ]
+
+        mocker.patch('backend.utils.memory_utils.tenant_config_manager',
+                     mock_tenant_config_manager)
+
+        # Should raise
+        with pytest.raises(ValueError) as exc_info:
+            build_memory_config("test-tenant-id")
+
+        assert "Missing embedding-model configuration for tenant" in str(
+            exc_info.value)
+
+    def test_build_memory_config_embedding_config_missing_max_tokens(self, mocker):
+        """Raises when embedding config lacks max_tokens"""
+        mock_tenant_config_manager = MagicMock()
+        mock_tenant_config_manager.get_model_config.side_effect = [
+            {"model_name": "test-llm"},  # LLM present
+            {"model_name": "test-embed"}  # embedding missing max_tokens
+        ]
+
+        mocker.patch('backend.utils.memory_utils.tenant_config_manager',
+                     mock_tenant_config_manager)
+
+        # Should raise
+        with pytest.raises(ValueError) as exc_info:
+            build_memory_config("test-tenant-id")
+
+        assert "Missing embedding-model configuration for tenant" in str(
+            exc_info.value)
+
+    def test_build_memory_config_missing_es_host(self, mocker):
+        """Raises when ES_HOST is missing"""
+        mock_tenant_config_manager = MagicMock()
         mock_tenant_config_manager.get_model_config.side_effect = [
-            llm_raw,
-            {"model_name": "test-embed", "max_tokens": 1536},
+            {"model_name": "test-llm"},
+            {"model_name": "test-embed", "max_tokens": 1536}
         ]
 
-        with pytest.raises(ValueError, match="Missing LLM configuration for tenant"):
+        mock_const = MagicMock()
+        mock_const.ES_HOST = None  # ES_HOST is None
+
+        mocker.patch('backend.utils.memory_utils.tenant_config_manager',
+                     mock_tenant_config_manager)
+        mocker.patch('backend.utils.memory_utils._c', mock_const)
+
+        # Should raise
+        with pytest.raises(ValueError) as exc_info:
             build_memory_config("test-tenant-id")
 
-    @pytest.mark.parametrize(
-        "embed_raw",
-        [None, {}, {"model_name": "test-embed"}, {"model_name": "test-embed", "max_tokens": 0}],
-    )
-    def test_build_memory_config_missing_embedding_config(
-        self,
-        embed_raw,
-        patch_memory_dependencies,
-        mock_tenant_config_manager,
-    ):
-        """Raises when embedding config is missing or incomplete."""
+        assert "ES_HOST is not configured" in str(exc_info.value)
+
+    def test_build_memory_config_invalid_es_host_format(self, mocker):
+        """Raises when ES_HOST format is invalid"""
+        mock_tenant_config_manager = MagicMock()
         mock_tenant_config_manager.get_model_config.side_effect = [
             {"model_name": "test-llm"},
-            embed_raw,
+            {"model_name": "test-embed", "max_tokens": 1536}
         ]
 
-        with pytest.raises(ValueError, match="Missing embedding-model configuration for tenant"):
+        mock_const = MagicMock()
+        mock_const.ES_HOST = "invalid-host"  # invalid format
+
+        mocker.patch('backend.utils.memory_utils.tenant_config_manager',
+                     mock_tenant_config_manager)
+        mocker.patch('backend.utils.memory_utils._c', mock_const)
+
+        # Should raise
+        with pytest.raises(ValueError) as exc_info:
             build_memory_config("test-tenant-id")
 
-    @pytest.mark.parametrize("es_host", [None, ""])
-    def test_build_memory_config_missing_es_host(self, es_host, patch_memory_dependencies, mock_constants):
-        """Raises when ES_HOST is not configured."""
-        mock_constants.ES_HOST = es_host
+        assert "ES_HOST must include scheme, host and port" in str(
+            exc_info.value)
+
+    def test_build_memory_config_es_host_missing_scheme(self, mocker):
+        """Raises when ES_HOST is missing scheme"""
+        mock_tenant_config_manager = MagicMock()
+        mock_tenant_config_manager.get_model_config.side_effect = [
+            {"model_name": "test-llm"},
+            {"model_name": "test-embed", "max_tokens": 1536}
+        ]
+
+        mock_const = MagicMock()
+        mock_const.ES_HOST = "localhost:9200"  # missing scheme
+
+        mocker.patch('backend.utils.memory_utils.tenant_config_manager',
+                     mock_tenant_config_manager)
+        mocker.patch('backend.utils.memory_utils._c', mock_const)
 
-        with pytest.raises(ValueError, match="ES_HOST is not configured"):
+        # Should raise
+        with pytest.raises(ValueError) as exc_info:
             build_memory_config("test-tenant-id")
 
-    @pytest.mark.parametrize(
-        "es_host",
-        [
-            "invalid-host",
-            "localhost:9200",
-            "http://localhost",
-            "http://:9200",
-        ],
-    )
-    def test_build_memory_config_invalid_es_host_format(self, es_host, patch_memory_dependencies, mock_tenant_config_manager, mock_constants):
-        """Raises when ES_HOST is missing required URL parts."""
+        assert "ES_HOST must include scheme, host and port" in str(
+            exc_info.value)
+
+    def test_build_memory_config_es_host_missing_port(self, mocker):
+        """Raises when ES_HOST is missing port"""
+        mock_tenant_config_manager = MagicMock()
         mock_tenant_config_manager.get_model_config.side_effect = [
             {"model_name": "test-llm"},
-            {"model_name": "test-embed", "max_tokens": 1536},
+            {"model_name": "test-embed", "max_tokens": 1536}
         ]
-        mock_constants.ES_HOST = es_host
 
-        with pytest.raises(
-            ValueError,
-            match="ES_HOST must include scheme, host and port, e.g. http://host:9200",
-        ):
+        mock_const = MagicMock()
+        mock_const.ES_HOST = "http://localhost"  # missing port
+
+        mocker.patch('backend.utils.memory_utils.tenant_config_manager',
+                     mock_tenant_config_manager)
+        mocker.patch('backend.utils.memory_utils._c', mock_const)
+
+        # Should raise
+        with pytest.raises(ValueError) as exc_info:
             build_memory_config("test-tenant-id")
 
-    def test_build_memory_config_with_https_es_host(
-        self,
-        mocker,
-        patch_memory_dependencies,
-        mock_tenant_config_manager,
-        mock_constants,
-    ):
-        """HTTPS ES host is parsed correctly."""
+        assert "ES_HOST must include scheme, host and port" in str(
+            exc_info.value)
+
+    def test_build_memory_config_with_https_es_host(self, mocker):
+        """HTTPS ES_HOST is parsed correctly and collection name composes"""
+        mock_tenant_config_manager = MagicMock()
         mock_tenant_config_manager.get_model_config.side_effect = [
-            {
-                "model_name": "test-llm",
-                "model_repo": "openai",
-                "base_url": "https://api.openai.com/v1",
-                "api_key": "test-llm-key",
-            },
-            {
-                "model_name": "test-embed",
-                "model_repo": "openai",
-                "base_url": "https://api.openai.com/v1",
-                "api_key": "test-embed-key",
-                "max_tokens": 1536,
-            },
+            {"model_name": "test-llm", "model_repo": "openai",
+                "base_url": "https://api.openai.com/v1", "api_key": "test-llm-key"},
+            {"model_name": "test-embed", "model_repo": "openai",
+                "base_url": "https://api.openai.com/v1", "api_key": "test-embed-key", "max_tokens": 1536}
         ]
-        mock_constants.ES_HOST = "https://elastic.example.com:9200"
+
+        mock_const = MagicMock()
+        mock_const.ES_HOST = "https://elastic.example.com:9200"
+        mock_const.ES_API_KEY = "test-es-key"
+        mock_const.ES_USERNAME = "elastic"
+        mock_const.ES_PASSWORD = "test-password"
+
+        mock_get_model_name = MagicMock()
+        mock_get_model_name.side_effect = [
+            "openai/test-llm", "openai/test-embed"]
+
+        model_mapping = {"llm": "llm", "embedding": "embedding"}
+        mocker.patch('backend.utils.memory_utils.tenant_config_manager',
+                     mock_tenant_config_manager)
+        mocker.patch('backend.utils.memory_utils._c', mock_const)
+        mocker.patch(
+            'backend.utils.memory_utils.get_model_name_from_config', mock_get_model_name)
         mocker.patch(
-            "backend.utils.memory_utils.get_model_name_from_config",
-            side_effect=["openai/test-llm", "openai/test-embed"],
-        )
+            'backend.utils.memory_utils.MODEL_CONFIG_MAPPING', model_mapping)
 
+        # Execute
         result = build_memory_config("test-tenant-id")
 
+        # ES fields
         assert result["vector_store"]["config"]["host"] == "https://elastic.example.com"
         assert result["vector_store"]["config"]["port"] == 9200
         assert result["vector_store"]["config"]["collection_name"] == "mem0_openai_test-embed_1536"
 
-    def test_build_memory_config_with_custom_port(
-        self,
-        mocker,
-        patch_memory_dependencies,
-        mock_tenant_config_manager,
-        mock_constants,
-    ):
-        """Custom ES port is parsed and applied."""
+    def test_build_memory_config_with_custom_port(self, mocker):
+        """Custom ES port is parsed and applied; collection name composed"""
+        mock_tenant_config_manager = MagicMock()
         mock_tenant_config_manager.get_model_config.side_effect = [
-            {
-                "model_name": "test-llm",
-                "model_repo": "openai",
-                "base_url": "https://api.openai.com/v1",
-                "api_key": "test-llm-key",
-            },
-            {
-                "model_name": "test-embed",
-                "model_repo": "openai",
-                "base_url": "https://api.openai.com/v1",
-                "api_key": "test-embed-key",
-                "max_tokens": 1536,
-            },
+            {"model_name": "test-llm", "model_repo": "openai",
+                "base_url": "https://api.openai.com/v1", "api_key": "test-llm-key"},
+            {"model_name": "test-embed", "model_repo": "openai",
+                "base_url": "https://api.openai.com/v1", "api_key": "test-embed-key", "max_tokens": 1536}
         ]
-        mock_constants.ES_HOST = "http://localhost:9300"
+
+        mock_const = MagicMock()
+        mock_const.ES_HOST = "http://localhost:9300"  # custom port
+        mock_const.ES_API_KEY = "test-es-key"
+        mock_const.ES_USERNAME = "elastic"
+        mock_const.ES_PASSWORD = "test-password"
+
+        mock_get_model_name = MagicMock()
+        mock_get_model_name.side_effect = [
+            "openai/test-llm", "openai/test-embed"]
+
+        model_mapping = {"llm": "llm", "embedding": "embedding"}
+        mocker.patch('backend.utils.memory_utils.tenant_config_manager',
+                     mock_tenant_config_manager)
+        mocker.patch('backend.utils.memory_utils._c', mock_const)
         mocker.patch(
-            "backend.utils.memory_utils.get_model_name_from_config",
-            side_effect=["openai/test-llm", "openai/test-embed"],
-        )
+            'backend.utils.memory_utils.get_model_name_from_config', mock_get_model_name)
+        mocker.patch(
+            'backend.utils.memory_utils.MODEL_CONFIG_MAPPING', model_mapping)
 
+        # Execute
         result = build_memory_config("test-tenant-id")
 
+        # ES fields
         assert result["vector_store"]["config"]["host"] == "http://localhost"
         assert result["vector_store"]["config"]["port"] == 9300
         assert result["vector_store"]["config"]["collection_name"] == "mem0_openai_test-embed_1536"
 
-    def test_build_memory_config_sanitizes_repo_and_name(
-        self,
-        mocker,
-        patch_memory_dependencies,
-        mock_tenant_config_manager,
-    ):
-        """Collection name sanitizes repo and model name through the helper."""
+    def test_build_memory_config_sanitizes_slashes_in_repo_and_name(self, mocker):
+        """Slash characters in repo/name are replaced with underscores in collection name"""
+        mock_tenant_config_manager = MagicMock()
         mock_tenant_config_manager.get_model_config.side_effect = [
-            {
-                "model_name": "gpt-4",
-                "model_repo": "Azure/OpenAI Repo",
-                "base_url": "https://api.example.com/v1",
-                "api_key": "llm-key",
-            },
-            {
-                "model_name": "Text Embed@Ada/002",
-                "model_repo": "Azure/OpenAI Repo",
-                "base_url": "https://api.example.com/v1",
-                "api_key": "embed-key",
-                "max_tokens": 1536,
-            },
+            {"model_name": "gpt-4", "model_repo": "azure/openai",
+                "base_url": "https://api.example.com/v1", "api_key": "llm-key"},
+            {"model_name": "text-embed/ada-002", "model_repo": "azure/openai",
+                "base_url": "https://api.example.com/v1", "api_key": "embed-key", "max_tokens": 1536}
         ]
+
+        mock_const = MagicMock()
+        mock_const.ES_HOST = "http://localhost:9200"
+        mock_const.ES_API_KEY = "test-es-key"
+        mock_const.ES_USERNAME = "elastic"
+        mock_const.ES_PASSWORD = "test-password"
+
+        model_mapping = {"llm": "llm", "embedding": "embedding"}
+        mock_get_model_name = MagicMock()
+        mock_get_model_name.side_effect = [
+            "azure/openai/gpt-4", "azure/openai/text-embed/ada-002"]
+
+        mocker.patch('backend.utils.memory_utils.tenant_config_manager',
+                     mock_tenant_config_manager)
+        mocker.patch('backend.utils.memory_utils._c', mock_const)
+        mocker.patch(
+            'backend.utils.memory_utils.get_model_name_from_config', mock_get_model_name)
         mocker.patch(
-            "backend.utils.memory_utils.get_model_name_from_config",
-            side_effect=["azure/openai/gpt-4", "azure/openai/Text Embed@Ada/002"],
-        )
-
-        result = build_memory_config("tenant-with-special-chars")
-
-        assert result["vector_store"]["config"]["collection_name"] == (
-            "mem0_azure_openai_repo_text_embed_ada_002_1536"
-        )
-
-    @pytest.mark.parametrize("repo_value", ["", None])
-    def test_build_memory_config_without_repo_segment(
-        self,
-        repo_value,
-        mocker,
-        patch_memory_dependencies,
-        mock_tenant_config_manager,
-    ):
-        """Falsy model_repo omits the repo segment from the collection name."""
+            'backend.utils.memory_utils.MODEL_CONFIG_MAPPING', model_mapping)
+
+        result = build_memory_config("tenant-with-slash")
+
+        assert result["vector_store"]["config"]["collection_name"] == "mem0_azure_openai_text-embed_ada-002_1536"
+
+    def test_build_memory_config_with_empty_model_repo(self, mocker):
+        """Empty model_repo yields collection name without repo segment"""
+        mock_tenant_config_manager = MagicMock()
         mock_tenant_config_manager.get_model_config.side_effect = [
-            {
-                "model_name": "gpt-4",
-                "model_repo": repo_value,
-                "base_url": "https://api.openai.com/v1",
-                "api_key": "test-llm-key",
-            },
-            {
-                "model_name": "Text Embedding/ADA 002",
-                "model_repo": repo_value,
-                "base_url": "https://api.openai.com/v1",
-                "api_key": "test-embed-key",
-                "max_tokens": 1536,
-            },
+            {"model_name": "gpt-4", "model_repo": "",
+                "base_url": "https://api.openai.com/v1", "api_key": "test-llm-key"},
+            {"model_name": "text-embedding-ada-002", "model_repo": "",
+                "base_url": "https://api.openai.com/v1", "api_key": "test-embed-key", "max_tokens": 1536}
         ]
+
+        mock_const = MagicMock()
+        mock_const.ES_HOST = "http://localhost:9200"
+        mock_const.ES_API_KEY = "test-es-key"
+        mock_const.ES_USERNAME = "elastic"
+        mock_const.ES_PASSWORD = "test-password"
+
+        mock_get_model_name = MagicMock()
+        mock_get_model_name.side_effect = [
+            "gpt-4", "text-embedding-ada-002"]  # no repo prefix
+
+        model_mapping = {"llm": "llm", "embedding": "embedding"}
+        mocker.patch('backend.utils.memory_utils.tenant_config_manager',
+                     mock_tenant_config_manager)
+        mocker.patch('backend.utils.memory_utils._c', mock_const)
+        mocker.patch(
+            'backend.utils.memory_utils.get_model_name_from_config', mock_get_model_name)
         mocker.patch(
-            "backend.utils.memory_utils.get_model_name_from_config",
-            side_effect=["gpt-4", "Text Embedding/ADA 002"],
-        )
+            'backend.utils.memory_utils.MODEL_CONFIG_MAPPING', model_mapping)
 
+        # Execute
         result = build_memory_config("test-tenant-id")
 
+        # Model names
         assert result["llm"]["config"]["model"] == "gpt-4"
-        assert result["embedder"]["config"]["model"] == "Text Embedding/ADA 002"
-        assert result["vector_store"]["config"]["collection_name"] == "mem0_text_embedding_ada_002_1536"
+        assert result["embedder"]["config"]["model"] == "text-embedding-ada-002"
+        # Collection name omits empty repo segment
+        assert result["vector_store"]["config"]["collection_name"] == "mem0_text-embedding-ada-002_1536"
diff --git a/test/conftest.py b/test/conftest.py
index 246d784a5..4acb6aded 100644
--- a/test/conftest.py
+++ b/test/conftest.py
@@ -26,8 +26,6 @@
     "mem0.configs.embeddings.base": MagicMock(),
 }
 
-_optional_sdk_stubs = {}
-
 # Add backend and sdk directories to sys.path so that modules can be imported
 # as `from backend.xxx import ...` and `from sdk.xxx import ...`
 _test_root = os.path.dirname(os.path.abspath(__file__))
@@ -39,9 +37,6 @@
 if _sdk_dir not in sys.path:
     sys.path.insert(0, _sdk_dir)
 
-sys.modules.update({k: v for k, v in _mem0_stubs.items() if k not in sys.modules})
-sys.modules.update({k: v for k, v in _optional_sdk_stubs.items() if k not in sys.modules})
-
 _tmp_root = os.path.abspath(os.path.join(_test_root, "..", ".pytest-tmp"))
 os.makedirs(_tmp_root, exist_ok=True)
 os.environ.setdefault("TMP", _tmp_root)
diff --git a/test/sdk/container/test_docker_client.py b/test/sdk/container/test_docker_client.py
index 816159a00..e30f6bfdc 100644
--- a/test/sdk/container/test_docker_client.py
+++ b/test/sdk/container/test_docker_client.py
@@ -1627,10 +1627,10 @@ def test_ensure_network_exists(self, docker_container_client):
         mock_network = MagicMock()
         docker_container_client.client.networks.get.return_value = mock_network
 
-        docker_container_client._ensure_network("nexent_network")
+        docker_container_client._ensure_network("nexent_nexent")
 
         docker_container_client.client.networks.get.assert_called_once_with(
-            "nexent_network")
+            "nexent_nexent")
         docker_container_client.client.networks.create.assert_not_called()
 
     def test_ensure_network_create_new(self, docker_container_client):
@@ -1640,12 +1640,12 @@ def test_ensure_network_create_new(self, docker_container_client):
         mock_network = MagicMock()
         docker_container_client.client.networks.create.return_value = mock_network
 
-        docker_container_client._ensure_network("nexent_network")
+        docker_container_client._ensure_network("nexent_nexent")
 
         docker_container_client.client.networks.get.assert_called_once_with(
-            "nexent_network")
+            "nexent_nexent")
         docker_container_client.client.networks.create.assert_called_once_with(
-            "nexent_network")
+            "nexent_nexent")
 
     def test_ensure_network_race_condition(self, docker_container_client):
         """Test ensuring network when race condition occurs (another process creates it)"""
@@ -1657,7 +1657,7 @@ def test_ensure_network_race_condition(self, docker_container_client):
         docker_container_client.client.networks.create.side_effect = APIError(
             "Network already exists")
 
-        docker_container_client._ensure_network("nexent_network")
+        docker_container_client._ensure_network("nexent_nexent")
 
         assert docker_container_client.client.networks.get.call_count == 2
         docker_container_client.client.networks.create.assert_called_once()
@@ -1672,7 +1672,7 @@ def test_ensure_network_create_fails_then_get_fails(self, docker_container_clien
             "Create failed")
 
         with pytest.raises(ContainerError, match="Failed to create or get Docker network"):
-            docker_container_client._ensure_network("nexent_network")
+            docker_container_client._ensure_network("nexent_nexent")
 
     def test_ensure_network_get_api_error(self, docker_container_client):
         """Test ensuring network when get raises APIError"""
@@ -1680,7 +1680,7 @@ def test_ensure_network_get_api_error(self, docker_container_client):
             "API error")
 
         with pytest.raises(ContainerError, match="Failed to get Docker network"):
-            docker_container_client._ensure_network("nexent_network")
+            docker_container_client._ensure_network("nexent_nexent")
 
 
 # ---------------------------------------------------------------------------
diff --git a/test/sdk/container/test_k8s_client.py b/test/sdk/container/test_k8s_client.py
index 84e0bc557..42db8c58c 100644
--- a/test/sdk/container/test_k8s_client.py
+++ b/test/sdk/container/test_k8s_client.py
@@ -11,7 +11,6 @@
     KubernetesContainerClient,
     ContainerError,
     ContainerConnectionError,
-    _sanitize_k8s_name,
 )
 from nexent.container.k8s_config import KubernetesContainerConfig
 
@@ -91,79 +90,6 @@ def mock_pod():
     return pod
 
 
-# ---------------------------------------------------------------------------
-# Test _sanitize_k8s_name
-# ---------------------------------------------------------------------------
-
-
-class TestSanitizeK8sName:
-    """Test _sanitize_k8s_name helper function"""
-
-    def test_sanitize_basic_alphanumeric(self):
-        """Test basic alphanumeric string passes through"""
-        assert _sanitize_k8s_name("test-service") == "test-service"
-        assert _sanitize_k8s_name("abc123") == "abc123"
-
-    def test_sanitize_lowercase_conversion(self):
-        """Test uppercase letters are converted to lowercase"""
-        assert _sanitize_k8s_name("TestService") == "testservice"
-        assert _sanitize_k8s_name("UPPERCASE") == "uppercase"
-
-    def test_sanitize_special_characters_replaced(self):
-        """Test special characters are replaced with dash"""
-        assert _sanitize_k8s_name("test@service") == "test-service"
-        assert _sanitize_k8s_name("foo#bar") == "foo-bar"
-        assert _sanitize_k8s_name("test$123") == "test-123"
-
-    def test_sanitize_consecutive_special_chars(self):
-        """Test consecutive special characters are collapsed to single dash"""
-        assert _sanitize_k8s_name("foo@@bar") == "foo-bar"
-        assert _sanitize_k8s_name("test@#$service") == "test-service"
-        assert _sanitize_k8s_name("a!!b") == "a-b"
-
-    def test_sanitize_leading_special_chars(self):
-        """Test leading special characters are removed"""
-        assert _sanitize_k8s_name("@test") == "test"
-        assert _sanitize_k8s_name("#foo") == "foo"
-        assert _sanitize_k8s_name("!test@service") == "test-service"
-
-    def test_sanitize_trailing_special_chars(self):
-        """Test trailing special characters are removed"""
-        assert _sanitize_k8s_name("test@") == "test"
-        assert _sanitize_k8s_name("test-service!") == "test-service"
-
-    def test_sanitize_mixed_case_with_specials(self):
-        """Test mixed case with special characters"""
-        assert _sanitize_k8s_name("Foo@Bar!Test") == "foo-bar-test"
-
-    def test_sanitize_empty_string(self):
-        """Test empty string returns 'unknown'"""
-        assert _sanitize_k8s_name("") == "unknown"
-
-    def test_sanitize_only_special_chars(self):
-        """Test string with only special characters returns 'unknown'"""
-        assert _sanitize_k8s_name("@@@") == "unknown"
-        assert _sanitize_k8s_name("!@#") == "unknown"
-
-    def test_sanitize_none(self):
-        """Test None returns 'unknown'"""
-        assert _sanitize_k8s_name(None) == "unknown"
-
-    def test_sanitize_with_dots(self):
-        """Test dots are converted to dashes"""
-        assert _sanitize_k8s_name("foo.bar") == "foo-bar"
-        assert _sanitize_k8s_name("foo...bar") == "foo-bar"
-
-    def test_sanitize_underscore_replaced(self):
-        """Test underscores are replaced with dash"""
-        assert _sanitize_k8s_name("foo_bar") == "foo-bar"
-
-    def test_sanitize_spaces_replaced(self):
-        """Test spaces are replaced with dash"""
-        assert _sanitize_k8s_name("foo bar") == "foo-bar"
-        assert _sanitize_k8s_name("foo  bar") == "foo-bar"
-
-
 # ---------------------------------------------------------------------------
 # Test KubernetesContainerClient.__init__
 # ---------------------------------------------------------------------------
@@ -266,72 +192,6 @@ def test_generate_pod_name_with_special_chars(self, k8s_container_client):
             assert "@" not in name
             assert "#" not in name
 
-    def test_generate_pod_name_consecutive_special_chars(self, k8s_container_client):
-        """Test pod name generation with consecutive special characters"""
-        with patch("nexent.container.k8s_client.uuid.uuid4") as mock_uuid:
-            mock_uuid.return_value.hex = "a1b2c3d4"
-            name = k8s_container_client._generate_pod_name(
-                "foo@@bar", "tenant123", "user12345")
-            assert name == "mcp-foo-bar-tenant12-user1234-a1b2c3d4"
-            assert "--" not in name
-
-    def test_generate_pod_name_leading_special_chars(self, k8s_container_client):
-        """Test pod name generation with leading special characters"""
-        with patch("nexent.container.k8s_client.uuid.uuid4") as mock_uuid:
-            mock_uuid.return_value.hex = "a1b2c3d4"
-            name = k8s_container_client._generate_pod_name(
-                "@test-service", "tenant123", "user12345")
-            # "@test-service" -> "test-service" (leading @ stripped)
-            assert name.startswith("mcp-test")
-            assert not name.startswith("mcp-@")
-
-    def test_generate_pod_name_trailing_special_chars(self, k8s_container_client):
-        """Test pod name generation with trailing special characters"""
-        with patch("nexent.container.k8s_client.uuid.uuid4") as mock_uuid:
-            mock_uuid.return_value.hex = "a1b2c3d4"
-            name = k8s_container_client._generate_pod_name(
-                "test-service@", "tenant123", "user12345")
-            assert name == "mcp-test-service-tenant12-user1234-a1b2c3d4"
-            assert name.endswith("-a1b2c3d4")
-
-    def test_generate_pod_name_uppercase(self, k8s_container_client):
-        """Test pod name generation with uppercase letters"""
-        with patch("nexent.container.k8s_client.uuid.uuid4") as mock_uuid:
-            mock_uuid.return_value.hex = "a1b2c3d4"
-            name = k8s_container_client._generate_pod_name(
-                "TestService", "tenant123", "user12345")
-            assert name == "mcp-testservice-tenant12-user1234-a1b2c3d4"
-
-    def test_generate_pod_name_underscores(self, k8s_container_client):
-        """Test pod name generation with underscores"""
-        with patch("nexent.container.k8s_client.uuid.uuid4") as mock_uuid:
-            mock_uuid.return_value.hex = "a1b2c3d4"
-            name = k8s_container_client._generate_pod_name(
-                "test_service", "tenant_123", "user_12345")
-            # tenant_123 -> tenant-123 (9 chars), truncated to 8 -> tenant-1
-            # user_12345 -> user-12345 (10 chars), truncated to 8 -> user-123
-            assert name == "mcp-test-service-tenant-1-user-123-a1b2c3d4"
-
-    def test_generate_pod_name_dots(self, k8s_container_client):
-        """Test pod name generation with dots"""
-        with patch("nexent.container.k8s_client.uuid.uuid4") as mock_uuid:
-            mock_uuid.return_value.hex = "a1b2c3d4"
-            name = k8s_container_client._generate_pod_name(
-                "test.service", "tenant.123", "user.12345")
-            # tenant.123 -> tenant.123 (9 chars), truncated to 8 -> tenant.1
-            # user.12345 -> user.12345 (10 chars), truncated to 8 -> user.123
-            assert name == "mcp-test-service-tenant-1-user-123-a1b2c3d4"
-
-    def test_generate_pod_name_spaces(self, k8s_container_client):
-        """Test pod name generation with spaces"""
-        with patch("nexent.container.k8s_client.uuid.uuid4") as mock_uuid:
-            mock_uuid.return_value.hex = "a1b2c3d4"
-            name = k8s_container_client._generate_pod_name(
-                "test service", "tenant 123", "user 12345")
-            # tenant 123 -> tenant 123 (9 chars), truncated to 8 -> tenant 1
-            # user 12345 -> user 12345 (10 chars), truncated to 8 -> user 123
-            assert name == "mcp-test-service-tenant-1-user-123-a1b2c3d4"
-
     def test_generate_pod_name_long_user_id(self, k8s_container_client):
         """Test pod name generation with long user ID"""
         long_user_id = "a" * 20
@@ -356,7 +216,7 @@ def test_generate_pod_name_empty_tenant(self, k8s_container_client):
             mock_uuid.return_value.hex = "a1b2c3d4"
             name = k8s_container_client._generate_pod_name(
                 "test-service", "", "user12345")
-            assert name == "mcp-test-service-unknown-user1234-a1b2c3d4"
+            assert name == "mcp-test-service--user1234-a1b2c3d4"
 
     def test_generate_pod_name_empty_user(self, k8s_container_client):
         """Test pod name generation with empty user_id"""
@@ -364,7 +224,7 @@ def test_generate_pod_name_empty_user(self, k8s_container_client):
             mock_uuid.return_value.hex = "a1b2c3d4"
             name = k8s_container_client._generate_pod_name(
                 "test-service", "tenant123", "")
-            assert name == "mcp-test-service-tenant12-unknown-a1b2c3d4"
+            assert name == "mcp-test-service-tenant12--a1b2c3d4"
 
     def test_generate_pod_name_none_tenant(self, k8s_container_client):
         """Test pod name generation with None tenant_id"""
@@ -372,7 +232,7 @@ def test_generate_pod_name_none_tenant(self, k8s_container_client):
             mock_uuid.return_value.hex = "a1b2c3d4"
             name = k8s_container_client._generate_pod_name(
                 "test-service", None, "user12345")
-            assert name == "mcp-test-service-unknown-user1234-a1b2c3d4"
+            assert name == "mcp-test-service--user1234-a1b2c3d4"
 
     def test_generate_pod_name_none_user(self, k8s_container_client):
         """Test pod name generation with None user_id"""
@@ -380,7 +240,7 @@ def test_generate_pod_name_none_user(self, k8s_container_client):
             mock_uuid.return_value.hex = "a1b2c3d4"
             name = k8s_container_client._generate_pod_name(
                 "test-service", "tenant123", None)
-            assert name == "mcp-test-service-tenant12-unknown-a1b2c3d4"
+            assert name == "mcp-test-service-tenant12--a1b2c3d4"
 
 
 # ---------------------------------------------------------------------------
@@ -1405,26 +1265,6 @@ def test_list_containers_service_filter_special_chars(self, k8s_container_client
 
         assert len(result) == 0
 
-    def test_list_containers_service_filter_consecutive_special_chars(self, k8s_container_client, mock_pod):
-        """Test listing containers with service filter containing consecutive special characters"""
-        k8s_container_client.core_v1.list_namespaced_pod.return_value = MagicMock(items=[mock_pod])
-
-        # The sanitized version of "test@@service" is "test-service"
-        # Since mock_pod's component is "test-service", it should match
-        result = k8s_container_client.list_containers(service_name="test@@service")
-
-        assert len(result) == 1
-
-    def test_list_containers_service_filter_leading_special_chars(self, k8s_container_client, mock_pod):
-        """Test listing containers with service filter containing leading special characters"""
-        k8s_container_client.core_v1.list_namespaced_pod.return_value = MagicMock(items=[mock_pod])
-
-        # The sanitized version of "@test-service" is "test-service" (leading @ stripped)
-        # Since mock_pod's component is "test-service", it should match
-        result = k8s_container_client.list_containers(service_name="@test-service")
-
-        assert len(result) == 1
-
     def test_list_containers_pod_no_ports(self, k8s_container_client):
         """Test listing containers when pod has no ports configured"""
         mock_pod_no_ports = MagicMock()
diff --git a/test/sdk/core/agents/test_agent_model.py b/test/sdk/core/agents/test_agent_model.py
index 66856fda1..19963d7b4 100644
--- a/test/sdk/core/agents/test_agent_model.py
+++ b/test/sdk/core/agents/test_agent_model.py
@@ -1259,34 +1259,6 @@ def test_agent_config_max_steps_rejects_out_of_bounds(self):
             )
 
 
-class TestAgentVerificationConfig:
-    """Tests for layered ReAct verification configuration."""
-
-    def test_default_verification_config_is_enabled(self):
-        config = agent_model_module.AgentVerificationConfig()
-
-        assert config.enabled is True
-        assert config.step_verification_enabled is True
-        assert config.final_verification_enabled is True
-        assert config.max_final_rounds == 2
-        assert "final_answer" in config.critical_events
-
-    def test_agent_config_has_default_verification_config(self):
-        config = agent_model_module.AgentConfig(
-            name="verified_agent",
-            description="Agent with default verification",
-            tools=[],
-            model_name="test",
-        )
-
-        assert config.verification_config.enabled is True
-        assert config.verification_config.strictness == "balanced"
-
-    def test_verification_config_rejects_invalid_rounds(self):
-        with pytest.raises(Exception):
-            agent_model_module.AgentVerificationConfig(max_final_rounds=0)
-
-
 # ----------------------------------------------------------------------------
 # Tests for model_rebuild
 # ----------------------------------------------------------------------------
diff --git a/test/sdk/core/agents/test_core_agent.py b/test/sdk/core/agents/test_core_agent.py
index 3dd4f649e..8f4f00ec6 100644
--- a/test/sdk/core/agents/test_core_agent.py
+++ b/test/sdk/core/agents/test_core_agent.py
@@ -279,121 +279,6 @@ def test_parse_code_blobs_run_format():
     assert result == expected
 
 
-# ----------------------------------------------------------------------------
-# Tests for layered final-answer verification policy
-# ----------------------------------------------------------------------------
-
-def _make_verification_controller(**config_overrides):
-    config = core_agent_module.AgentVerificationConfig(
-        enabled=True,
-        step_verification_enabled=True,
-        final_verification_enabled=True,
-        llm_verification_enabled=True,
-        **config_overrides,
-    )
-    observer = MagicMock()
-    observer.add_message = MagicMock()
-    model = MagicMock()
-    logger = MagicMock()
-    logger.log = MagicMock()
-    return core_agent_module.VerificationController(
-        config=config,
-        observer=observer,
-        agent_name="test-agent",
-        model=model,
-        logger=logger,
-    ), model
-
-
-def test_final_verification_skips_llm_for_greeting():
-    """Simple greetings should not require external evidence or tool output."""
-    controller, model = _make_verification_controller()
-
-    result = controller.verify_final_answer(
-        task="你好",
-        candidate="你好！有什么我可以帮你的吗？",
-        memory_summary="Step 1:\nCode:\nObservation:\nOutput:",
-        round_number=1,
-    )
-
-    assert result.passed is True
-    assert result.phase == "final_pass"
-    model.assert_not_called()
-
-
-def test_final_verification_pass_message_explains_reason():
-    """Passed verification events should tell users what was checked."""
-    controller, _ = _make_verification_controller()
-
-    controller.verify_final_answer(
-        task="你好",
-        candidate="你好！有什么我可以帮你的吗？",
-        memory_summary="Step 1:\nCode:\nObservation:\nOutput:",
-        round_number=1,
-    )
-
-    messages = [
-        json.loads(call.args[2])["message"]
-        for call in controller.observer.add_message.call_args_list
-    ]
-
-    assert any("基础自检通过" in message and "答案非空" in message for message in messages)
-    assert any("最终自检通过" in message and "轻量对话无需外部证据" in message for message in messages)
-
-
-def test_verification_feedback_does_not_count_as_tool_error():
-    """Self-verification feedback should not poison the next final-answer check."""
-    controller, _ = _make_verification_controller()
-    memory_summary = """
-Step 1:
-Observation:
-Verification feedback:
-- Event: final_answer
-- Severity: blocking
-- Failed criteria: evidence_grounding, tool_error_handling
-- Repair instruction: Provide more evidence.
-"""
-
-    result = controller.verify_before_final_answer(
-        candidate="你好！有什么我可以帮你的吗？",
-        observation=memory_summary,
-        step_number=2,
-    )
-
-    assert result.passed is True
-    assert "previous_errors_acknowledged" not in result.failed_criteria
-
-
-def test_llm_verifier_ignores_non_required_evidence_and_tool_error_failures():
-    """Verifier output is normalized when failed criteria are not required by policy."""
-    controller, _ = _make_verification_controller()
-    verifier_payload = json.dumps({
-        "passed": False,
-        "score": 0.5,
-        "status": "revise",
-        "failed_criteria": ["evidence_grounding", "tool_error_handling"],
-        "checks": [
-            {"name": "evidence_grounding", "passed": False},
-            {"name": "tool_error_handling", "passed": False},
-        ],
-        "revision_instruction": "Find evidence.",
-        "user_visible_note": "Missing evidence.",
-    })
-
-    result = controller._parse_llm_verifier_result(
-        verifier_payload,
-        {
-            "task_profile": "lightweight_conversation",
-            "evidence_required": False,
-            "tool_error_check_required": False,
-        },
-    )
-
-    assert result.passed is True
-    assert result.failed_criteria == []
-    assert result.score >= controller.config.pass_score
-
-
 def test_parse_code_blobs_run_format_with_newline():
     """Test parse_code_blobs with <code>\\ncontent\\n</code> pattern."""
     text = """Here is some code:
@@ -2487,13 +2372,13 @@ def test_handle_max_steps_reached_model_error_fallback(self):
         # Should return error message
         assert "Error in generating final LLM output" in result
 
-        # Verify logger was called with error
+        # Verify logger was called with warning
         agent.logger.log.assert_called()
-        error_calls = [
+        warning_calls = [
             call for call in agent.logger.log.call_args_list
-            if call[1].get("level") and "ERROR" in str(call[1].get("level"))
+            if call[1].get("level") and "WARNING" in str(call[1].get("level"))
         ]
-        assert len(error_calls) >= 1
+        assert len(warning_calls) >= 1
 
     def test_handle_max_steps_reached_creates_memory_step_with_error(self):
         """Test that a memory step with AgentMaxStepsError is created."""
@@ -2724,3 +2609,4 @@ def failing_truncate(content, max_length=1000):
         # Verify warning was logged via the except block
         # The exception handler logs via self.logger.log()
         agent.logger.log.assert_called()
+
diff --git a/test/sdk/core/agents/test_nexent_agent.py b/test/sdk/core/agents/test_nexent_agent.py
index 882e28514..ff8da11f8 100644
--- a/test/sdk/core/agents/test_nexent_agent.py
+++ b/test/sdk/core/agents/test_nexent_agent.py
@@ -939,88 +939,6 @@ def test_create_local_tool_knowledge_base_with_display_name_map(nexent_agent_ins
     assert result.rerank_model == "mock_rerank_model"
 
 
-def test_create_local_tool_knowledge_base_with_document_paths_from_metadata(nexent_agent_instance):
-    """KnowledgeBaseSearchTool should receive document_paths from metadata via set_document_paths.
-
-    The `document_paths` parameter is declared with `exclude=True` so it must not
-    be passed to __init__. Instead it must be forwarded to `set_document_paths`
-    on the instance, sourced from `tool_config.metadata`. This guards against
-    the FieldInfo-iteration regression reported when document_paths is unset.
-    """
-    mock_kb_tool_class = MagicMock()
-    mock_kb_tool_instance = MagicMock()
-    mock_kb_tool_class.return_value = mock_kb_tool_instance
-
-    document_paths = ["s3://bucket/doc1.txt", "s3://bucket/doc2.txt"]
-
-    tool_config = ToolConfig(
-        class_name="KnowledgeBaseSearchTool",
-        name="knowledge_base_search",
-        description="desc",
-        inputs="{}",
-        output_type="string",
-        params={"top_k": 5, "index_names": ["kb1"]},
-        source="local",
-        metadata={
-            "vdb_core": "mock_vdb_core",
-            "embedding_model": "mock_embedding_model",
-            "document_paths": document_paths,
-        },
-    )
-
-    original_value = nexent_agent.__dict__.get("KnowledgeBaseSearchTool")
-    nexent_agent.__dict__["KnowledgeBaseSearchTool"] = mock_kb_tool_class
-
-    try:
-        nexent_agent_instance.create_local_tool(tool_config)
-    finally:
-        if original_value is not None:
-            nexent_agent.__dict__["KnowledgeBaseSearchTool"] = original_value
-        elif "KnowledgeBaseSearchTool" in nexent_agent.__dict__:
-            del nexent_agent.__dict__["KnowledgeBaseSearchTool"]
-
-    # document_paths is excluded and must not be forwarded to __init__.
-    init_kwargs = mock_kb_tool_class.call_args.kwargs
-    assert "document_paths" not in init_kwargs
-    # It must instead be applied via set_document_paths on the instance.
-    mock_kb_tool_instance.set_document_paths.assert_called_once_with(document_paths)
-
-
-def test_create_local_tool_knowledge_base_without_metadata_calls_set_document_paths_none(nexent_agent_instance):
-    """When metadata lacks document_paths, set_document_paths(None) must still be invoked.
-
-    Ensures the tool's internal filter is explicitly reset to None rather than
-    left as a stale FieldInfo default from the smolagents wrapper.
-    """
-    mock_kb_tool_class = MagicMock()
-    mock_kb_tool_instance = MagicMock()
-    mock_kb_tool_class.return_value = mock_kb_tool_instance
-
-    tool_config = ToolConfig(
-        class_name="KnowledgeBaseSearchTool",
-        name="knowledge_base_search",
-        description="desc",
-        inputs="{}",
-        output_type="string",
-        params={"top_k": 5, "index_names": ["kb1"]},
-        source="local",
-        metadata=None,
-    )
-
-    original_value = nexent_agent.__dict__.get("KnowledgeBaseSearchTool")
-    nexent_agent.__dict__["KnowledgeBaseSearchTool"] = mock_kb_tool_class
-
-    try:
-        nexent_agent_instance.create_local_tool(tool_config)
-    finally:
-        if original_value is not None:
-            nexent_agent.__dict__["KnowledgeBaseSearchTool"] = original_value
-        elif "KnowledgeBaseSearchTool" in nexent_agent.__dict__:
-            del nexent_agent.__dict__["KnowledgeBaseSearchTool"]
-
-    mock_kb_tool_instance.set_document_paths.assert_called_once_with(None)
-
-
 def test_create_local_tool_knowledge_base_with_empty_display_name_map(nexent_agent_instance):
     """Test KnowledgeBaseSearchTool creation handles empty display_name_to_index_map."""
     mock_kb_tool_class = MagicMock()
diff --git a/test/sdk/core/tools/test_knowledge_base_search_tool.py b/test/sdk/core/tools/test_knowledge_base_search_tool.py
index 7a4b23ebe..53d02206a 100644
--- a/test/sdk/core/tools/test_knowledge_base_search_tool.py
+++ b/test/sdk/core/tools/test_knowledge_base_search_tool.py
@@ -118,67 +118,9 @@ class VectorDatabaseCore:
 smolagents_mod = types.ModuleType("smolagents")
 smolagents_tools_mod = types.ModuleType("smolagents.tools")
 
-
 class Tool:
-    """Mock Tool class that properly handles Pydantic Field definitions."""
-
     def __init__(self, *args, **kwargs):
-        from pydantic.fields import FieldInfo
-
-        # Set all provided kwargs as instance attributes
-        for key, value in kwargs.items():
-            setattr(self, key, value)
-
-        # For any Pydantic Field attributes defined in class hierarchy that weren't provided,
-        # extract their default values
-        for cls in type(self).__mro__:
-            if cls is Tool:
-                continue
-            if hasattr(cls, '__annotations__'):
-                for name, hint in cls.__annotations__.items():
-                    # Skip if already set from kwargs
-                    if name in self.__dict__:
-                        continue
-                    # Check if there's a class attribute that's a FieldInfo
-                    if hasattr(cls, name):
-                        value = getattr(cls, name)
-                        # Unwrap FieldInfo to get the default
-                        if isinstance(value, FieldInfo):
-                            # Handle default_factory
-                            if value.default_factory is not None:
-                                value = value.default_factory()
-                            else:
-                                value = value.default
-                        setattr(self, name, value)
-
-    def __setattr__(self, name, value):
-        from pydantic.fields import FieldInfo
-        # Unwrap FieldInfo when it's set after __init__ completes (not from kwargs)
-        if isinstance(value, FieldInfo):
-            # Check if this is a class-level default by looking at the class
-            for cls in type(self).__mro__:
-                if cls is Tool:
-                    continue
-                if hasattr(cls, name):
-                    class_attr = getattr(cls, name)
-                    if class_attr is value:
-                        # This is a class-level FieldInfo default, unwrap it
-                        if value.default_factory is not None:
-                            value = value.default_factory()
-                        else:
-                            value = value.default
-                        break
-            else:
-                # Not found in class hierarchy, unwrap it anyway
-                if value.default_factory is not None:
-                    value = value.default_factory()
-                else:
-                    value = value.default
-        self.__dict__[name] = value
-
-    def __repr__(self):
-        return f"<MockTool _internal_document_paths={getattr(self, '_internal_document_paths', 'MISSING')}>"
-
+        pass
 
 smolagents_tools_mod.Tool = Tool
 smolagents_mod.tools = smolagents_tools_mod
@@ -555,10 +497,15 @@ def test_init_without_rerank_params(self, mock_observer):
             observer=mock_observer,
         )
 
-        # Mock Tool properly unwraps Field defaults, so we check the actual values
-        assert tool.rerank is False
-        assert tool.rerank_model_name == ""
-        assert tool.rerank_model is None
+        # smolagents Tool doesn't properly handle Field defaults, so we check FieldInfo.default
+        try:
+            from pydantic import FieldInfo
+        except ImportError:
+            from pydantic.fields import FieldInfo
+        assert isinstance(tool.rerank, FieldInfo)
+        assert tool.rerank.default is False
+        assert tool.rerank_model_name.default == ""
+        assert tool.rerank_model.default is None
 
     def test_forward_with_rerank_enabled(self, mock_observer, mock_vdb_core, mock_embedding_model, mocker):
         """Test forward method when rerank is enabled and model is provided."""
@@ -1569,298 +1516,3 @@ def test_forward_with_fieldinfo_rerank_default_only(self, mock_observer, mock_vd
         call_kwargs = mock_vdb_core.hybrid_search.call_args[1]
         # top_k from default is 3, multiplied by RERANK_OVERSEARCH_MULTIPLIER
         assert call_kwargs["top_k"] == 3 * RERANK_OVERSEARCH_MULTIPLIER
-
-
-class TestDocumentPathsAccessControl:
-    """Tests for document_paths access control functionality."""
-
-    def _create_mock_formatted_results_with_paths(self, paths: list) -> list:
-        """Create mock search results in FORMATTED format for _filter_by_document_paths tests.
-
-        After search_hybrid processes VDB results, the path_or_url is at the top level.
-        """
-        results = []
-        for path in paths:
-            results.append({
-                "path_or_url": path,
-                "title": f"Document {path}",
-                "content": f"Content for {path}",
-                "filename": f"{path}.txt",
-                "source_type": "file",
-                "create_time": "2024-01-01T12:00:00Z",
-                "score": 0.9,
-                "index": "test_index"
-            })
-        return results
-
-    def _create_mock_vdb_results_with_paths(self, paths: list) -> list:
-        """Create mock search results in VDB format for forward() tests.
-
-        VDB returns results with a nested 'document' object.
-        """
-        results = []
-        for path in paths:
-            results.append({
-                "document": {
-                    "path_or_url": path,
-                    "title": f"Document {path}",
-                    "content": f"Content for {path}",
-                    "filename": f"{path}.txt",
-                    "source_type": "file",
-                    "create_time": "2024-01-01T12:00:00Z",
-                },
-                "score": 0.9,
-                "index": "test_index"
-            })
-        return results
-        return results
-
-    def test_filter_by_document_paths_allows_matching(self, mock_vdb_core, mock_embedding_model):
-        """Test that results with path_or_url in the allowed list are returned."""
-        tool = KnowledgeBaseSearchTool(
-            index_names=["kb1"],
-            search_mode="hybrid",
-            vdb_core=mock_vdb_core,
-            embedding_model=mock_embedding_model,
-            document_paths=["s3://bucket/doc1.txt", "s3://bucket/doc2.txt"],
-        )
-
-        results = self._create_mock_formatted_results_with_paths(["s3://bucket/doc1.txt", "s3://bucket/doc2.txt", "s3://bucket/doc3.txt"])
-        filtered = tool._filter_by_document_paths(results)
-
-        # Only doc1 and doc2 should be returned
-        assert len(filtered) == 2
-        assert all(r.get("path_or_url") in ["s3://bucket/doc1.txt", "s3://bucket/doc2.txt"] for r in filtered)
-
-    def test_filter_by_document_paths_rejects_non_matching(self, mock_vdb_core, mock_embedding_model):
-        """Test that results with path_or_url NOT in the allowed list are filtered out."""
-        tool = KnowledgeBaseSearchTool(
-            index_names=["kb1"],
-            search_mode="hybrid",
-            vdb_core=mock_vdb_core,
-            embedding_model=mock_embedding_model,
-            document_paths=["s3://bucket/doc1.txt"],
-        )
-
-        results = self._create_mock_formatted_results_with_paths(["s3://bucket/doc1.txt", "s3://bucket/doc2.txt", "s3://bucket/doc3.txt"])
-        filtered = tool._filter_by_document_paths(results)
-
-        # Only doc1 should be returned
-        assert len(filtered) == 1
-        assert filtered[0].get("path_or_url") == "s3://bucket/doc1.txt"
-
-    def test_filter_by_document_paths_empty_list_returns_all(self, mock_vdb_core, mock_embedding_model):
-        """Test that empty document_paths list returns all results."""
-        tool = KnowledgeBaseSearchTool(
-            index_names=["kb1"],
-            search_mode="hybrid",
-            vdb_core=mock_vdb_core,
-            embedding_model=mock_embedding_model,
-            document_paths=[],
-        )
-
-        results = self._create_mock_formatted_results_with_paths(["s3://bucket/doc1.txt", "s3://bucket/doc2.txt", "s3://bucket/doc3.txt"])
-        filtered = tool._filter_by_document_paths(results)
-
-        # All results should be returned
-        assert len(filtered) == 3
-
-    def test_filter_by_document_paths_none_returns_all(self, mock_vdb_core, mock_embedding_model):
-        """Test that None document_paths (no filter) returns all results."""
-        tool = KnowledgeBaseSearchTool(
-            index_names=["kb1"],
-            search_mode="hybrid",
-            vdb_core=mock_vdb_core,
-            embedding_model=mock_embedding_model,
-            document_paths=None,
-        )
-
-        results = self._create_mock_formatted_results_with_paths(["s3://bucket/doc1.txt", "s3://bucket/doc2.txt", "s3://bucket/doc3.txt"])
-        filtered = tool._filter_by_document_paths(results)
-
-        # All results should be returned
-        assert len(filtered) == 3
-
-    def test_filter_by_document_paths_results_missing_path(self, mock_vdb_core, mock_embedding_model):
-        """Test that results without path_or_url field are filtered out when filter is active."""
-        tool = KnowledgeBaseSearchTool(
-            index_names=["kb1"],
-            search_mode="hybrid",
-            vdb_core=mock_vdb_core,
-            embedding_model=mock_embedding_model,
-            document_paths=["s3://bucket/doc1.txt"],
-        )
-
-        results = self._create_mock_formatted_results_with_paths(["s3://bucket/doc1.txt"])
-        # Add a result without path_or_url (flat format, no nested document)
-        results.append({
-            "title": "No Path",
-            "content": "This document has no path_or_url",
-            "filename": "no_path.txt",
-            "source_type": "file",
-            "score": 0.8,
-            "index": "test_index"
-        })
-
-        filtered = tool._filter_by_document_paths(results)
-
-        # Only doc1 should be returned
-        assert len(filtered) == 1
-        assert filtered[0].get("path_or_url") == "s3://bucket/doc1.txt"
-
-    def test_set_document_paths_method(self, mock_vdb_core, mock_embedding_model):
-        """Test the set_document_paths method updates the internal filter."""
-        tool = KnowledgeBaseSearchTool(
-            index_names=["kb1"],
-            search_mode="hybrid",
-            vdb_core=mock_vdb_core,
-            embedding_model=mock_embedding_model,
-            document_paths=None,
-        )
-
-        # Initially no filter
-        results = self._create_mock_formatted_results_with_paths(["s3://bucket/doc1.txt", "s3://bucket/doc2.txt"])
-        assert len(tool._filter_by_document_paths(results)) == 2
-
-        # Set document_paths filter
-        tool.set_document_paths(["s3://bucket/doc1.txt"])
-        filtered = tool._filter_by_document_paths(results)
-
-        # Only doc1 should be returned
-        assert len(filtered) == 1
-        assert filtered[0].get("path_or_url") == "s3://bucket/doc1.txt"
-
-    def test_forward_with_document_paths_filter(self, mock_vdb_core, mock_embedding_model, mock_observer):
-        """Test that forward method applies document_paths filter to search results."""
-        tool = KnowledgeBaseSearchTool(
-            index_names=["kb1"],
-            search_mode="hybrid",
-            vdb_core=mock_vdb_core,
-            embedding_model=mock_embedding_model,
-            observer=mock_observer,
-            document_paths=["s3://bucket/doc1.txt"],
-            top_k=5,
-        )
-
-        # Mock VDB returns 3 results, but only 1 matches the filter
-        # VDB returns nested 'document' format
-        mock_results = self._create_mock_vdb_results_with_paths(["s3://bucket/doc1.txt", "s3://bucket/doc2.txt", "s3://bucket/doc3.txt"])
-        mock_vdb_core.hybrid_search.return_value = mock_results
-
-        result = tool.forward("test query")
-        search_results = json.loads(result)
-
-        # Only doc1 should be in the result
-        assert len(search_results) == 1
-        assert search_results[0].get("url") == "s3://bucket/doc1.txt"
-
-    def test_forward_with_document_paths_filter_no_results_after_filter(self, mock_vdb_core, mock_embedding_model, mock_observer):
-        """Test that forward raises exception when all results are filtered out."""
-        tool = KnowledgeBaseSearchTool(
-            index_names=["kb1"],
-            search_mode="hybrid",
-            vdb_core=mock_vdb_core,
-            embedding_model=mock_embedding_model,
-            observer=mock_observer,
-            document_paths=["s3://bucket/nonexistent.txt"],
-            top_k=5,
-        )
-
-        # Mock VDB returns 3 results, none match the filter
-        mock_results = self._create_mock_vdb_results_with_paths(["s3://bucket/doc1.txt", "s3://bucket/doc2.txt", "s3://bucket/doc3.txt"])
-        mock_vdb_core.hybrid_search.return_value = mock_results
-
-        # Should raise exception because after filtering, no results remain
-        with pytest.raises(Exception) as excinfo:
-            tool.forward("test query")
-
-        assert "No results found" in str(excinfo.value)
-
-    def test_filter_by_document_paths_unwraps_fieldinfo_default(self, mock_vdb_core, mock_embedding_model):
-        """Filter should tolerate a FieldInfo default instead of a concrete list.
-
-        Regression: smolagents' Tool wrapper does not expand FieldInfo defaults for
-        parameters declared with `exclude=True`, so `self._internal_document_paths`
-        may arrive as a FieldInfo. The filter must unwrap it instead of failing with
-        `TypeError: argument of type 'FieldInfo' is not iterable`.
-        """
-        try:
-            from pydantic import FieldInfo
-        except ImportError:
-            from pydantic.fields import FieldInfo
-
-        field_info_default = FieldInfo(default=["s3://bucket/doc1.txt"])
-
-        tool = KnowledgeBaseSearchTool(
-            index_names=["kb1"],
-            search_mode="hybrid",
-            vdb_core=mock_vdb_core,
-            embedding_model=mock_embedding_model,
-            document_paths=None,
-        )
-        # Simulate a FieldInfo being assigned directly (e.g. from smolagents wrapper).
-        tool._internal_document_paths = field_info_default
-
-        results = self._create_mock_formatted_results_with_paths(
-            ["s3://bucket/doc1.txt", "s3://bucket/doc2.txt"]
-        )
-        filtered = tool._filter_by_document_paths(results)
-
-        assert len(filtered) == 1
-        assert filtered[0]["path_or_url"] == "s3://bucket/doc1.txt"
-
-    def test_filter_by_document_paths_unwraps_fieldinfo_default_factory(self, mock_vdb_core, mock_embedding_model):
-        """Filter should tolerate a FieldInfo with default_factory."""
-        try:
-            from pydantic import FieldInfo
-        except ImportError:
-            from pydantic.fields import FieldInfo
-
-        field_info_factory = FieldInfo(
-            default_factory=lambda: ["s3://bucket/doc2.txt"]
-        )
-
-        tool = KnowledgeBaseSearchTool(
-            index_names=["kb1"],
-            search_mode="hybrid",
-            vdb_core=mock_vdb_core,
-            embedding_model=mock_embedding_model,
-            document_paths=None,
-        )
-        tool._internal_document_paths = field_info_factory
-
-        results = self._create_mock_formatted_results_with_paths(
-            ["s3://bucket/doc1.txt", "s3://bucket/doc2.txt"]
-        )
-        filtered = tool._filter_by_document_paths(results)
-
-        assert len(filtered) == 1
-        assert filtered[0]["path_or_url"] == "s3://bucket/doc2.txt"
-
-    def test_set_document_paths_unwraps_fieldinfo(self, mock_vdb_core, mock_embedding_model):
-        """set_document_paths should also accept FieldInfo input defensively."""
-        try:
-            from pydantic import FieldInfo
-        except ImportError:
-            from pydantic.fields import FieldInfo
-
-        tool = KnowledgeBaseSearchTool(
-            index_names=["kb1"],
-            search_mode="hybrid",
-            vdb_core=mock_vdb_core,
-            embedding_model=mock_embedding_model,
-            document_paths=None,
-        )
-
-        field_info = FieldInfo(default=["s3://bucket/doc1.txt"])
-        tool.set_document_paths(field_info)
-
-        results = self._create_mock_formatted_results_with_paths(
-            ["s3://bucket/doc1.txt", "s3://bucket/doc2.txt"]
-        )
-        filtered = tool._filter_by_document_paths(results)
-
-        assert len(filtered) == 1
-        assert filtered[0]["path_or_url"] == "s3://bucket/doc1.txt"
-
-
diff --git a/test/sdk/core/tools/test_search_memory_tool.py b/test/sdk/core/tools/test_search_memory_tool.py
deleted file mode 100644
index c17f2f14d..000000000
--- a/test/sdk/core/tools/test_search_memory_tool.py
+++ /dev/null
@@ -1,209 +0,0 @@
-import pytest
-from unittest.mock import MagicMock, patch, AsyncMock
-
-from sdk.nexent.core.utils.observer import MessageObserver, ProcessType
-from sdk.nexent.core.tools.search_memory_tool import SearchMemoryTool
-
-
-@pytest.fixture
-def mock_observer():
-    observer = MagicMock(spec=MessageObserver)
-    observer.lang = "en"
-    return observer
-
-
-@pytest.fixture
-def mock_user_config():
-    config = MagicMock()
-    config.agent_share_option = "always"
-    config.disable_agent_ids = []
-    config.disable_user_agent_ids = []
-    return config
-
-
-@pytest.fixture
-def search_memory_tool(mock_observer, mock_user_config):
-    return SearchMemoryTool(
-        memory_config={"test": "config"},
-        tenant_id="tenant_1",
-        user_id="user_1",
-        agent_id="agent_1",
-        memory_user_config=mock_user_config,
-        observer=mock_observer,
-    )
-
-
-def test_observer_english_message(search_memory_tool, mock_observer):
-    mock_observer.lang = "en"
-    with patch(
-        "sdk.nexent.memory.memory_service.search_memory_in_levels",
-        new_callable=AsyncMock,
-        return_value={"results": []},
-    ):
-        search_memory_tool.forward("some query")
-
-    mock_observer.add_message.assert_any_call("", ProcessType.TOOL, "Searching memory...")
-
-
-def test_observer_chinese_message(search_memory_tool, mock_observer):
-    mock_observer.lang = "zh"
-    with patch(
-        "sdk.nexent.memory.memory_service.search_memory_in_levels",
-        new_callable=AsyncMock,
-        return_value={"results": []},
-    ):
-        search_memory_tool.forward("some query")
-
-    mock_observer.add_message.assert_any_call("", ProcessType.TOOL, "搜索记忆中...")
-
-
-def test_no_observer(search_memory_tool):
-    search_memory_tool.observer = None
-    with patch(
-        "sdk.nexent.memory.memory_service.search_memory_in_levels",
-        new_callable=AsyncMock,
-        return_value={"results": [{"memory": "fact", "score": 0.9, "memory_level": "user"}]},
-    ):
-        result = search_memory_tool.forward("some query")
-
-    assert "Found 1 relevant memories" in result
-
-
-def test_forward_with_results(search_memory_tool):
-    with patch(
-        "sdk.nexent.memory.memory_service.search_memory_in_levels",
-        new_callable=AsyncMock,
-        return_value={
-            "results": [
-                {"memory": "User prefers dark mode", "score": 0.92, "memory_level": "user_agent"},
-                {"memory": "User timezone is UTC+8", "score": 0.85, "memory_level": "user"},
-                {"memory": "Agent should confirm before executing", "score": 0.71, "memory_level": "agent"},
-            ]
-        },
-    ) as mock_search:
-        result = search_memory_tool.forward("user preferences", top_k=3)
-
-    assert "Found 3 relevant memories" in result
-    assert "(score: 0.92, level: user_agent) User prefers dark mode" in result
-    assert "(score: 0.85, level: user) User timezone is UTC+8" in result
-    assert "(score: 0.71, level: agent) Agent should confirm before executing" in result
-
-    mock_search.assert_called_once_with(
-        query_text="user preferences",
-        memory_config={"test": "config"},
-        tenant_id="tenant_1",
-        user_id="user_1",
-        agent_id="agent_1",
-        top_k=3,
-        memory_levels=["tenant", "user", "agent", "user_agent"],
-    )
-
-
-def test_forward_no_results(search_memory_tool):
-    with patch(
-        "sdk.nexent.memory.memory_service.search_memory_in_levels",
-        new_callable=AsyncMock,
-        return_value={"results": []},
-    ):
-        result = search_memory_tool.forward("nonexistent topic")
-
-    assert result == "No relevant memories found."
-
-
-def test_forward_default_top_k(search_memory_tool):
-    with patch(
-        "sdk.nexent.memory.memory_service.search_memory_in_levels",
-        new_callable=AsyncMock,
-        return_value={"results": []},
-    ) as mock_search:
-        search_memory_tool.forward("some query")
-
-    call_kwargs = mock_search.call_args[1]
-    assert call_kwargs["top_k"] == 5
-
-
-def test_forward_custom_top_k(search_memory_tool):
-    with patch(
-        "sdk.nexent.memory.memory_service.search_memory_in_levels",
-        new_callable=AsyncMock,
-        return_value={"results": []},
-    ) as mock_search:
-        search_memory_tool.forward("some query", top_k=10)
-
-    call_kwargs = mock_search.call_args[1]
-    assert call_kwargs["top_k"] == 10
-
-
-def test_forward_uses_content_field_fallback(search_memory_tool):
-    with patch(
-        "sdk.nexent.memory.memory_service.search_memory_in_levels",
-        new_callable=AsyncMock,
-        return_value={
-            "results": [
-                {"content": "Fallback content field", "score": 0.8, "memory_level": "user"},
-            ]
-        },
-    ):
-        result = search_memory_tool.forward("query")
-
-    assert "Fallback content field" in result
-
-
-def test_levels_agent_share_never(search_memory_tool, mock_user_config):
-    mock_user_config.agent_share_option = "never"
-
-    with patch(
-        "sdk.nexent.memory.memory_service.search_memory_in_levels",
-        new_callable=AsyncMock,
-        return_value={"results": []},
-    ) as mock_search:
-        search_memory_tool.forward("query")
-
-    call_kwargs = mock_search.call_args[1]
-    assert "agent" not in call_kwargs["memory_levels"]
-    assert "tenant" in call_kwargs["memory_levels"]
-    assert "user" in call_kwargs["memory_levels"]
-    assert "user_agent" in call_kwargs["memory_levels"]
-
-
-def test_levels_disable_agent_ids(search_memory_tool, mock_user_config):
-    mock_user_config.disable_agent_ids = ["agent_1"]
-
-    with patch(
-        "sdk.nexent.memory.memory_service.search_memory_in_levels",
-        new_callable=AsyncMock,
-        return_value={"results": []},
-    ) as mock_search:
-        search_memory_tool.forward("query")
-
-    call_kwargs = mock_search.call_args[1]
-    assert "agent" not in call_kwargs["memory_levels"]
-    assert "tenant" in call_kwargs["memory_levels"]
-
-
-def test_levels_disable_user_agent_ids(search_memory_tool, mock_user_config):
-    mock_user_config.disable_user_agent_ids = ["agent_1"]
-
-    with patch(
-        "sdk.nexent.memory.memory_service.search_memory_in_levels",
-        new_callable=AsyncMock,
-        return_value={"results": []},
-    ) as mock_search:
-        search_memory_tool.forward("query")
-
-    call_kwargs = mock_search.call_args[1]
-    assert "user_agent" not in call_kwargs["memory_levels"]
-    assert "agent" in call_kwargs["memory_levels"]
-
-
-def test_forward_exception_returns_friendly_error(search_memory_tool):
-    with patch(
-        "sdk.nexent.memory.memory_service.search_memory_in_levels",
-        new_callable=AsyncMock,
-        side_effect=Exception("Elasticsearch timeout"),
-    ):
-        result = search_memory_tool.forward("query")
-
-    assert "Memory search failed" in result
-    assert "Elasticsearch timeout" in result
-    assert "Continuing without memory results" in result
diff --git a/test/sdk/core/tools/test_store_memory_tool.py b/test/sdk/core/tools/test_store_memory_tool.py
deleted file mode 100644
index a3cfde9ef..000000000
--- a/test/sdk/core/tools/test_store_memory_tool.py
+++ /dev/null
@@ -1,285 +0,0 @@
-import pytest
-from unittest.mock import MagicMock, patch, AsyncMock
-
-from sdk.nexent.core.utils.observer import MessageObserver, ProcessType
-from sdk.nexent.core.tools.store_memory_tool import StoreMemoryTool
-
-
-@pytest.fixture
-def mock_observer():
-    observer = MagicMock(spec=MessageObserver)
-    observer.lang = "en"
-    return observer
-
-
-@pytest.fixture
-def mock_user_config():
-    config = MagicMock()
-    config.agent_share_option = "always"
-    config.disable_agent_ids = []
-    config.disable_user_agent_ids = []
-    return config
-
-
-@pytest.fixture
-def store_memory_tool(mock_observer, mock_user_config):
-    return StoreMemoryTool(
-        memory_config={"test": "config"},
-        tenant_id="tenant_1",
-        user_id="user_1",
-        agent_id="agent_1",
-        memory_user_config=mock_user_config,
-        observer=mock_observer,
-    )
-
-
-def test_observer_english_message(store_memory_tool, mock_observer):
-    mock_observer.lang = "en"
-    with patch(
-        "sdk.nexent.memory.memory_service.add_memory_in_levels",
-        new_callable=AsyncMock,
-        return_value={"results": []},
-    ):
-        store_memory_tool.forward("some content")
-
-    mock_observer.add_message.assert_any_call("", ProcessType.TOOL, "Saving to memory...")
-
-
-def test_observer_chinese_message(store_memory_tool, mock_observer):
-    mock_observer.lang = "zh"
-    with patch(
-        "sdk.nexent.memory.memory_service.add_memory_in_levels",
-        new_callable=AsyncMock,
-        return_value={"results": []},
-    ):
-        store_memory_tool.forward("some content")
-
-    mock_observer.add_message.assert_any_call("", ProcessType.TOOL, "保存到记忆中...")
-
-
-def test_no_observer(store_memory_tool):
-    store_memory_tool.observer = None
-    with patch(
-        "sdk.nexent.memory.memory_service.add_memory_in_levels",
-        new_callable=AsyncMock,
-        return_value={"results": [{"event": "ADD", "memory": "fact"}]},
-    ):
-        result = store_memory_tool.forward("some content")
-
-    assert "Stored successfully" in result
-
-
-def test_forward_add_event(store_memory_tool):
-    with patch(
-        "sdk.nexent.memory.memory_service.add_memory_in_levels",
-        new_callable=AsyncMock,
-        return_value={
-            "results": [
-                {"event": "ADD", "memory": "User prefers dark mode"},
-                {"event": "ADD", "memory": "User works on Project X"},
-            ]
-        },
-    ) as mock_add:
-        result = store_memory_tool.forward("I prefer dark mode and work on Project X")
-
-    assert "Stored successfully" in result
-    assert "[ADD] User prefers dark mode" in result
-    assert "[ADD] User works on Project X" in result
-    assert store_memory_tool.store_count == 1
-
-    mock_add.assert_called_once_with(
-        messages=[{"role": "user", "content": "I prefer dark mode and work on Project X"}],
-        memory_config={"test": "config"},
-        tenant_id="tenant_1",
-        user_id="user_1",
-        agent_id="agent_1",
-        memory_levels=["user_agent", "agent"],
-    )
-
-
-def test_forward_update_event(store_memory_tool):
-    with patch(
-        "sdk.nexent.memory.memory_service.add_memory_in_levels",
-        new_callable=AsyncMock,
-        return_value={
-            "results": [
-                {"event": "UPDATE", "memory": "User prefers dark mode and high contrast"},
-            ]
-        },
-    ):
-        result = store_memory_tool.forward("I also like high contrast")
-
-    assert "Stored successfully" in result
-    assert "[UPDATE] User prefers dark mode and high contrast" in result
-
-
-def test_forward_mixed_events(store_memory_tool):
-    with patch(
-        "sdk.nexent.memory.memory_service.add_memory_in_levels",
-        new_callable=AsyncMock,
-        return_value={
-            "results": [
-                {"event": "ADD", "memory": "New fact"},
-                {"event": "NONE", "memory": "Existing fact"},
-                {"event": "DELETE", "memory": "Old fact"},
-                {"event": "UPDATE", "memory": "Updated fact"},
-            ]
-        },
-    ):
-        result = store_memory_tool.forward("some content")
-
-    assert "[ADD] New fact" in result
-    assert "[UPDATE] Updated fact" in result
-    assert "NONE" not in result
-    assert "DELETE" not in result
-
-
-def test_forward_no_results(store_memory_tool):
-    with patch(
-        "sdk.nexent.memory.memory_service.add_memory_in_levels",
-        new_callable=AsyncMock,
-        return_value={"results": []},
-    ):
-        result = store_memory_tool.forward("just a greeting")
-
-    assert result == "No new facts were extracted from the content."
-
-
-def test_forward_all_none_events(store_memory_tool):
-    with patch(
-        "sdk.nexent.memory.memory_service.add_memory_in_levels",
-        new_callable=AsyncMock,
-        return_value={
-            "results": [
-                {"event": "NONE", "memory": "Already known fact"},
-            ]
-        },
-    ):
-        result = store_memory_tool.forward("already known info")
-
-    assert result == "The information was already present in memory (no changes needed)."
-
-
-def test_cost_guard_limit_reached(store_memory_tool):
-    store_memory_tool.store_count = 3
-
-    result = store_memory_tool.forward("some content")
-
-    assert "Memory storage limit reached" in result
-
-
-def test_cost_guard_increments_counter(store_memory_tool):
-    with patch(
-        "sdk.nexent.memory.memory_service.add_memory_in_levels",
-        new_callable=AsyncMock,
-        return_value={"results": [{"event": "ADD", "memory": "fact"}]},
-    ):
-        store_memory_tool.forward("content 1")
-        store_memory_tool.forward("content 2")
-
-    assert store_memory_tool.store_count == 2
-
-
-def test_cost_guard_increments_even_with_no_facts(store_memory_tool):
-    with patch(
-        "sdk.nexent.memory.memory_service.add_memory_in_levels",
-        new_callable=AsyncMock,
-        return_value={"results": []},
-    ):
-        store_memory_tool.forward("nothing useful")
-
-    # store_count increments after asyncio.run succeeds, regardless of results
-    assert store_memory_tool.store_count == 1
-
-
-def test_levels_agent_share_never(store_memory_tool, mock_user_config):
-    mock_user_config.agent_share_option = "never"
-
-    with patch(
-        "sdk.nexent.memory.memory_service.add_memory_in_levels",
-        new_callable=AsyncMock,
-        return_value={"results": [{"event": "ADD", "memory": "fact"}]},
-    ) as mock_add:
-        store_memory_tool.forward("some content")
-
-    call_kwargs = mock_add.call_args[1]
-    assert call_kwargs["memory_levels"] == ["user_agent"]
-    assert "agent" not in call_kwargs["memory_levels"]
-
-
-def test_levels_agent_share_always(store_memory_tool, mock_user_config):
-    mock_user_config.agent_share_option = "always"
-
-    with patch(
-        "sdk.nexent.memory.memory_service.add_memory_in_levels",
-        new_callable=AsyncMock,
-        return_value={"results": [{"event": "ADD", "memory": "fact"}]},
-    ) as mock_add:
-        store_memory_tool.forward("some content")
-
-    call_kwargs = mock_add.call_args[1]
-    assert "user_agent" in call_kwargs["memory_levels"]
-    assert "agent" in call_kwargs["memory_levels"]
-
-
-def test_levels_disable_agent_ids(store_memory_tool, mock_user_config):
-    mock_user_config.disable_agent_ids = ["agent_1"]
-
-    with patch(
-        "sdk.nexent.memory.memory_service.add_memory_in_levels",
-        new_callable=AsyncMock,
-        return_value={"results": [{"event": "ADD", "memory": "fact"}]},
-    ) as mock_add:
-        store_memory_tool.forward("some content")
-
-    call_kwargs = mock_add.call_args[1]
-    assert "agent" not in call_kwargs["memory_levels"]
-    assert "user_agent" in call_kwargs["memory_levels"]
-
-
-def test_levels_disable_user_agent_ids(store_memory_tool, mock_user_config):
-    mock_user_config.disable_user_agent_ids = ["agent_1"]
-
-    with patch(
-        "sdk.nexent.memory.memory_service.add_memory_in_levels",
-        new_callable=AsyncMock,
-        return_value={"results": [{"event": "ADD", "memory": "fact"}]},
-    ) as mock_add:
-        store_memory_tool.forward("some content")
-
-    call_kwargs = mock_add.call_args[1]
-    assert "user_agent" not in call_kwargs["memory_levels"]
-    assert "agent" in call_kwargs["memory_levels"]
-
-
-def test_levels_all_disabled(store_memory_tool, mock_user_config):
-    mock_user_config.disable_agent_ids = ["agent_1"]
-    mock_user_config.disable_user_agent_ids = ["agent_1"]
-
-    result = store_memory_tool.forward("some content")
-
-    assert result == "No memory levels available (all disabled by user preferences)."
-
-
-def test_forward_exception_returns_friendly_error(store_memory_tool):
-    with patch(
-        "sdk.nexent.memory.memory_service.add_memory_in_levels",
-        new_callable=AsyncMock,
-        side_effect=Exception("Elasticsearch connection refused"),
-    ):
-        result = store_memory_tool.forward("some content")
-
-    assert "Failed to store memory" in result
-    assert "Elasticsearch connection refused" in result
-    assert "Continuing without saving" in result
-
-
-def test_forward_exception_does_not_increment_counter(store_memory_tool):
-    with patch(
-        "sdk.nexent.memory.memory_service.add_memory_in_levels",
-        new_callable=AsyncMock,
-        side_effect=Exception("connection error"),
-    ):
-        store_memory_tool.forward("some content")
-
-    assert store_memory_tool.store_count == 0
diff --git a/test/sdk/data_process/test_core.py b/test/sdk/data_process/test_core.py
index e0edced14..6c47c3732 100644
--- a/test/sdk/data_process/test_core.py
+++ b/test/sdk/data_process/test_core.py
@@ -2,22 +2,6 @@
 from pytest_mock import MockFixture
 from unittest.mock import Mock, MagicMock
 from io import BytesIO
-import sys
-import types
-
-
-fake_unstructured = types.ModuleType("unstructured_inference")
-fake_models = types.ModuleType("unstructured_inference.models")
-fake_tables = types.ModuleType("unstructured_inference.models.tables")
-fake_tables.tables_agent = types.SimpleNamespace(model=None)
-fake_logger = types.ModuleType("unstructured_inference.logger")
-fake_logger.logger = types.SimpleNamespace(info=lambda *a, **k: None, warning=lambda *a, **k: None, error=lambda *a, **k: None)
-fake_models.tables = fake_tables
-fake_unstructured.models = fake_models
-sys.modules.setdefault("unstructured_inference", fake_unstructured)
-sys.modules.setdefault("unstructured_inference.models", fake_models)
-sys.modules.setdefault("unstructured_inference.models.tables", fake_tables)
-sys.modules.setdefault("unstructured_inference.logger", fake_logger)
 
 from sdk.nexent.data_process.core import DataProcessCore
 
diff --git a/test/sdk/data_process/test_file_splitter.py b/test/sdk/data_process/test_file_splitter.py
index 5c44131d7..6e59d2b76 100644
--- a/test/sdk/data_process/test_file_splitter.py
+++ b/test/sdk/data_process/test_file_splitter.py
@@ -1,6 +1,4 @@
 from io import BytesIO
-import sys
-import types
 
 import pytest
 
@@ -9,19 +7,6 @@
 pytest.importorskip("openpyxl")
 pytest.importorskip("pypdf")
 
-fake_unstructured = types.ModuleType("unstructured_inference")
-fake_models = types.ModuleType("unstructured_inference.models")
-fake_tables = types.ModuleType("unstructured_inference.models.tables")
-fake_tables.tables_agent = types.SimpleNamespace(model=None)
-fake_logger = types.ModuleType("unstructured_inference.logger")
-fake_logger.logger = types.SimpleNamespace(info=lambda *a, **k: None, warning=lambda *a, **k: None, error=lambda *a, **k: None)
-fake_models.tables = fake_tables
-fake_unstructured.models = fake_models
-sys.modules.setdefault("unstructured_inference", fake_unstructured)
-sys.modules.setdefault("unstructured_inference.models", fake_models)
-sys.modules.setdefault("unstructured_inference.models.tables", fake_tables)
-sys.modules.setdefault("unstructured_inference.logger", fake_logger)
-
 from sdk.nexent.data_process.file_splitter import FileSplitter
 
 
diff --git a/test/sdk/data_process/test_openpyxl_processor.py b/test/sdk/data_process/test_openpyxl_processor.py
index b8c5178fe..91182470e 100644
--- a/test/sdk/data_process/test_openpyxl_processor.py
+++ b/test/sdk/data_process/test_openpyxl_processor.py
@@ -3,22 +3,6 @@
 from pytest_mock import MockFixture
 from unittest.mock import Mock, MagicMock, patch
 from copy import deepcopy
-import sys
-import types
-
-
-fake_unstructured = types.ModuleType("unstructured_inference")
-fake_models = types.ModuleType("unstructured_inference.models")
-fake_tables = types.ModuleType("unstructured_inference.models.tables")
-fake_tables.tables_agent = types.SimpleNamespace(model=None)
-fake_logger = types.ModuleType("unstructured_inference.logger")
-fake_logger.logger = types.SimpleNamespace(info=lambda *a, **k: None, warning=lambda *a, **k: None, error=lambda *a, **k: None)
-fake_models.tables = fake_tables
-fake_unstructured.models = fake_models
-sys.modules.setdefault("unstructured_inference", fake_unstructured)
-sys.modules.setdefault("unstructured_inference.models", fake_models)
-sys.modules.setdefault("unstructured_inference.models.tables", fake_tables)
-sys.modules.setdefault("unstructured_inference.logger", fake_logger)
 
 from sdk.nexent.data_process.openpyxl_processor import OpenPyxlProcessor
 
diff --git a/test/sdk/data_process/test_unstructured_processor.py b/test/sdk/data_process/test_unstructured_processor.py
index 83724e995..bfb828d10 100644
--- a/test/sdk/data_process/test_unstructured_processor.py
+++ b/test/sdk/data_process/test_unstructured_processor.py
@@ -5,20 +5,6 @@
 from pytest_mock import MockFixture
 from unittest.mock import Mock, MagicMock, patch
 
-
-fake_unstructured = types.ModuleType("unstructured_inference")
-fake_models = types.ModuleType("unstructured_inference.models")
-fake_tables = types.ModuleType("unstructured_inference.models.tables")
-fake_tables.tables_agent = types.SimpleNamespace(model=None)
-fake_logger = types.ModuleType("unstructured_inference.logger")
-fake_logger.logger = types.SimpleNamespace(info=lambda *a, **k: None, warning=lambda *a, **k: None, error=lambda *a, **k: None)
-fake_models.tables = fake_tables
-fake_unstructured.models = fake_models
-sys.modules.setdefault("unstructured_inference", fake_unstructured)
-sys.modules.setdefault("unstructured_inference.models", fake_models)
-sys.modules.setdefault("unstructured_inference.models.tables", fake_tables)
-sys.modules.setdefault("unstructured_inference.logger", fake_logger)
-
 from sdk.nexent.data_process.unstructured_processor import UnstructuredProcessor
 
 
diff --git a/test/sdk/skills/test_skill_manager.py b/test/sdk/skills/test_skill_manager.py
index b23c0b8dd..a262a4bbe 100644
--- a/test/sdk/skills/test_skill_manager.py
+++ b/test/sdk/skills/test_skill_manager.py
@@ -1921,8 +1921,7 @@ def test_run_python_script_with_list_params(self, mocker):
 
             assert result == "ok"
             args = sp.run.call_args[0][0]
-            assert args[0] == sys.executable
-            assert args[1:] == [ANY, "-i", "a", "-i", "b", "-i", "c"]
+            assert args == ["python", ANY, "-i", "a", "-i", "b", "-i", "c"]
 
     def test_run_python_script_boolean_false_excluded(self, mocker):
         """Test boolean flags in string params are passed as-is (True)."""