From 625c2d5a77a65f94ae2f377023ba6b8968f3d351 Mon Sep 17 00:00:00 2001 From: Junyan Chin Date: Sun, 1 Mar 2026 18:11:43 +0800 Subject: [PATCH 1/7] feat: model fallback chain (#2017) --------- Co-authored-by: TyperBody --- .../libs/wechatpad_api/util/http_util.py | 28 +- .../controller/groups/provider/api_chains.py | 41 + src/langbot/pkg/api/http/service/api_chain.py | 149 ++++ src/langbot/pkg/api/http/service/space.py | 82 +- src/langbot/pkg/core/app.py | 6 + src/langbot/pkg/core/bootutils/deps.py | 8 +- src/langbot/pkg/core/stages/build_app.py | 9 + .../pkg/entity/persistence/api_chain.py | 98 +++ .../migrations/dbm008_api_chain.py | 46 ++ .../dbm020_api_chain_model_api_level.py | 39 + .../dbm021_api_chain_health_check_flag.py | 27 + .../cntfilter/filters/baiduexamine.py | 83 +- src/langbot/pkg/pipeline/preproc/preproc.py | 52 +- src/langbot/pkg/platform/sources/discord.py | 60 +- src/langbot/pkg/platform/sources/kook.py | 68 +- src/langbot/pkg/platform/sources/lark.py | 24 +- .../pkg/platform/sources/legacy/gewechat.py | 18 +- src/langbot/pkg/platform/sources/telegram.py | 46 +- src/langbot/pkg/platform/webhook_pusher.py | 34 +- .../pkg/provider/modelmgr/api_chain.py | 757 ++++++++++++++++++ .../pkg/provider/runners/localagent.py | 122 ++- src/langbot/pkg/provider/runners/n8nsvapi.py | 80 +- src/langbot/pkg/utils/image.py | 163 ++-- .../templates/metadata/pipeline/ai.yaml | 6 +- web/eslint.config.mjs | 3 + .../home/bots/components/bot-form/BotForm.tsx | 8 +- .../api-chains-dialog/APIChainCard.tsx | 495 ++++++++++++ .../api-chains-dialog/APIChainForm.tsx | 665 +++++++++++++++ .../api-chains-dialog/APIChainsDialog.tsx | 179 +++++ .../dynamic-form/DynamicFormComponent.tsx | 41 +- .../dynamic-form/DynamicFormItemComponent.tsx | 104 ++- .../components/models-dialog/ModelsDialog.tsx | 37 +- web/src/app/infra/entities/api/api_chain.ts | 64 ++ web/src/app/infra/entities/api/index.ts | 58 ++ web/src/app/infra/entities/form/dynamic.ts | 1 + 
web/src/app/infra/http/BackendClient.ts | 29 + web/src/i18n/locales/en-US.ts | 56 ++ web/src/i18n/locales/ja-JP.ts | 58 +- web/src/i18n/locales/zh-Hans.ts | 56 ++ web/src/i18n/locales/zh-Hant.ts | 55 ++ 40 files changed, 3487 insertions(+), 468 deletions(-) create mode 100644 src/langbot/pkg/api/http/controller/groups/provider/api_chains.py create mode 100644 src/langbot/pkg/api/http/service/api_chain.py create mode 100644 src/langbot/pkg/entity/persistence/api_chain.py create mode 100644 src/langbot/pkg/persistence/migrations/dbm008_api_chain.py create mode 100644 src/langbot/pkg/persistence/migrations/dbm020_api_chain_model_api_level.py create mode 100644 src/langbot/pkg/persistence/migrations/dbm021_api_chain_health_check_flag.py create mode 100644 src/langbot/pkg/provider/modelmgr/api_chain.py create mode 100644 web/src/app/home/components/api-chains-dialog/APIChainCard.tsx create mode 100644 web/src/app/home/components/api-chains-dialog/APIChainForm.tsx create mode 100644 web/src/app/home/components/api-chains-dialog/APIChainsDialog.tsx create mode 100644 web/src/app/infra/entities/api/api_chain.ts diff --git a/src/langbot/libs/wechatpad_api/util/http_util.py b/src/langbot/libs/wechatpad_api/util/http_util.py index 7390f43ec..447c29df0 100644 --- a/src/langbot/libs/wechatpad_api/util/http_util.py +++ b/src/langbot/libs/wechatpad_api/util/http_util.py @@ -1,5 +1,5 @@ import requests -from langbot.pkg.utils import httpclient +import aiohttp def post_json(base_url, token, data=None): @@ -63,16 +63,16 @@ async def async_request( """ headers = {'Content-Type': 'application/json'} url = f'{base_url}?key={token_key}' - session = httpclient.get_session() - async with session.request( - method=method, url=url, params=params, headers=headers, data=data, json=json - ) as response: - response.raise_for_status() # 如果状态码不是200,抛出异常 - result = await response.json() - # print(result) - return result - # if result.get('Code') == 200: - # - # return await result - # else: - # 
raise RuntimeError("请求失败",response.text) + async with aiohttp.ClientSession() as session: + async with session.request( + method=method, url=url, params=params, headers=headers, data=data, json=json + ) as response: + response.raise_for_status() # 如果状态码不是200,抛出异常 + result = await response.json() + # print(result) + return result + # if result.get('Code') == 200: + # + # return await result + # else: + # raise RuntimeError("请求失败",response.text) diff --git a/src/langbot/pkg/api/http/controller/groups/provider/api_chains.py b/src/langbot/pkg/api/http/controller/groups/provider/api_chains.py new file mode 100644 index 000000000..fd921f135 --- /dev/null +++ b/src/langbot/pkg/api/http/controller/groups/provider/api_chains.py @@ -0,0 +1,41 @@ +"""API Chain HTTP Controller""" + +import quart + +from ... import group + + +@group.group_class('api_chains', '/api/v1/provider/api-chains') +class APIChainRouterGroup(group.RouterGroup): + async def initialize(self) -> None: + @self.route('', methods=['GET', 'POST'], auth_type=group.AuthType.USER_TOKEN_OR_API_KEY) + async def _() -> str: + if quart.request.method == 'GET': + chains = await self.ap.api_chain_service.get_api_chains() + return self.success(data={'chains': chains}) + elif quart.request.method == 'POST': + json_data = await quart.request.json + chain_uuid = await self.ap.api_chain_service.create_api_chain(json_data) + return self.success(data={'uuid': chain_uuid}) + + @self.route('/', methods=['GET', 'PUT', 'DELETE'], auth_type=group.AuthType.USER_TOKEN_OR_API_KEY) + async def _(chain_uuid: str) -> str: + if quart.request.method == 'GET': + chain = await self.ap.api_chain_service.get_api_chain(chain_uuid) + + if chain is None: + return self.http_status(404, -1, 'API chain not found') + + return self.success(data={'chain': chain}) + elif quart.request.method == 'PUT': + json_data = await quart.request.json + await self.ap.api_chain_service.update_api_chain(chain_uuid, json_data) + return self.success() + elif 
quart.request.method == 'DELETE': + await self.ap.api_chain_service.delete_api_chain(chain_uuid) + return self.success() + + @self.route('//test', methods=['POST'], auth_type=group.AuthType.USER_TOKEN_OR_API_KEY) + async def _(chain_uuid: str) -> str: + result = await self.ap.api_chain_service.test_api_chain(chain_uuid) + return self.success(data=result) diff --git a/src/langbot/pkg/api/http/service/api_chain.py b/src/langbot/pkg/api/http/service/api_chain.py new file mode 100644 index 000000000..5d12196cb --- /dev/null +++ b/src/langbot/pkg/api/http/service/api_chain.py @@ -0,0 +1,149 @@ +"""API Chain Service - HTTP service for managing API chains""" + +from __future__ import annotations + +import uuid +from typing import Dict, Any, List +import sqlalchemy + +from ....core import app +from ....entity.persistence import api_chain as api_chain_entity +# NOTE: uuid and sqlalchemy are kept for the read methods; mutations delegate to api_chain_mgr + + +class APIChainService: + """Service for managing API chains""" + + ap: app.Application + + def __init__(self, ap: app.Application) -> None: + self.ap = ap + + async def get_api_chains(self) -> List[Dict[str, Any]]: + """Get all API chains with their statuses""" + result = await self.ap.persistence_mgr.execute_async(sqlalchemy.select(api_chain_entity.APIChain)) + + chains = [] + for chain in result.all(): + # Get status for all providers in this chain + status_result = await self.ap.persistence_mgr.execute_async( + sqlalchemy.select(api_chain_entity.APIChainStatus).where( + api_chain_entity.APIChainStatus.chain_uuid == chain.uuid + ) + ) + + statuses = [] + for status in status_result.all(): + statuses.append( + { + 'provider_uuid': status.provider_uuid, + 'model_name': status.model_name, + 'api_key_index': status.api_key_index, + 'is_healthy': status.is_healthy, + 'failure_count': status.failure_count, + 'last_failure_time': status.last_failure_time.isoformat() if status.last_failure_time else None, + 
'last_success_time': status.last_success_time.isoformat() if status.last_success_time else None, + 'last_health_check_time': status.last_health_check_time.isoformat() + if status.last_health_check_time + else None, + 'last_error_message': status.last_error_message, + 'health_check_last_failed': status.health_check_last_failed, + } + ) + + chains.append( + { + 'uuid': chain.uuid, + 'name': chain.name, + 'description': chain.description, + 'chain_config': chain.chain_config, + 'health_check_interval': chain.health_check_interval, + 'health_check_enabled': chain.health_check_enabled, + 'created_at': chain.created_at.isoformat() if chain.created_at else None, + 'updated_at': chain.updated_at.isoformat() if chain.updated_at else None, + 'statuses': statuses, + } + ) + + return chains + + async def get_api_chain(self, chain_uuid: str) -> Dict[str, Any] | None: + """Get a specific API chain""" + result = await self.ap.persistence_mgr.execute_async( + sqlalchemy.select(api_chain_entity.APIChain).where(api_chain_entity.APIChain.uuid == chain_uuid) + ) + + chain = result.first() + if not chain: + return None + + # Get status for all providers in the chain + status_result = await self.ap.persistence_mgr.execute_async( + sqlalchemy.select(api_chain_entity.APIChainStatus).where( + api_chain_entity.APIChainStatus.chain_uuid == chain_uuid + ) + ) + + statuses = [] + for status in status_result.all(): + statuses.append( + { + 'provider_uuid': status.provider_uuid, + 'model_name': status.model_name, + 'api_key_index': status.api_key_index, + 'is_healthy': status.is_healthy, + 'failure_count': status.failure_count, + 'last_failure_time': status.last_failure_time.isoformat() if status.last_failure_time else None, + 'last_success_time': status.last_success_time.isoformat() if status.last_success_time else None, + 'last_health_check_time': status.last_health_check_time.isoformat() + if status.last_health_check_time + else None, + 'last_error_message': status.last_error_message, + 
'health_check_last_failed': status.health_check_last_failed, + } + ) + + return { + 'uuid': chain.uuid, + 'name': chain.name, + 'description': chain.description, + 'chain_config': chain.chain_config, + 'health_check_interval': chain.health_check_interval, + 'health_check_enabled': chain.health_check_enabled, + 'created_at': chain.created_at.isoformat() if chain.created_at else None, + 'updated_at': chain.updated_at.isoformat() if chain.updated_at else None, + 'statuses': statuses, + } + + async def create_api_chain(self, chain_data: Dict[str, Any]) -> str: + """Create a new API chain""" + chain_data = dict(chain_data) + chain_data.setdefault('uuid', str(uuid.uuid4())) + chain_data.setdefault('chain_config', []) + chain_data.setdefault('health_check_interval', 300) + chain_data.setdefault('health_check_enabled', True) + + # Delegate to manager so in-memory state and health-check task are created + await self.ap.api_chain_mgr.create_chain(chain_data) + return chain_data['uuid'] + + async def update_api_chain(self, chain_uuid: str, chain_data: Dict[str, Any]): + """Update an existing API chain""" + chain_data = dict(chain_data) + chain_data.pop('uuid', None) + chain_data.pop('created_at', None) + chain_data.pop('updated_at', None) + + # Delegate to manager so in-memory state and health-check task are refreshed + await self.ap.api_chain_mgr.update_chain(chain_uuid, chain_data) + + async def delete_api_chain(self, chain_uuid: str): + """Delete an API chain""" + # Delegate to manager which handles both DB deletion and memory/task cleanup + await self.ap.api_chain_mgr.delete_chain(chain_uuid) + + async def test_api_chain(self, chain_uuid: str) -> Dict[str, Any]: + """Test an API chain by making a simple request""" + # This would make a test request through the chain + # For now, just return success + return {'success': True, 'message': 'API chain test not yet implemented'} diff --git a/src/langbot/pkg/api/http/service/space.py b/src/langbot/pkg/api/http/service/space.py 
index c05e4896a..cd6948833 100644 --- a/src/langbot/pkg/api/http/service/space.py +++ b/src/langbot/pkg/api/http/service/space.py @@ -1,6 +1,6 @@ from __future__ import annotations -from langbot.pkg.utils import httpclient +import aiohttp import typing import datetime import time @@ -99,49 +99,49 @@ async def exchange_oauth_code(self, code: str) -> typing.Dict: space_config = self._get_space_config() space_url = space_config['url'] - session = httpclient.get_session() - async with session.post( - f'{space_url}/api/v1/accounts/oauth/token', - json={'code': code, 'instance_id': constants.instance_id}, - ) as response: - if response.status != 200: - raise ValueError(f'Failed to exchange OAuth code: {await response.text()}') - data = await response.json() - if data.get('code') != 0: - raise ValueError(f'Failed to exchange OAuth code: {data.get("msg")}') - return data.get('data', {}) + async with aiohttp.ClientSession() as session: + async with session.post( + f'{space_url}/api/v1/accounts/oauth/token', + json={'code': code, 'instance_id': constants.instance_id}, + ) as response: + if response.status != 200: + raise ValueError(f'Failed to exchange OAuth code: {await response.text()}') + data = await response.json() + if data.get('code') != 0: + raise ValueError(f'Failed to exchange OAuth code: {data.get("msg")}') + return data.get('data', {}) async def refresh_token(self, refresh_token: str) -> typing.Dict: """Refresh Space access token""" space_config = self._get_space_config() space_url = space_config['url'] - session = httpclient.get_session() - async with session.post( - f'{space_url}/api/v1/accounts/token/refresh', json={'refresh_token': refresh_token} - ) as response: - if response.status != 200: - raise ValueError(f'Failed to refresh token: {await response.text()}') - data = await response.json() - if data.get('code') != 0: - raise ValueError(f'Failed to refresh token: {data.get("msg")}') - return data.get('data', {}) + async with aiohttp.ClientSession() as 
session: + async with session.post( + f'{space_url}/api/v1/accounts/token/refresh', json={'refresh_token': refresh_token} + ) as response: + if response.status != 200: + raise ValueError(f'Failed to refresh token: {await response.text()}') + data = await response.json() + if data.get('code') != 0: + raise ValueError(f'Failed to refresh token: {data.get("msg")}') + return data.get('data', {}) async def get_user_info_raw(self, access_token: str) -> typing.Dict: """Get user info from Space using access token (no validation)""" space_config = self._get_space_config() space_url = space_config['url'] - session = httpclient.get_session() - async with session.get( - f'{space_url}/api/v1/accounts/me', headers={'Authorization': f'Bearer {access_token}'} - ) as response: - if response.status != 200: - raise ValueError(f'Failed to get user info: {await response.text()}') - data = await response.json() - if data.get('code') != 0: - raise ValueError(f'Failed to get user info: {data.get("msg")}') - return data.get('data', {}) + async with aiohttp.ClientSession() as session: + async with session.get( + f'{space_url}/api/v1/accounts/me', headers={'Authorization': f'Bearer {access_token}'} + ) as response: + if response.status != 200: + raise ValueError(f'Failed to get user info: {await response.text()}') + data = await response.json() + if data.get('code') != 0: + raise ValueError(f'Failed to get user info: {data.get("msg")}') + return data.get('data', {}) # === API calls with token validation === @@ -178,12 +178,12 @@ async def get_models(self) -> typing.List[SpaceModel]: space_config = self._get_space_config() space_url = space_config['url'] - session = httpclient.get_session() - async with session.get(f'{space_url}/api/v1/models') as response: - if response.status != 200: - raise ValueError(f'Failed to get models: {await response.text()}') - data = await response.json() - if data.get('code') != 0: - raise ValueError(f'Failed to get models: {data.get("msg")}') - models_data = 
data.get('data', {}).get('models', []) - return [SpaceModel.model_validate(model_dict) for model_dict in models_data] + async with aiohttp.ClientSession() as session: + async with session.get(f'{space_url}/api/v1/models') as response: + if response.status != 200: + raise ValueError(f'Failed to get models: {await response.text()}') + data = await response.json() + if data.get('code') != 0: + raise ValueError(f'Failed to get models: {data.get("msg")}') + models_data = data.get('data', {}).get('models', []) + return [SpaceModel.model_validate(model_dict) for model_dict in models_data] diff --git a/src/langbot/pkg/core/app.py b/src/langbot/pkg/core/app.py index 98e886175..a7928341f 100644 --- a/src/langbot/pkg/core/app.py +++ b/src/langbot/pkg/core/app.py @@ -9,6 +9,7 @@ from ..platform.webhook_pusher import WebhookPusher from ..provider.session import sessionmgr as llm_session_mgr from ..provider.modelmgr import modelmgr as llm_model_mgr +from ..provider.modelmgr import api_chain as api_chain_module from langbot.pkg.provider.tools import toolmgr as llm_tool_mgr from ..config import manager as config_mgr from ..command import cmdmgr @@ -30,6 +31,7 @@ from ..api.http.service import apikey as apikey_service from ..api.http.service import webhook as webhook_service from ..api.http.service import monitoring as monitoring_service +from ..api.http.service import api_chain as api_chain_service from ..discover import engine as discover_engine from ..storage import mgr as storagemgr from ..utils import logcache @@ -62,6 +64,8 @@ class Application: model_mgr: llm_model_mgr.ModelManager = None + api_chain_mgr: api_chain_module.APIChainManager = None + rag_mgr: rag_mgr.RAGManager = None rag_runtime_service: RAGRuntimeService = None @@ -151,6 +155,8 @@ class Application: monitoring_service: monitoring_service.MonitoringService = None + api_chain_service: api_chain_service.APIChainService = None + def __init__(self): pass diff --git a/src/langbot/pkg/core/bootutils/deps.py 
b/src/langbot/pkg/core/bootutils/deps.py index 1f6530379..b2508b22e 100644 --- a/src/langbot/pkg/core/bootutils/deps.py +++ b/src/langbot/pkg/core/bootutils/deps.py @@ -1,4 +1,3 @@ -import importlib.util import pip import os from ...utils import pkgmgr @@ -50,10 +49,9 @@ async def check_deps() -> list[str]: missing_deps = [] for dep in required_deps: - # Use find_spec instead of __import__ to avoid actually loading - # all modules into memory. find_spec only checks if the module - # can be found, without executing module-level code. - if importlib.util.find_spec(dep) is None: + try: + __import__(dep) + except ImportError: missing_deps.append(dep) return missing_deps diff --git a/src/langbot/pkg/core/stages/build_app.py b/src/langbot/pkg/core/stages/build_app.py index 62f0ae7b5..d20a1340b 100644 --- a/src/langbot/pkg/core/stages/build_app.py +++ b/src/langbot/pkg/core/stages/build_app.py @@ -10,6 +10,7 @@ from ...command import cmdmgr from ...provider.session import sessionmgr as llm_session_mgr from ...provider.modelmgr import modelmgr as llm_model_mgr +from ...provider.modelmgr import api_chain as api_chain_module from ...provider.tools import toolmgr as llm_tool_mgr from ...rag.knowledge import kbmgr as rag_mgr from ...rag.service import RAGRuntimeService @@ -28,6 +29,7 @@ from ...api.http.service import apikey as apikey_service from ...api.http.service import webhook as webhook_service from ...api.http.service import monitoring as monitoring_service +from ...api.http.service import api_chain as api_chain_service from ...discover import engine as discover_engine from ...storage import mgr as storagemgr from ...utils import logcache @@ -121,6 +123,10 @@ async def run(self, ap: app.Application): ap.model_mgr = llm_model_mgr_inst await llm_model_mgr_inst.initialize() + api_chain_mgr_inst = api_chain_module.APIChainManager(ap) + ap.api_chain_mgr = api_chain_mgr_inst + await api_chain_mgr_inst.initialize() + llm_session_mgr_inst = llm_session_mgr.SessionManager(ap) 
await llm_session_mgr_inst.initialize() ap.sess_mgr = llm_session_mgr_inst @@ -164,6 +170,9 @@ async def run(self, ap: app.Application): monitoring_service_inst = monitoring_service.MonitoringService(ap) ap.monitoring_service = monitoring_service_inst + api_chain_service_inst = api_chain_service.APIChainService(ap) + ap.api_chain_service = api_chain_service_inst + async def runtime_disconnect_callback(connector: plugin_connector.PluginRuntimeConnector) -> None: await asyncio.sleep(3) await plugin_connector_inst.initialize() diff --git a/src/langbot/pkg/entity/persistence/api_chain.py b/src/langbot/pkg/entity/persistence/api_chain.py new file mode 100644 index 000000000..b40903008 --- /dev/null +++ b/src/langbot/pkg/entity/persistence/api_chain.py @@ -0,0 +1,98 @@ +import sqlalchemy +from sqlalchemy import JSON, Integer, String, DateTime, Boolean +from .base import Base + + +class APIChain(Base): + """API Chain - manages multiple API providers with priority and failover""" + + __tablename__ = 'api_chains' + + uuid = sqlalchemy.Column(String(255), primary_key=True, unique=True) + name = sqlalchemy.Column(String(255), nullable=False) + description = sqlalchemy.Column(String(512), nullable=True) + + # Chain configuration + chain_config = sqlalchemy.Column(JSON, nullable=False, default=list) + """ + List of API chain items: + [ + { + "provider_uuid": "xxx", + "priority": 1, // provider priority in the chain + "is_aggregated": false, + "max_retries": 3, + "timeout_ms": 30000, + "model_configs": [ // optional: per-model priority config + { + "model_name": "gpt-4o", // model name (as in LLMModel.name) + "priority": 1, // model priority within this provider + "api_key_indices": [ // optional: per-API-key priority + {"index": 0, "priority": 1}, + {"index": 1, "priority": 2} + ] + } + ] + }, + ... + ] + If model_configs is empty/absent, the chain uses the query's original model + with round-robin API key rotation. 
If api_key_indices is empty/absent for a + model config, round-robin rotation is used for that model. + """ + + # Health check configuration + health_check_interval = sqlalchemy.Column(Integer, nullable=False, default=300) + """Health check interval in seconds for failed APIs""" + + health_check_enabled = sqlalchemy.Column(Boolean, nullable=False, default=True) + """Whether to enable automatic health check for failed APIs""" + + # Metadata + created_at = sqlalchemy.Column(DateTime, nullable=False, server_default=sqlalchemy.func.now()) + updated_at = sqlalchemy.Column( + DateTime, + nullable=False, + server_default=sqlalchemy.func.now(), + onupdate=sqlalchemy.func.now(), + ) + + +class APIChainStatus(Base): + """API Chain Status - tracks the health status of APIs in chains""" + + __tablename__ = 'api_chain_status' + + uuid = sqlalchemy.Column(String(255), primary_key=True, unique=True) + chain_uuid = sqlalchemy.Column(String(255), nullable=False, index=True) + provider_uuid = sqlalchemy.Column(String(255), nullable=False, index=True) + + # Granularity: model-level and API-key-level tracking + model_name = sqlalchemy.Column(String(255), nullable=True, index=True) + """Model name (from LLMModel.name); NULL means provider-level status""" + + api_key_index = sqlalchemy.Column(Integer, nullable=True) + """Index into the provider's api_keys list; NULL means all/round-robin""" + + # Status tracking + is_healthy = sqlalchemy.Column(Boolean, nullable=False, default=True) + failure_count = sqlalchemy.Column(Integer, nullable=False, default=0) + last_failure_time = sqlalchemy.Column(DateTime, nullable=True) + last_success_time = sqlalchemy.Column(DateTime, nullable=True) + last_health_check_time = sqlalchemy.Column(DateTime, nullable=True) + + # Error information + last_error_message = sqlalchemy.Column(String(1024), nullable=True) + + health_check_last_failed = sqlalchemy.Column(Boolean, nullable=False, default=False) + """True when the last health-check probe itself failed 
(not a normal request failure). + Is_healthy remains False while this is True. Does NOT increment failure_count.""" + + # Metadata + created_at = sqlalchemy.Column(DateTime, nullable=False, server_default=sqlalchemy.func.now()) + updated_at = sqlalchemy.Column( + DateTime, + nullable=False, + server_default=sqlalchemy.func.now(), + onupdate=sqlalchemy.func.now(), + ) diff --git a/src/langbot/pkg/persistence/migrations/dbm008_api_chain.py b/src/langbot/pkg/persistence/migrations/dbm008_api_chain.py new file mode 100644 index 000000000..931a36322 --- /dev/null +++ b/src/langbot/pkg/persistence/migrations/dbm008_api_chain.py @@ -0,0 +1,46 @@ +"""Database migration for API Chain feature""" + +from sqlalchemy import text + + +async def migrate(ap): + """Add API chain tables""" + + # Create api_chains table + await ap.persistence_mgr.execute_async( + text(""" + CREATE TABLE IF NOT EXISTS api_chains ( + uuid VARCHAR(255) PRIMARY KEY, + name VARCHAR(255) NOT NULL, + description VARCHAR(512), + chain_config JSON NOT NULL, + health_check_interval INTEGER NOT NULL DEFAULT 300, + health_check_enabled BOOLEAN NOT NULL DEFAULT 1, + created_at DATETIME NOT NULL DEFAULT CURRENT_TIMESTAMP, + updated_at DATETIME NOT NULL DEFAULT CURRENT_TIMESTAMP + ) + """) + ) + + # Create api_chain_status table + await ap.persistence_mgr.execute_async( + text(""" + CREATE TABLE IF NOT EXISTS api_chain_status ( + uuid VARCHAR(255) PRIMARY KEY, + chain_uuid VARCHAR(255) NOT NULL, + provider_uuid VARCHAR(255) NOT NULL, + is_healthy BOOLEAN NOT NULL DEFAULT 1, + failure_count INTEGER NOT NULL DEFAULT 0, + last_failure_time DATETIME, + last_success_time DATETIME, + last_health_check_time DATETIME, + last_error_message VARCHAR(1024), + created_at DATETIME NOT NULL DEFAULT CURRENT_TIMESTAMP, + updated_at DATETIME NOT NULL DEFAULT CURRENT_TIMESTAMP, + INDEX idx_chain_uuid (chain_uuid), + INDEX idx_provider_uuid (provider_uuid) + ) + """) + ) + + ap.logger.info('API Chain tables created successfully') diff 
--git a/src/langbot/pkg/persistence/migrations/dbm020_api_chain_model_api_level.py b/src/langbot/pkg/persistence/migrations/dbm020_api_chain_model_api_level.py new file mode 100644 index 000000000..861d7b840 --- /dev/null +++ b/src/langbot/pkg/persistence/migrations/dbm020_api_chain_model_api_level.py @@ -0,0 +1,39 @@ +import sqlalchemy +from .. import migration + + +@migration.migration_class(20) +class DBMigrateAPIChainModelAPILevel(migration.DBMigration): + """Add model_name and api_key_index columns to api_chain_status for per-model/api-key health tracking""" + + async def upgrade(self): + """Upgrade""" + try: + await self.ap.persistence_mgr.execute_async( + sqlalchemy.text('ALTER TABLE api_chain_status ADD COLUMN model_name VARCHAR(255) DEFAULT NULL') + ) + except Exception: + pass + + try: + await self.ap.persistence_mgr.execute_async( + sqlalchemy.text('ALTER TABLE api_chain_status ADD COLUMN api_key_index INTEGER DEFAULT NULL') + ) + except Exception: + pass + + async def downgrade(self): + """Downgrade""" + try: + await self.ap.persistence_mgr.execute_async( + sqlalchemy.text('ALTER TABLE api_chain_status DROP COLUMN model_name') + ) + except Exception: + pass + + try: + await self.ap.persistence_mgr.execute_async( + sqlalchemy.text('ALTER TABLE api_chain_status DROP COLUMN api_key_index') + ) + except Exception: + pass diff --git a/src/langbot/pkg/persistence/migrations/dbm021_api_chain_health_check_flag.py b/src/langbot/pkg/persistence/migrations/dbm021_api_chain_health_check_flag.py new file mode 100644 index 000000000..d4d9a1c87 --- /dev/null +++ b/src/langbot/pkg/persistence/migrations/dbm021_api_chain_health_check_flag.py @@ -0,0 +1,27 @@ +import sqlalchemy +from .. 
import migration + + +@migration.migration_class(21) +class DBMigrateAPIChainHealthCheckFlag(migration.DBMigration): + """Add health_check_last_failed column to api_chain_status""" + + async def upgrade(self): + """Upgrade""" + try: + await self.ap.persistence_mgr.execute_async( + sqlalchemy.text( + 'ALTER TABLE api_chain_status ADD COLUMN health_check_last_failed BOOLEAN NOT NULL DEFAULT 0' + ) + ) + except Exception: + pass + + async def downgrade(self): + """Downgrade""" + try: + await self.ap.persistence_mgr.execute_async( + sqlalchemy.text('ALTER TABLE api_chain_status DROP COLUMN health_check_last_failed') + ) + except Exception: + pass diff --git a/src/langbot/pkg/pipeline/cntfilter/filters/baiduexamine.py b/src/langbot/pkg/pipeline/cntfilter/filters/baiduexamine.py index a376310f6..4213e662b 100644 --- a/src/langbot/pkg/pipeline/cntfilter/filters/baiduexamine.py +++ b/src/langbot/pkg/pipeline/cntfilter/filters/baiduexamine.py @@ -1,9 +1,10 @@ from __future__ import annotations +import aiohttp + from .. import entities from .. 
import filter as filter_model import langbot_plugin.api.entities.builtin.pipeline.query as pipeline_query -from langbot.pkg.utils import httpclient BAIDU_EXAMINE_URL = 'https://aip.baidubce.com/rest/2.0/solution/v1/text_censor/v2/user_defined?access_token={}' BAIDU_EXAMINE_TOKEN_URL = 'https://aip.baidubce.com/oauth/2.0/token' @@ -14,50 +15,50 @@ class BaiduCloudExamine(filter_model.ContentFilter): """百度云内容审核""" async def _get_token(self) -> str: - session = httpclient.get_session() - async with session.post( - BAIDU_EXAMINE_TOKEN_URL, - params={ - 'grant_type': 'client_credentials', - 'client_id': self.ap.pipeline_cfg.data['baidu-cloud-examine']['api-key'], - 'client_secret': self.ap.pipeline_cfg.data['baidu-cloud-examine']['api-secret'], - }, - ) as resp: - return (await resp.json())['access_token'] + async with aiohttp.ClientSession() as session: + async with session.post( + BAIDU_EXAMINE_TOKEN_URL, + params={ + 'grant_type': 'client_credentials', + 'client_id': self.ap.pipeline_cfg.data['baidu-cloud-examine']['api-key'], + 'client_secret': self.ap.pipeline_cfg.data['baidu-cloud-examine']['api-secret'], + }, + ) as resp: + return (await resp.json())['access_token'] async def process(self, query: pipeline_query.Query, message: str) -> entities.FilterResult: - session = httpclient.get_session() - async with session.post( - BAIDU_EXAMINE_URL.format(await self._get_token()), - headers={ - 'Content-Type': 'application/x-www-form-urlencoded', - 'Accept': 'application/json', - }, - data=f'text={message}'.encode('utf-8'), - ) as resp: - result = await resp.json() - - if 'error_code' in result: - return entities.FilterResult( - level=entities.ResultLevel.BLOCK, - replacement=message, - user_notice='', - console_notice=f'百度云判定出错,错误信息:{result["error_msg"]}', - ) - else: - conclusion = result['conclusion'] - - if conclusion in ('合规'): + async with aiohttp.ClientSession() as session: + async with session.post( + BAIDU_EXAMINE_URL.format(await self._get_token()), + headers={ 
+ 'Content-Type': 'application/x-www-form-urlencoded', + 'Accept': 'application/json', + }, + data=f'text={message}'.encode('utf-8'), + ) as resp: + result = await resp.json() + + if 'error_code' in result: return entities.FilterResult( - level=entities.ResultLevel.PASS, + level=entities.ResultLevel.BLOCK, replacement=message, user_notice='', - console_notice=f'百度云判定结果:{conclusion}', + console_notice=f'百度云判定出错,错误信息:{result["error_msg"]}', ) else: - return entities.FilterResult( - level=entities.ResultLevel.BLOCK, - replacement=message, - user_notice='消息中存在不合适的内容, 请修改', - console_notice=f'百度云判定结果:{conclusion}', - ) + conclusion = result['conclusion'] + + if conclusion in ('合规'): + return entities.FilterResult( + level=entities.ResultLevel.PASS, + replacement=message, + user_notice='', + console_notice=f'百度云判定结果:{conclusion}', + ) + else: + return entities.FilterResult( + level=entities.ResultLevel.BLOCK, + replacement=message, + user_notice='消息中存在不合适的内容, 请修改', + console_notice=f'百度云判定结果:{conclusion}', + ) diff --git a/src/langbot/pkg/pipeline/preproc/preproc.py b/src/langbot/pkg/pipeline/preproc/preproc.py index cd039d796..9cf4d8b93 100644 --- a/src/langbot/pkg/pipeline/preproc/preproc.py +++ b/src/langbot/pkg/pipeline/preproc/preproc.py @@ -36,17 +36,20 @@ async def process( session = await self.ap.sess_mgr.get_session(query) # When not local-agent, llm_model is None - try: - llm_model = ( - await self.ap.model_mgr.get_model_by_uuid(query.pipeline_config['ai']['local-agent']['model']) - if selected_runner == 'local-agent' - else None - ) - except ValueError: - self.ap.logger.warning( - f'LLM model {query.pipeline_config["ai"]["local-agent"]["model"] + " "}not found or not configured' - ) - llm_model = None + llm_model = None + use_api_chain_uuid = None + if selected_runner == 'local-agent': + model_value = query.pipeline_config['ai']['local-agent'].get('model', '') + if model_value: + try: + llm_model = await self.ap.model_mgr.get_model_by_uuid(model_value) + 
except ValueError: + # Not a model UUID — try as API chain UUID + chain = await self.ap.api_chain_mgr.get_chain(model_value) + if chain: + use_api_chain_uuid = model_value + else: + self.ap.logger.warning(f'LLM model/chain {model_value} not found or not configured') conversation = await self.ap.sess_mgr.get_conversation( query, @@ -61,19 +64,28 @@ async def process( query.prompt = conversation.prompt.copy() query.messages = conversation.messages.copy() - if selected_runner == 'local-agent' and llm_model: + if selected_runner == 'local-agent': query.use_funcs = [] - query.use_llm_model_uuid = llm_model.model_entity.uuid - - if llm_model.model_entity.abilities.__contains__('func_call'): - # Get bound plugins and MCP servers for filtering tools + if llm_model: + query.use_llm_model_uuid = llm_model.model_entity.uuid + + if llm_model.model_entity.abilities.__contains__('func_call'): + # Get bound plugins and MCP servers for filtering tools + bound_plugins = query.variables.get('_pipeline_bound_plugins', None) + bound_mcp_servers = query.variables.get('_pipeline_bound_mcp_servers', None) + query.use_funcs = await self.ap.tool_mgr.get_all_tools(bound_plugins, bound_mcp_servers) + + self.ap.logger.debug(f'Bound plugins: {bound_plugins}') + self.ap.logger.debug(f'Bound MCP servers: {bound_mcp_servers}') + self.ap.logger.debug(f'Use funcs: {query.use_funcs}') + + elif use_api_chain_uuid: + query.variables['_use_api_chain_uuid'] = use_api_chain_uuid + # Enable all tools for chain; individual models will decide capability bound_plugins = query.variables.get('_pipeline_bound_plugins', None) bound_mcp_servers = query.variables.get('_pipeline_bound_mcp_servers', None) query.use_funcs = await self.ap.tool_mgr.get_all_tools(bound_plugins, bound_mcp_servers) - - self.ap.logger.debug(f'Bound plugins: {bound_plugins}') - self.ap.logger.debug(f'Bound MCP servers: {bound_mcp_servers}') - self.ap.logger.debug(f'Use funcs: {query.use_funcs}') + self.ap.logger.debug(f'Using API chain 
{use_api_chain_uuid} for local-agent') sender_name = '' diff --git a/src/langbot/pkg/platform/sources/discord.py b/src/langbot/pkg/platform/sources/discord.py index e9cc7a37e..cb80ce48e 100644 --- a/src/langbot/pkg/platform/sources/discord.py +++ b/src/langbot/pkg/platform/sources/discord.py @@ -14,7 +14,7 @@ import asyncio from enum import Enum -from langbot.pkg.utils import httpclient +import aiohttp import pydantic import langbot_plugin.api.definition.abstract.platform.adapter as abstract_platform_adapter @@ -622,23 +622,23 @@ async def yiri2target( image_bytes = base64.b64decode(base64_data) elif ele.url: # 从URL下载图片 - session = httpclient.get_session() - async with session.get(ele.url) as response: - image_bytes = await response.read() - # 从URL或Content-Type推断文件类型 - content_type = response.headers.get('Content-Type', '') - if 'jpeg' in content_type or 'jpg' in content_type: - filename = f'{uuid.uuid4()}.jpg' - elif 'gif' in content_type: - filename = f'{uuid.uuid4()}.gif' - elif 'webp' in content_type: - filename = f'{uuid.uuid4()}.webp' - elif ele.url.lower().endswith(('.jpg', '.jpeg')): - filename = f'{uuid.uuid4()}.jpg' - elif ele.url.lower().endswith('.gif'): - filename = f'{uuid.uuid4()}.gif' - elif ele.url.lower().endswith('.webp'): - filename = f'{uuid.uuid4()}.webp' + async with aiohttp.ClientSession() as session: + async with session.get(ele.url) as response: + image_bytes = await response.read() + # 从URL或Content-Type推断文件类型 + content_type = response.headers.get('Content-Type', '') + if 'jpeg' in content_type or 'jpg' in content_type: + filename = f'{uuid.uuid4()}.jpg' + elif 'gif' in content_type: + filename = f'{uuid.uuid4()}.gif' + elif 'webp' in content_type: + filename = f'{uuid.uuid4()}.webp' + elif ele.url.lower().endswith(('.jpg', '.jpeg')): + filename = f'{uuid.uuid4()}.jpg' + elif ele.url.lower().endswith('.gif'): + filename = f'{uuid.uuid4()}.gif' + elif ele.url.lower().endswith('.webp'): + filename = f'{uuid.uuid4()}.webp' elif ele.path: # 
从文件路径读取图片 # 确保路径没有空字节 @@ -702,9 +702,9 @@ async def yiri2target( file_base64 = ele.base64.split(',')[-1] file_bytes = base64.b64decode(file_base64) elif ele.url: - session = httpclient.get_session() - async with session.get(ele.url) as response: - file_bytes = await response.read() + async with aiohttp.ClientSession() as session: + async with session.get(ele.url) as response: + file_bytes = await response.read() if file_bytes: files.append(discord.File(fp=io.BytesIO(file_bytes), filename=filename)) elif isinstance(ele, platform_message.File): @@ -717,9 +717,9 @@ async def yiri2target( else: file_bytes = base64.b64decode(ele.base64) elif ele.url: - session = httpclient.get_session() - async with session.get(ele.url) as response: - file_bytes = await response.read() + async with aiohttp.ClientSession() as session: + async with session.get(ele.url) as response: + file_bytes = await response.read() if file_bytes: files.append(discord.File(fp=io.BytesIO(file_bytes), filename=filename)) elif isinstance(ele, platform_message.Forward): @@ -775,12 +775,12 @@ def text_element_recur( # attachments for attachment in message.attachments: - session = httpclient.get_session(trust_env=True) - async with session.get(attachment.url) as response: - image_data = await response.read() - image_base64 = base64.b64encode(image_data).decode('utf-8') - image_format = response.headers['Content-Type'] - element_list.append(platform_message.Image(base64=f'data:{image_format};base64,{image_base64}')) + async with aiohttp.ClientSession(trust_env=True) as session: + async with session.get(attachment.url) as response: + image_data = await response.read() + image_base64 = base64.b64encode(image_data).decode('utf-8') + image_format = response.headers['Content-Type'] + element_list.append(platform_message.Image(base64=f'data:{image_format};base64,{image_base64}')) return platform_message.MessageChain(element_list) diff --git a/src/langbot/pkg/platform/sources/kook.py 
b/src/langbot/pkg/platform/sources/kook.py index 5a6bade36..17777a95e 100644 --- a/src/langbot/pkg/platform/sources/kook.py +++ b/src/langbot/pkg/platform/sources/kook.py @@ -9,8 +9,6 @@ import time import aiohttp - -from langbot.pkg.utils import httpclient import websockets import pydantic @@ -122,16 +120,16 @@ async def target2yiri(kook_message: dict, bot_account_id: str = '') -> platform_ if content: # Download image and convert to base64 try: - session = httpclient.get_session() - async with session.get(content) as response: - if response.status == 200: - image_bytes = await response.read() - image_base64 = base64.b64encode(image_bytes).decode('utf-8') - # Detect image format - content_type = response.headers.get('Content-Type', 'image/png') - components.append( - platform_message.Image(base64=f'data:{content_type};base64,{image_base64}') - ) + async with aiohttp.ClientSession() as session: + async with session.get(content) as response: + if response.status == 200: + image_bytes = await response.read() + image_base64 = base64.b64encode(image_bytes).decode('utf-8') + # Detect image format + content_type = response.headers.get('Content-Type', 'image/png') + components.append( + platform_message.Image(base64=f'data:{content_type};base64,{image_base64}') + ) except Exception: # If download fails, just add as plain text components.append(platform_message.Plain(text=f'[Image: {content}]')) @@ -297,17 +295,17 @@ async def _get_gateway_url(self) -> str: 'Authorization': f'Bot {self.config["token"]}', } - session = httpclient.get_session() - async with session.get(base_url, params=params, headers=headers) as response: - if response.status == 200: - data = await response.json() - if data.get('code') == 0: - gateway_url = data['data']['url'] - return gateway_url + async with aiohttp.ClientSession() as session: + async with session.get(base_url, params=params, headers=headers) as response: + if response.status == 200: + data = await response.json() + if data.get('code') == 
0: + gateway_url = data['data']['url'] + return gateway_url + else: + raise Exception(f'Failed to get gateway URL: {data.get("message")}') else: - raise Exception(f'Failed to get gateway URL: {data.get("message")}') - else: - raise Exception(f'Failed to get gateway URL: HTTP {response.status}') + raise Exception(f'Failed to get gateway URL: HTTP {response.status}') async def _get_bot_user_info(self) -> dict: """Get bot's own user information from KOOK API""" @@ -317,17 +315,17 @@ async def _get_bot_user_info(self) -> dict: 'Authorization': f'Bot {self.config["token"]}', } - session = httpclient.get_session() - async with session.get(base_url, headers=headers) as response: - if response.status == 200: - data = await response.json() - if data.get('code') == 0: - user_info = data['data'] - return user_info + async with aiohttp.ClientSession() as session: + async with session.get(base_url, headers=headers) as response: + if response.status == 200: + data = await response.json() + if data.get('code') == 0: + user_info = data['data'] + return user_info + else: + raise Exception(f'Failed to get bot user info: {data.get("message")}') else: - raise Exception(f'Failed to get bot user info: {data.get("message")}') - else: - raise Exception(f'Failed to get bot user info: HTTP {response.status}') + raise Exception(f'Failed to get bot user info: HTTP {response.status}') async def _handle_hello(self, data: dict): """Handle HELLO signal (signal 1)""" @@ -512,7 +510,7 @@ async def send_message(self, target_type: str, target_id: str, message: platform try: if not self.http_session: - self.http_session = httpclient.get_session() + self.http_session = aiohttp.ClientSession() async with self.http_session.post(url, json=payload, headers=headers) as response: if response.status == 200: @@ -578,7 +576,7 @@ async def reply_message( try: if not self.http_session: - self.http_session = httpclient.get_session() + self.http_session = aiohttp.ClientSession() async with 
self.http_session.post(url, json=payload, headers=headers) as response: if response.status == 200: @@ -626,7 +624,7 @@ async def run_async(self): try: # Create HTTP session - self.http_session = httpclient.get_session() + self.http_session = aiohttp.ClientSession() await self.logger.info('Starting KOOK adapter') diff --git a/src/langbot/pkg/platform/sources/lark.py b/src/langbot/pkg/platform/sources/lark.py index 3ce4280cd..ce5277311 100644 --- a/src/langbot/pkg/platform/sources/lark.py +++ b/src/langbot/pkg/platform/sources/lark.py @@ -17,7 +17,7 @@ import os import mimetypes -from langbot.pkg.utils import httpclient +import aiohttp import lark_oapi.ws.exception import quart from lark_oapi.api.im.v1 import * @@ -78,13 +78,13 @@ async def upload_image_to_lark(msg: platform_message.Image, api_client: lark_oap return None elif msg.url: try: - session = httpclient.get_session() - async with session.get(msg.url) as response: - if response.status == 200: - image_bytes = await response.read() - else: - print(f'Failed to download image from {msg.url}: HTTP {response.status}') - return None + async with aiohttp.ClientSession() as session: + async with session.get(msg.url) as response: + if response.status == 200: + image_bytes = await response.read() + else: + print(f'Failed to download image from {msg.url}: HTTP {response.status}') + return None except Exception as e: print(f'Failed to download image from {msg.url}: {e}') traceback.print_exc() @@ -208,10 +208,10 @@ async def _get_media_bytes( pass elif msg.url: try: - session = httpclient.get_session() - async with session.get(msg.url) as resp: - if resp.status == 200: - data = await resp.read() + async with aiohttp.ClientSession() as session: + async with session.get(msg.url) as resp: + if resp.status == 200: + data = await resp.read() except Exception: pass elif msg.path: diff --git a/src/langbot/pkg/platform/sources/legacy/gewechat.py b/src/langbot/pkg/platform/sources/legacy/gewechat.py index 68e1bdedd..93bef53cb 
100644 --- a/src/langbot/pkg/platform/sources/legacy/gewechat.py +++ b/src/langbot/pkg/platform/sources/legacy/gewechat.py @@ -9,7 +9,7 @@ import threading import quart -from langbot.pkg.utils import httpclient +import aiohttp import langbot_plugin.api.definition.abstract.platform.adapter as abstract_platform_adapter from ....core import app @@ -639,14 +639,14 @@ def unregister_listener( async def run_async(self): if not self.config['token']: - session = httpclient.get_session() - async with session.post( - f'{self.config["gewechat_url"]}/v2/api/tools/getTokenId', - json={'app_id': self.config['app_id']}, - ) as response: - if response.status != 200: - raise Exception(f'获取gewechat token失败: {await response.text()}') - self.config['token'] = (await response.json())['data'] + async with aiohttp.ClientSession() as session: + async with session.post( + f'{self.config["gewechat_url"]}/v2/api/tools/getTokenId', + json={'app_id': self.config['app_id']}, + ) as response: + if response.status != 200: + raise Exception(f'获取gewechat token失败: {await response.text()}') + self.config['token'] = (await response.json())['data'] self.bot = gewechat_client.GewechatClient(f'{self.config["gewechat_url"]}/v2/api', self.config['token']) diff --git a/src/langbot/pkg/platform/sources/telegram.py b/src/langbot/pkg/platform/sources/telegram.py index d43b9333c..c2b2fd032 100644 --- a/src/langbot/pkg/platform/sources/telegram.py +++ b/src/langbot/pkg/platform/sources/telegram.py @@ -10,9 +10,9 @@ import typing import traceback import base64 +import aiohttp import pydantic -from langbot.pkg.utils import httpclient import langbot_plugin.api.definition.abstract.platform.adapter as abstract_platform_adapter import langbot_plugin.api.entities.builtin.platform.message as platform_message import langbot_plugin.api.entities.builtin.platform.events as platform_events @@ -34,9 +34,9 @@ async def yiri2target(message_chain: platform_message.MessageChain, bot: telegra if component.base64: photo_bytes = 
base64.b64decode(component.base64) elif component.url: - session = httpclient.get_session() - async with session.get(component.url) as response: - photo_bytes = await response.read() + async with aiohttp.ClientSession() as session: + async with session.get(component.url) as response: + photo_bytes = await response.read() elif component.path: with open(component.path, 'rb') as f: photo_bytes = f.read() @@ -75,9 +75,10 @@ def parse_message_text(text: str) -> list[platform_message.MessageComponent]: file_bytes = None file_format = '' - async with httpclient.get_session(trust_env=True).get(file.file_path) as response: - file_bytes = await response.read() - file_format = 'image/jpeg' + async with aiohttp.ClientSession(trust_env=True) as session: + async with session.get(file.file_path) as response: + file_bytes = await response.read() + file_format = 'image/jpeg' message_components.append( platform_message.Image( @@ -94,8 +95,9 @@ def parse_message_text(text: str) -> list[platform_message.MessageComponent]: file_bytes = None file_format = message.voice.mime_type or 'audio/ogg' - async with httpclient.get_session(trust_env=True).get(file.file_path) as response: - file_bytes = await response.read() + async with aiohttp.ClientSession(trust_env=True) as session: + async with session.get(file.file_path) as response: + file_bytes = await response.read() message_components.append( platform_message.Voice( @@ -193,31 +195,7 @@ async def telegram_callback(update: Update, context: ContextTypes.DEFAULT_TYPE): ) async def send_message(self, target_type: str, target_id: str, message: platform_message.MessageChain): - components = await TelegramMessageConverter.yiri2target(message, self.bot) - - chat_id_str, _, thread_id_str = str(target_id).partition('#') - chat_id: int | str = int(chat_id_str) if chat_id_str.lstrip('-').isdigit() else chat_id_str - message_thread_id = int(thread_id_str) if thread_id_str and thread_id_str.isdigit() else None - - for component in components: - 
component_type = component.get('type') - args = {'chat_id': chat_id} - if message_thread_id is not None: - args['message_thread_id'] = message_thread_id - - if component_type == 'text': - text = component.get('text', '') - if self.config['markdown_card'] is True: - text = telegramify_markdown.markdownify(content=text) - args['parse_mode'] = 'MarkdownV2' - args['text'] = text - await self.bot.send_message(**args) - elif component_type == 'photo': - photo = component.get('photo') - if photo is None: - continue - args['photo'] = telegram.InputFile(photo) - await self.bot.send_photo(**args) + pass async def reply_message( self, diff --git a/src/langbot/pkg/platform/webhook_pusher.py b/src/langbot/pkg/platform/webhook_pusher.py index f3cf39b27..5a8d25644 100644 --- a/src/langbot/pkg/platform/webhook_pusher.py +++ b/src/langbot/pkg/platform/webhook_pusher.py @@ -3,8 +3,6 @@ import asyncio import logging import aiohttp - -from langbot.pkg.utils import httpclient import uuid from typing import TYPE_CHECKING @@ -121,23 +119,23 @@ async def _push_to_webhook(self, url: str, payload: dict) -> dict | None: dict | None: The response JSON if successful, None otherwise """ try: - session = httpclient.get_session() - async with session.post( - url, - json=payload, - headers={'Content-Type': 'application/json'}, - timeout=aiohttp.ClientTimeout(total=15), - ) as response: - if response.status >= 400: - self.logger.warning(f'Webhook {url} returned status {response.status}') - return None - else: - self.logger.debug(f'Successfully pushed to webhook {url}') - try: - return await response.json() - except Exception as json_error: - self.logger.debug(f'Failed to parse JSON response from webhook {url}: {json_error}') + async with aiohttp.ClientSession() as session: + async with session.post( + url, + json=payload, + headers={'Content-Type': 'application/json'}, + timeout=aiohttp.ClientTimeout(total=15), + ) as response: + if response.status >= 400: + self.logger.warning(f'Webhook {url} 
returned status {response.status}') return None + else: + self.logger.debug(f'Successfully pushed to webhook {url}') + try: + return await response.json() + except Exception as json_error: + self.logger.debug(f'Failed to parse JSON response from webhook {url}: {json_error}') + return None except asyncio.TimeoutError: self.logger.warning(f'Timeout pushing to webhook {url}') return None diff --git a/src/langbot/pkg/provider/modelmgr/api_chain.py b/src/langbot/pkg/provider/modelmgr/api_chain.py new file mode 100644 index 000000000..dc9316c77 --- /dev/null +++ b/src/langbot/pkg/provider/modelmgr/api_chain.py @@ -0,0 +1,757 @@ +"""API Chain Manager - handles API failover and health checking. + +chain_config item schema (per provider entry): +{ + "provider_uuid": "xxx", + "priority": 1, # provider priority in the chain (lower = higher priority) + "is_aggregated": false, + "max_retries": 3, + "timeout_ms": 30000, + "model_configs": [ # optional: per-model configuration + { + "model_name": "gpt-4o", # model name as stored in LLMModel.name + "priority": 1, # priority within this provider + "api_key_indices": [ # optional: per-API-key priority + {"index": 0, "priority": 1}, + {"index": 1, "priority": 2} + ] + } + ] +} +If model_configs is absent, the original query model is used with round-robin keys. +If api_key_indices is absent for a model config, round-robin rotation is used. +""" + +from __future__ import annotations + +import asyncio +import uuid as uuid_lib +from datetime import datetime +from typing import List, Dict, Any, Optional, Tuple, AsyncGenerator + +import sqlalchemy +from ...core import app +from ...entity.persistence import api_chain as api_chain_entity +from . import requester +from . 
import token + +import langbot_plugin.api.entities.builtin.pipeline.query as pipeline_query +import langbot_plugin.api.entities.builtin.provider.message as provider_message +import langbot_plugin.api.entities.builtin.resource.tool as resource_tool + + +class APIChainManager: + """Manages API chains with per-model/per-API-key failover and health checking""" + + def __init__(self, ap: app.Application): + self.ap = ap + self.chains: Dict[str, api_chain_entity.APIChain] = {} + self.health_check_tasks: Dict[str, asyncio.Task] = {} + + async def initialize(self): + """Initialize API chain manager""" + await self.load_chains_from_db() + await self.start_health_check_tasks() + + async def load_chains_from_db(self): + """Load all API chains from database""" + result = await self.ap.persistence_mgr.execute_async(sqlalchemy.select(api_chain_entity.APIChain)) + for row in result.all(): + # result.all() returns read-only Row objects; wrap them in mutable instances + chain = api_chain_entity.APIChain( + uuid=row.uuid, + name=row.name, + description=row.description, + chain_config=row.chain_config, + health_check_interval=row.health_check_interval, + health_check_enabled=row.health_check_enabled, + ) + self.chains[chain.uuid] = chain + + async def start_health_check_tasks(self): + """Start background health check tasks for all chains""" + for chain_uuid, chain in self.chains.items(): + if chain.health_check_enabled: + task = asyncio.create_task(self._health_check_loop(chain_uuid)) + self.health_check_tasks[chain_uuid] = task + + async def stop_health_check_tasks(self): + """Stop all health check tasks""" + for task in self.health_check_tasks.values(): + task.cancel() + self.health_check_tasks.clear() + + # ==================== Health Check ==================== + + async def _health_check_loop(self, chain_uuid: str): + """Background loop for health checking failed APIs. 
+ + An immediate check is performed on startup so that pre-existing + unhealthy records are evaluated without waiting for the full interval. + """ + # Immediate check on start + try: + await self._perform_health_checks(chain_uuid) + except asyncio.CancelledError: + return + except Exception as e: + self.ap.logger.error(f'Initial health check error for chain {chain_uuid}: {e}') + + while True: + try: + chain = self.chains.get(chain_uuid) + if not chain or not chain.health_check_enabled: + break + await asyncio.sleep(chain.health_check_interval) + await self._perform_health_checks(chain_uuid) + except asyncio.CancelledError: + break + except Exception as e: + self.ap.logger.error(f'Health check loop error for chain {chain_uuid}: {e}') + await asyncio.sleep(60) + + async def _perform_health_checks(self, chain_uuid: str): + """Perform health checks on all unhealthy status records in a chain""" + result = await self.ap.persistence_mgr.execute_async( + sqlalchemy.select(api_chain_entity.APIChainStatus).where( + sqlalchemy.and_( + api_chain_entity.APIChainStatus.chain_uuid == chain_uuid, + api_chain_entity.APIChainStatus.is_healthy == False, + ) + ) + ) + for status in result.all(): + try: + provider = self.ap.model_mgr.provider_dict.get(status.provider_uuid) + if not provider: + continue + + is_healthy = await self._check_api_health(status, provider) + + if is_healthy: + await self._update_status( + status.uuid, + is_healthy=True, + failure_count=0, + health_check_last_failed=False, + last_success_time=datetime.now(), + last_health_check_time=datetime.now(), + last_error_message=None, + ) + self.ap.logger.info( + f'API recovered: provider={status.provider_uuid} ' + f'model={status.model_name} key_index={status.api_key_index}' + ) + else: + # Health check probe failed: mark the flag but do NOT increment failure_count + await self._update_status( + status.uuid, + health_check_last_failed=True, + last_health_check_time=datetime.now(), + ) + except Exception as e: + 
self.ap.logger.error( + f'Health check loop error for provider={status.provider_uuid} ' + f'model={status.model_name} key_index={status.api_key_index}: {e}' + ) + try: + await self._update_status( + status.uuid, + health_check_last_failed=True, + last_health_check_time=datetime.now(), + ) + except Exception: + pass + + async def _check_api_health( + self, + status: api_chain_entity.APIChainStatus, + provider: requester.RuntimeProvider, + ) -> bool: + """Check API health by making a minimal test request to the LLM endpoint. + + Returns True if the request succeeds (API is reachable and authenticated), + False otherwise. Does NOT raise exceptions. + """ + try: + temp_provider = self._create_provider_for_key(provider, status.api_key_index) + model_entity = self._resolve_model_entity(provider, None, status.model_name) + if model_entity is None: + self.ap.logger.warning( + f'Health check: no model found for provider={status.provider_uuid} ' + f'model_name={status.model_name}, skipping' + ) + return False + + temp_model = requester.RuntimeLLMModel( + model_entity=model_entity, + provider=temp_provider, + ) + test_msg = provider_message.Message(role='user', content='hi') + + await temp_provider.invoke_llm( + query=None, + model=temp_model, + messages=[test_msg], + funcs=None, + extra_args={}, + remove_think=True, + ) + return True + except Exception as e: + self.ap.logger.debug( + f'Health check request failed for provider={status.provider_uuid} ' + f'model={status.model_name} key={status.api_key_index}: {e}' + ) + return False + + # ==================== Status Helpers ==================== + + async def _ensure_status( + self, + chain_uuid: str, + provider_uuid: str, + model_name: Optional[str], + api_key_index: Optional[int], + ) -> api_chain_entity.APIChainStatus: + """Get or create a status record for the given (chain, provider, model, key) tuple""" + conditions = [ + api_chain_entity.APIChainStatus.chain_uuid == chain_uuid, + 
api_chain_entity.APIChainStatus.provider_uuid == provider_uuid, + ] + if model_name is None: + conditions.append(api_chain_entity.APIChainStatus.model_name == None) # noqa: E711 + else: + conditions.append(api_chain_entity.APIChainStatus.model_name == model_name) + + if api_key_index is None: + conditions.append(api_chain_entity.APIChainStatus.api_key_index == None) # noqa: E711 + else: + conditions.append(api_chain_entity.APIChainStatus.api_key_index == api_key_index) + + result = await self.ap.persistence_mgr.execute_async( + sqlalchemy.select(api_chain_entity.APIChainStatus).where(sqlalchemy.and_(*conditions)) + ) + existing = result.first() + if existing: + return existing + + new_uuid = str(uuid_lib.uuid4()) + await self.ap.persistence_mgr.execute_async( + sqlalchemy.insert(api_chain_entity.APIChainStatus).values( + uuid=new_uuid, + chain_uuid=chain_uuid, + provider_uuid=provider_uuid, + model_name=model_name, + api_key_index=api_key_index, + is_healthy=True, + failure_count=0, + ) + ) + result2 = await self.ap.persistence_mgr.execute_async( + sqlalchemy.select(api_chain_entity.APIChainStatus).where(api_chain_entity.APIChainStatus.uuid == new_uuid) + ) + return result2.first() + + async def _update_status( + self, + status_uuid: str, + is_healthy: Optional[bool] = None, + failure_count: Optional[int] = None, + last_failure_time: Optional[datetime] = None, + last_success_time: Optional[datetime] = None, + last_health_check_time: Optional[datetime] = None, + last_error_message: Optional[str] = None, + health_check_last_failed: Optional[bool] = None, + ): + """Update a status record by UUID""" + update_data: Dict[str, Any] = {} + if is_healthy is not None: + update_data['is_healthy'] = is_healthy + if failure_count is not None: + update_data['failure_count'] = failure_count + if last_failure_time is not None: + update_data['last_failure_time'] = last_failure_time + if last_success_time is not None: + update_data['last_success_time'] = last_success_time + if 
last_health_check_time is not None: + update_data['last_health_check_time'] = last_health_check_time + if last_error_message is not None: + update_data['last_error_message'] = last_error_message + elif is_healthy: + # Clear error message when marking healthy + update_data['last_error_message'] = None + if health_check_last_failed is not None: + update_data['health_check_last_failed'] = health_check_last_failed + + if update_data: + await self.ap.persistence_mgr.execute_async( + sqlalchemy.update(api_chain_entity.APIChainStatus) + .where(api_chain_entity.APIChainStatus.uuid == status_uuid) + .values(**update_data) + ) + + # ==================== Chain CRUD ==================== + + async def get_chain(self, chain_uuid: str) -> Optional[api_chain_entity.APIChain]: + """Get an API chain by UUID""" + return self.chains.get(chain_uuid) + + async def create_chain(self, chain_data: Dict[str, Any]) -> str: + """Create a new API chain and start its health check loop""" + chain_uuid = chain_data.get('uuid', str(uuid_lib.uuid4())) + + chain = api_chain_entity.APIChain( + uuid=chain_uuid, + name=chain_data['name'], + description=chain_data.get('description', ''), + chain_config=chain_data.get('chain_config', []), + health_check_interval=chain_data.get('health_check_interval', 300), + health_check_enabled=chain_data.get('health_check_enabled', True), + ) + + # Use explicit column values to avoid SQLAlchemy internal state pollution + await self.ap.persistence_mgr.execute_async( + sqlalchemy.insert(api_chain_entity.APIChain).values( + uuid=chain.uuid, + name=chain.name, + description=chain.description, + chain_config=chain.chain_config, + health_check_interval=chain.health_check_interval, + health_check_enabled=chain.health_check_enabled, + ) + ) + self.chains[chain_uuid] = chain + + if chain.health_check_enabled: + task = asyncio.create_task(self._health_check_loop(chain_uuid)) + self.health_check_tasks[chain_uuid] = task + + return chain_uuid + + async def update_chain(self, 
chain_uuid: str, chain_data: Dict[str, Any]): + """Update an existing API chain""" + existing = self.chains.get(chain_uuid) + + # Collect current attribute values (may come from an in-memory instance or DB) + if existing is not None: + current = { + 'uuid': existing.uuid, + 'name': existing.name, + 'description': existing.description, + 'chain_config': existing.chain_config, + 'health_check_interval': existing.health_check_interval, + 'health_check_enabled': existing.health_check_enabled, + } + else: + db_result = await self.ap.persistence_mgr.execute_async( + sqlalchemy.select(api_chain_entity.APIChain).where(api_chain_entity.APIChain.uuid == chain_uuid) + ) + row = db_result.first() + if not row: + raise ValueError(f'Chain {chain_uuid} not found') + current = { + 'uuid': row.uuid, + 'name': row.name, + 'description': row.description, + 'chain_config': row.chain_config, + 'health_check_interval': row.health_check_interval, + 'health_check_enabled': row.health_check_enabled, + } + + # Merge incoming changes + for key, value in chain_data.items(): + if key in current and key != 'uuid': + current[key] = value + + # Persist changes to DB + await self.ap.persistence_mgr.execute_async( + sqlalchemy.update(api_chain_entity.APIChain) + .where(api_chain_entity.APIChain.uuid == chain_uuid) + .values(**{k: v for k, v in chain_data.items() if k != 'uuid'}) + ) + + # Rebuild mutable in-memory instance with merged data + new_chain = api_chain_entity.APIChain( + uuid=current['uuid'], + name=current['name'], + description=current.get('description', ''), + chain_config=current.get('chain_config', []), + health_check_interval=current.get('health_check_interval', 300), + health_check_enabled=current.get('health_check_enabled', True), + ) + self.chains[chain_uuid] = new_chain + + # Cancel existing task and restart to pick up new config immediately + existing_task = self.health_check_tasks.pop(chain_uuid, None) + if existing_task is not None: + existing_task.cancel() + if 
new_chain.health_check_enabled: + task = asyncio.create_task(self._health_check_loop(chain_uuid)) + self.health_check_tasks[chain_uuid] = task + + async def delete_chain(self, chain_uuid: str): + """Delete an API chain""" + if chain_uuid in self.health_check_tasks: + self.health_check_tasks[chain_uuid].cancel() + del self.health_check_tasks[chain_uuid] + + await self.ap.persistence_mgr.execute_async( + sqlalchemy.delete(api_chain_entity.APIChain).where(api_chain_entity.APIChain.uuid == chain_uuid) + ) + await self.ap.persistence_mgr.execute_async( + sqlalchemy.delete(api_chain_entity.APIChainStatus).where( + api_chain_entity.APIChainStatus.chain_uuid == chain_uuid + ) + ) + self.chains.pop(chain_uuid, None) + + # ==================== Invoke Helpers ==================== + + def _build_invoke_tasks( + self, + model_configs: List[Dict[str, Any]], + ) -> List[Tuple[Optional[str], Optional[int]]]: + """Build an ordered list of (model_name, api_key_index) tuples to try. + + Returns [(None, None)] when model_configs is empty, meaning the caller's + original model and round-robin key rotation will be used (legacy behaviour). + When api_key_indices is configured for a model, each key index becomes a + separate failover task ordered by priority. When api_key_indices is absent, + the entry uses (model_name, None) so the provider's TokenManager performs + round-robin rotation across all configured keys. 
+        """
+        if not model_configs:
+            return [(None, None)]
+
+        tasks: List[Tuple[Optional[str], Optional[int]]] = []
+        sorted_models = sorted(model_configs, key=lambda x: x.get('priority', 0))
+        for mc in sorted_models:
+            model_name: Optional[str] = mc.get('model_name') or None
+            api_key_indices: List[Dict] = mc.get('api_key_indices') or []
+            if api_key_indices:
+                # Expand each configured key index as an independent failover task
+                sorted_keys = sorted(api_key_indices, key=lambda x: x.get('priority', 0))
+                for key_config in sorted_keys:
+                    tasks.append((model_name, key_config['index']))
+            else:
+                # No specific key configured: use round-robin rotation
+                tasks.append((model_name, None))
+        return tasks if tasks else [(None, None)]
+
+    def _create_provider_for_key(
+        self,
+        provider: requester.RuntimeProvider,
+        api_key_index: Optional[int],
+    ) -> requester.RuntimeProvider:
+        """Return a provider restricted to a single API key.
+
+        Creates a lightweight wrapper with a single-token TokenManager so that
+        shared mutable state on the original provider is not modified.
+        Returns the original provider unchanged when api_key_index is None.
+        """
+        if api_key_index is None:
+            return provider
+
+        tokens = provider.token_mgr.tokens
+        if not tokens or api_key_index >= len(tokens):
+            return provider  # index out of range — fall back gracefully
+
+        single_token_mgr = token.TokenManager(
+            name=provider.token_mgr.name,
+            tokens=[tokens[api_key_index]],
+        )
+        return requester.RuntimeProvider(
+            provider_entity=provider.provider_entity,
+            token_mgr=single_token_mgr,
+            requester=provider.requester,
+        )
+
+    def _resolve_model_entity(
+        self,
+        provider: requester.RuntimeProvider,
+        default_model: Optional[requester.RuntimeLLMModel],
+        model_name: Optional[str],
+    ) -> Any:
+        """Return the model entity for model_name under the given provider.
+
+        Falls back to default_model.model_entity when model_name is None or no
+        matching model is found.
When default_model is also None, falls back to + the first available model for the provider. + """ + if not model_name: + if default_model is not None: + return default_model.model_entity + for m in self.ap.model_mgr.llm_models: + if m.model_entity.provider_uuid == provider.provider_entity.uuid: + return m.model_entity + return None + + for m in self.ap.model_mgr.llm_models: + if m.model_entity.provider_uuid == provider.provider_entity.uuid and m.model_entity.name == model_name: + return m.model_entity + + if default_model is not None: + return default_model.model_entity + for m in self.ap.model_mgr.llm_models: + if m.model_entity.provider_uuid == provider.provider_entity.uuid: + return m.model_entity + return None + + # ==================== LLM Invocation ==================== + + async def invoke_chain_llm( + self, + chain_uuid: str, + query: pipeline_query.Query, + model: Optional[requester.RuntimeLLMModel], + messages: List[provider_message.Message], + funcs: Optional[List[resource_tool.LLMTool]] = None, + extra_args: Dict[str, Any] = {}, + remove_think: bool = False, + ) -> provider_message.Message: + """Invoke LLM through API chain with per-model/per-API-key failover""" + chain = self.chains.get(chain_uuid) + if not chain: + raise ValueError(f'Chain {chain_uuid} not found') + + sorted_items = sorted(chain.chain_config, key=lambda x: x.get('priority', 0)) + last_error: Optional[Exception] = None + + for item in sorted_items: + provider_uuid: str = item['provider_uuid'] + is_aggregated: bool = item.get('is_aggregated', False) + max_retries: int = item.get('max_retries', 3) + model_configs: List[Dict] = item.get('model_configs') or [] + + provider = self.ap.model_mgr.provider_dict.get(provider_uuid) + if not provider: + self.ap.logger.warning(f'Provider {provider_uuid} not found in chain {chain_uuid}') + continue + + tasks = self._build_invoke_tasks(model_configs) + + for task_model_name, task_api_key_index in tasks: + status = await 
self._ensure_status(chain_uuid, provider_uuid, task_model_name, task_api_key_index) + + if status and not status.is_healthy and not is_aggregated: + self.ap.logger.debug( + f'Skipping unhealthy: provider={provider_uuid} model={task_model_name} key={task_api_key_index}' + ) + continue + + temp_provider = self._create_provider_for_key(provider, task_api_key_index) + model_entity = self._resolve_model_entity(provider, model, task_model_name) + if model_entity is None: + self.ap.logger.warning( + f'No model found for provider {provider_uuid} in chain {chain_uuid}, skipping' + ) + continue + temp_model = requester.RuntimeLLMModel( + model_entity=model_entity, + provider=temp_provider, + ) + + retry_count = 0 if is_aggregated else max_retries + + for attempt in range(max(1, retry_count + 1)): + try: + result = await temp_provider.invoke_llm( + query=query, + model=temp_model, + messages=messages, + funcs=funcs, + extra_args=extra_args, + remove_think=remove_think, + ) + + # Advance round-robin token rotation on success + if task_api_key_index is None: + provider.token_mgr.next_token() + + if status: + await self._update_status( + status.uuid, + is_healthy=True, + failure_count=0, + health_check_last_failed=False, + last_success_time=datetime.now(), + ) + return result + + except Exception as e: + last_error = e + self.ap.logger.warning( + f'Chain {chain_uuid} provider={provider_uuid} ' + f'model={task_model_name} key={task_api_key_index} ' + f'attempt {attempt + 1}/{max(1, retry_count + 1)} failed: {e}' + ) + # Advance round-robin token rotation on failure too + if task_api_key_index is None: + provider.token_mgr.next_token() + + if attempt + 1 >= max(1, retry_count + 1): + # All retries exhausted for this (model, key) task + if is_aggregated: + # Aggregated: track failure count but keep is_healthy=True + if status: + await self._update_status( + status.uuid, + failure_count=(status.failure_count or 0) + 1, + last_failure_time=datetime.now(), + 
last_error_message=str(e)[:1024], + ) + else: + if status: + await self._update_status( + status.uuid, + is_healthy=False, + failure_count=(status.failure_count or 0) + 1, + health_check_last_failed=False, + last_failure_time=datetime.now(), + last_error_message=str(e)[:1024], + ) + break # Move to next (model_name, key_index) task + + error_msg = f'All providers in chain {chain_uuid} failed' + if last_error: + error_msg += f': {last_error}' + raise Exception(error_msg) + + async def invoke_chain_llm_stream( + self, + chain_uuid: str, + query: pipeline_query.Query, + model: Optional[requester.RuntimeLLMModel], + messages: List[provider_message.Message], + funcs: Optional[List[resource_tool.LLMTool]] = None, + extra_args: Dict[str, Any] = {}, + remove_think: bool = False, + ) -> AsyncGenerator[provider_message.MessageChunk, None]: + """Invoke LLM stream through API chain with per-model/per-API-key failover""" + chain = self.chains.get(chain_uuid) + if not chain: + raise ValueError(f'Chain {chain_uuid} not found') + + sorted_items = sorted(chain.chain_config, key=lambda x: x.get('priority', 0)) + last_error: Optional[Exception] = None + # True if the stream started yielding and then failed mid-flight. + # In this case we must NOT fall through to the next provider because + # partial output has already been sent to the caller. 
+ failed_mid_stream: bool = False + + for item in sorted_items: + provider_uuid: str = item['provider_uuid'] + is_aggregated: bool = item.get('is_aggregated', False) + max_retries: int = item.get('max_retries', 3) + model_configs: List[Dict] = item.get('model_configs') or [] + + provider = self.ap.model_mgr.provider_dict.get(provider_uuid) + if not provider: + self.ap.logger.warning(f'Provider {provider_uuid} not found in chain {chain_uuid}') + continue + + tasks = self._build_invoke_tasks(model_configs) + + for task_model_name, task_api_key_index in tasks: + status = await self._ensure_status(chain_uuid, provider_uuid, task_model_name, task_api_key_index) + + if status and not status.is_healthy and not is_aggregated: + self.ap.logger.debug( + f'Skipping unhealthy: provider={provider_uuid} model={task_model_name} key={task_api_key_index}' + ) + continue + + temp_provider = self._create_provider_for_key(provider, task_api_key_index) + model_entity = self._resolve_model_entity(provider, model, task_model_name) + if model_entity is None: + self.ap.logger.warning( + f'No model found for provider {provider_uuid} in chain {chain_uuid}, skipping' + ) + continue + temp_model = requester.RuntimeLLMModel( + model_entity=model_entity, + provider=temp_provider, + ) + + retry_count = 0 if is_aggregated else max_retries + + for attempt in range(max(1, retry_count + 1)): + has_yielded = False + try: + async for chunk in temp_provider.invoke_llm_stream( + query=query, + model=temp_model, + messages=messages, + funcs=funcs, + extra_args=extra_args, + remove_think=remove_think, + ): + has_yielded = True + yield chunk + + # Advance round-robin token rotation on success + if task_api_key_index is None: + provider.token_mgr.next_token() + + if status: + await self._update_status( + status.uuid, + is_healthy=True, + failure_count=0, + health_check_last_failed=False, + last_success_time=datetime.now(), + ) + return + + except Exception as e: + last_error = e + self.ap.logger.warning( + 
f'Chain {chain_uuid} provider={provider_uuid} ' + f'model={task_model_name} key={task_api_key_index} ' + f'stream attempt {attempt + 1}/{max(1, retry_count + 1)} failed: {e}' + ) + # Advance round-robin token rotation on failure too + if task_api_key_index is None: + provider.token_mgr.next_token() + + if has_yielded or attempt + 1 >= max(1, retry_count + 1): + # Cannot retry if chunks were already yielded (would duplicate output), + # or all retries are exhausted for this task + if is_aggregated: + # Aggregated: track failure count but keep is_healthy=True + if status: + await self._update_status( + status.uuid, + failure_count=(status.failure_count or 0) + 1, + last_failure_time=datetime.now(), + last_error_message=str(e)[:1024], + ) + else: + if status: + await self._update_status( + status.uuid, + is_healthy=False, + failure_count=(status.failure_count or 0) + 1, + health_check_last_failed=False, + last_failure_time=datetime.now(), + last_error_message=str(e)[:1024], + ) + if has_yielded: + # Partial output already sent to caller; stop processing + # entirely to avoid mixing output from different providers. 
+ failed_mid_stream = True + break # Move to next (model_name, key_index) task + if failed_mid_stream: + break # Exit for-task loop + if failed_mid_stream: + break # Exit for-item loop + + if failed_mid_stream and last_error: + # Re-raise original exception; caller already received partial chunks + raise last_error + + error_msg = f'All providers in chain {chain_uuid} failed' + if last_error: + error_msg += f': {last_error}' + raise Exception(error_msg) diff --git a/src/langbot/pkg/provider/runners/localagent.py b/src/langbot/pkg/provider/runners/localagent.py index 52e78b9d4..a4ccbd8ee 100644 --- a/src/langbot/pkg/provider/runners/localagent.py +++ b/src/langbot/pkg/provider/runners/localagent.py @@ -119,23 +119,37 @@ async def run( remove_think = query.pipeline_config['output'].get('misc', '').get('remove-think') - use_llm_model = await self.ap.model_mgr.get_model_by_uuid(query.use_llm_model_uuid) + use_api_chain_uuid = (query.variables or {}).get('_use_api_chain_uuid') + use_llm_model = ( + None if use_api_chain_uuid else await self.ap.model_mgr.get_model_by_uuid(query.use_llm_model_uuid) + ) self.ap.logger.debug( - f'localagent req: query={query.query_id} req_messages={req_messages} use_llm_model={query.use_llm_model_uuid}' + f'localagent req: query={query.query_id} req_messages={req_messages} ' + f'use_llm_model={query.use_llm_model_uuid} use_api_chain={use_api_chain_uuid}' ) if not is_stream: # 非流式输出,直接请求 - - msg = await use_llm_model.provider.invoke_llm( - query, - use_llm_model, - req_messages, - query.use_funcs, - extra_args=use_llm_model.model_entity.extra_args, - remove_think=remove_think, - ) + if use_api_chain_uuid: + msg = await self.ap.api_chain_mgr.invoke_chain_llm( + use_api_chain_uuid, + query, + None, + req_messages, + query.use_funcs, + extra_args={}, + remove_think=remove_think, + ) + else: + msg = await use_llm_model.provider.invoke_llm( + query, + use_llm_model, + req_messages, + query.use_funcs, + 
extra_args=use_llm_model.model_entity.extra_args, + remove_think=remove_think, + ) yield msg final_msg = msg else: @@ -145,14 +159,26 @@ async def run( accumulated_content = '' # 从开始累积的所有内容 last_role = 'assistant' msg_sequence = 1 - async for msg in use_llm_model.provider.invoke_llm_stream( - query, - use_llm_model, - req_messages, - query.use_funcs, - extra_args=use_llm_model.model_entity.extra_args, - remove_think=remove_think, - ): + if use_api_chain_uuid: + stream_src = self.ap.api_chain_mgr.invoke_chain_llm_stream( + use_api_chain_uuid, + query, + None, + req_messages, + query.use_funcs, + extra_args={}, + remove_think=remove_think, + ) + else: + stream_src = use_llm_model.provider.invoke_llm_stream( + query, + use_llm_model, + req_messages, + query.use_funcs, + extra_args=use_llm_model.model_entity.extra_args, + remove_think=remove_think, + ) + async for msg in stream_src: msg_idx = msg_idx + 1 # 记录角色 @@ -253,7 +279,8 @@ async def run( req_messages.append(err_msg) self.ap.logger.debug( - f'localagent req: query={query.query_id} req_messages={req_messages} use_llm_model={query.use_llm_model_uuid}' + f'localagent req: query={query.query_id} req_messages={req_messages} ' + f'use_llm_model={query.use_llm_model_uuid} use_api_chain={use_api_chain_uuid}' ) if is_stream: @@ -263,14 +290,26 @@ async def run( last_role = 'assistant' msg_sequence = first_end_sequence - async for msg in use_llm_model.provider.invoke_llm_stream( - query, - use_llm_model, - req_messages, - query.use_funcs, - extra_args=use_llm_model.model_entity.extra_args, - remove_think=remove_think, - ): + if use_api_chain_uuid: + tool_stream_src = self.ap.api_chain_mgr.invoke_chain_llm_stream( + use_api_chain_uuid, + query, + None, + req_messages, + query.use_funcs, + extra_args={}, + remove_think=remove_think, + ) + else: + tool_stream_src = use_llm_model.provider.invoke_llm_stream( + query, + use_llm_model, + req_messages, + query.use_funcs, + extra_args=use_llm_model.model_entity.extra_args, + 
remove_think=remove_think, + ) + async for msg in tool_stream_src: msg_idx += 1 # 记录角色 @@ -319,14 +358,25 @@ async def run( ) else: # 处理完所有调用,再次请求 - msg = await use_llm_model.provider.invoke_llm( - query, - use_llm_model, - req_messages, - query.use_funcs, - extra_args=use_llm_model.model_entity.extra_args, - remove_think=remove_think, - ) + if use_api_chain_uuid: + msg = await self.ap.api_chain_mgr.invoke_chain_llm( + use_api_chain_uuid, + query, + None, + req_messages, + query.use_funcs, + extra_args={}, + remove_think=remove_think, + ) + else: + msg = await use_llm_model.provider.invoke_llm( + query, + use_llm_model, + req_messages, + query.use_funcs, + extra_args=use_llm_model.model_entity.extra_args, + remove_think=remove_think, + ) yield msg final_msg = msg diff --git a/src/langbot/pkg/provider/runners/n8nsvapi.py b/src/langbot/pkg/provider/runners/n8nsvapi.py index d177d6b81..d7ec3ccbf 100644 --- a/src/langbot/pkg/provider/runners/n8nsvapi.py +++ b/src/langbot/pkg/provider/runners/n8nsvapi.py @@ -5,8 +5,6 @@ import uuid import aiohttp -from langbot.pkg.utils import httpclient - from .. 
import runner from ...core import app import langbot_plugin.api.entities.builtin.pipeline.query as pipeline_query @@ -219,50 +217,50 @@ async def _call_webhook(self, query: pipeline_query.Query) -> typing.AsyncGenera self.ap.logger.debug('no auth') # 调用webhook - session = httpclient.get_session() - if is_stream: - # 流式请求 - async with session.post( - self.webhook_url, json=payload, headers=headers, auth=auth, timeout=self.timeout - ) as response: - if response.status != 200: - error_text = await response.text() - self.ap.logger.error(f'n8n webhook call failed: {response.status}, {error_text}') - raise Exception(f'n8n webhook call failed: {response.status}, {error_text}') - - # 处理流式响应 - async for chunk in self._process_stream_response(response): - yield chunk - else: - async with session.post( - self.webhook_url, json=payload, headers=headers, auth=auth, timeout=self.timeout - ) as response: - try: - async for chunk in self._process_stream_response(response): - output_content = chunk.content if chunk.is_final else '' - except: - # 非流式请求(保持原有逻辑) + async with aiohttp.ClientSession() as session: + if is_stream: + # 流式请求 + async with session.post( + self.webhook_url, json=payload, headers=headers, auth=auth, timeout=self.timeout + ) as response: if response.status != 200: error_text = await response.text() self.ap.logger.error(f'n8n webhook call failed: {response.status}, {error_text}') raise Exception(f'n8n webhook call failed: {response.status}, {error_text}') - # 解析响应 - response_data = await response.json() - self.ap.logger.debug(f'n8n webhook response: {response_data}') - - # 从响应中提取输出 - if self.output_key in response_data: - output_content = response_data[self.output_key] - else: - # 如果没有指定的输出键,则使用整个响应 - output_content = json.dumps(response_data, ensure_ascii=False) - - # 返回消息 - yield provider_message.Message( - role='assistant', - content=output_content, - ) + # 处理流式响应 + async for chunk in self._process_stream_response(response): + yield chunk + else: + async with 
session.post( + self.webhook_url, json=payload, headers=headers, auth=auth, timeout=self.timeout + ) as response: + try: + async for chunk in self._process_stream_response(response): + output_content = chunk.content if chunk.is_final else '' + except: + # 非流式请求(保持原有逻辑) + if response.status != 200: + error_text = await response.text() + self.ap.logger.error(f'n8n webhook call failed: {response.status}, {error_text}') + raise Exception(f'n8n webhook call failed: {response.status}, {error_text}') + + # 解析响应 + response_data = await response.json() + self.ap.logger.debug(f'n8n webhook response: {response_data}') + + # 从响应中提取输出 + if self.output_key in response_data: + output_content = response_data[self.output_key] + else: + # 如果没有指定的输出键,则使用整个响应 + output_content = json.dumps(response_data, ensure_ascii=False) + + # 返回消息 + yield provider_message.Message( + role='assistant', + content=output_content, + ) except Exception as e: self.ap.logger.error(f'n8n webhook call exception: {str(e)}') raise N8nAPIError(f'n8n webhook call exception: {str(e)}') diff --git a/src/langbot/pkg/utils/image.py b/src/langbot/pkg/utils/image.py index 5716b07d6..e07caec67 100644 --- a/src/langbot/pkg/utils/image.py +++ b/src/langbot/pkg/utils/image.py @@ -5,8 +5,6 @@ import ssl import aiohttp - -from langbot.pkg.utils import httpclient import PIL.Image import httpx @@ -49,54 +47,53 @@ async def get_gewechat_image_base64( ) try: - session = httpclient.get_session() - # 获取图片下载链接 - try: - async with session.post( - f'{gewechat_url}/v2/api/message/downloadImage', - headers=headers, - json={'appId': app_id, 'type': image_type, 'xml': xml_content}, - timeout=timeout, - ) as response: - if response.status != 200: - # print(response) - raise Exception(f'获取gewechat图片下载失败: {await response.text()}') - - resp_data = await response.json() - if resp_data.get('ret') != 200: - raise Exception(f'获取gewechat图片下载链接失败: {resp_data}') - - file_url = resp_data['data']['fileUrl'] - except asyncio.TimeoutError: - raise 
Exception('获取图片下载链接超时') - except aiohttp.ClientError as e: - raise Exception(f'获取图片下载链接网络错误: {str(e)}') - - # 解析原始URL并替换端口 - base_url = gewechat_file_url - download_url = f'{base_url}/download/{file_url}' - - # 下载图片 - try: - async with session.get(download_url) as img_response: - if img_response.status != 200: - raise Exception(f'下载图片失败: {await img_response.text()}, URL: {download_url}') - - image_data = await img_response.read() - - content_type = img_response.headers.get('Content-Type', '') - if content_type: - image_format = content_type.split('/')[-1] - else: - image_format = file_url.split('.')[-1] - - base64_str = base64.b64encode(image_data).decode('utf-8') - - return base64_str, image_format - except asyncio.TimeoutError: - raise Exception(f'下载图片超时, URL: {download_url}') - except aiohttp.ClientError as e: - raise Exception(f'下载图片网络错误: {str(e)}, URL: {download_url}') + async with aiohttp.ClientSession(timeout=timeout) as session: + # 获取图片下载链接 + try: + async with session.post( + f'{gewechat_url}/v2/api/message/downloadImage', + headers=headers, + json={'appId': app_id, 'type': image_type, 'xml': xml_content}, + ) as response: + if response.status != 200: + # print(response) + raise Exception(f'获取gewechat图片下载失败: {await response.text()}') + + resp_data = await response.json() + if resp_data.get('ret') != 200: + raise Exception(f'获取gewechat图片下载链接失败: {resp_data}') + + file_url = resp_data['data']['fileUrl'] + except asyncio.TimeoutError: + raise Exception('获取图片下载链接超时') + except aiohttp.ClientError as e: + raise Exception(f'获取图片下载链接网络错误: {str(e)}') + + # 解析原始URL并替换端口 + base_url = gewechat_file_url + download_url = f'{base_url}/download/{file_url}' + + # 下载图片 + try: + async with session.get(download_url) as img_response: + if img_response.status != 200: + raise Exception(f'下载图片失败: {await img_response.text()}, URL: {download_url}') + + image_data = await img_response.read() + + content_type = img_response.headers.get('Content-Type', '') + if content_type: + 
image_format = content_type.split('/')[-1] + else: + image_format = file_url.split('.')[-1] + + base64_str = base64.b64encode(image_data).decode('utf-8') + + return base64_str, image_format + except asyncio.TimeoutError: + raise Exception(f'下载图片超时, URL: {download_url}') + except aiohttp.ClientError as e: + raise Exception(f'下载图片网络错误: {str(e)}, URL: {download_url}') except Exception as e: raise Exception(f'获取图片失败: {str(e)}') from e @@ -107,24 +104,24 @@ async def get_wecom_image_base64(pic_url: str) -> tuple[str, str]: :param pic_url: 企业微信图片URL :return: (base64_str, image_format) """ - session = httpclient.get_session() - async with session.get(pic_url) as response: - if response.status != 200: - raise Exception(f'Failed to download image: {response.status}') + async with aiohttp.ClientSession() as session: + async with session.get(pic_url) as response: + if response.status != 200: + raise Exception(f'Failed to download image: {response.status}') - # 读取图片数据 - image_data = await response.read() + # 读取图片数据 + image_data = await response.read() - # 获取图片格式 - content_type = response.headers.get('Content-Type', '') - image_format = content_type.split('/')[-1] # 例如 'image/jpeg' -> 'jpeg' + # 获取图片格式 + content_type = response.headers.get('Content-Type', '') + image_format = content_type.split('/')[-1] # 例如 'image/jpeg' -> 'jpeg' - # 转换为 base64 - import base64 + # 转换为 base64 + import base64 - image_base64 = base64.b64encode(image_data).decode('utf-8') + image_base64 = base64.b64encode(image_data).decode('utf-8') - return image_base64, image_format + return image_base64, image_format async def get_qq_official_image_base64(pic_url: str, content_type: str) -> tuple[str, str]: @@ -155,19 +152,21 @@ async def get_qq_image_bytes(image_url: str, query: dict = {}) -> tuple[bytes, s ssl_context = ssl.create_default_context() ssl_context.check_hostname = False ssl_context.verify_mode = ssl.CERT_NONE - session = httpclient.get_session() - async with session.get(image_url, params=query, 
ssl=ssl_context, timeout=aiohttp.ClientTimeout(total=30.0)) as resp: - resp.raise_for_status() - file_bytes = await resp.read() - content_type = resp.headers.get('Content-Type') - if not content_type: - image_format = 'jpeg' - elif not content_type.startswith('image/'): - pil_img = PIL.Image.open(io.BytesIO(file_bytes)) - image_format = pil_img.format.lower() - else: - image_format = content_type.split('/')[-1] - return file_bytes, image_format + async with aiohttp.ClientSession(trust_env=False) as session: + async with session.get( + image_url, params=query, ssl=ssl_context, timeout=aiohttp.ClientTimeout(total=30.0) + ) as resp: + resp.raise_for_status() + file_bytes = await resp.read() + content_type = resp.headers.get('Content-Type') + if not content_type: + image_format = 'jpeg' + elif not content_type.startswith('image/'): + pil_img = PIL.Image.open(io.BytesIO(file_bytes)) + image_format = pil_img.format.lower() + else: + image_format = content_type.split('/')[-1] + return file_bytes, image_format async def qq_image_url_to_base64(image_url: str) -> typing.Tuple[str, str]: @@ -205,11 +204,11 @@ async def extract_b64_and_format(image_base64_data: str) -> typing.Tuple[str, st async def get_slack_image_to_base64(pic_url: str, bot_token: str): headers = {'Authorization': f'Bearer {bot_token}'} try: - session = httpclient.get_session() - async with session.get(pic_url, headers=headers) as resp: - mime_type = resp.headers.get('Content-Type', 'application/octet-stream') - file_bytes = await resp.read() - base64_str = base64.b64encode(file_bytes).decode('utf-8') - return f'data:{mime_type};base64,{base64_str}' + async with aiohttp.ClientSession() as session: + async with session.get(pic_url, headers=headers) as resp: + mime_type = resp.headers.get('Content-Type', 'application/octet-stream') + file_bytes = await resp.read() + base64_str = base64.b64encode(file_bytes).decode('utf-8') + return f'data:{mime_type};base64,{base64_str}' except Exception as e: raise (e) diff 
--git a/src/langbot/templates/metadata/pipeline/ai.yaml b/src/langbot/templates/metadata/pipeline/ai.yaml index 7a13b2b14..974684475 100644 --- a/src/langbot/templates/metadata/pipeline/ai.yaml +++ b/src/langbot/templates/metadata/pipeline/ai.yaml @@ -57,9 +57,9 @@ stages: config: - name: model label: - en_US: Model - zh_Hans: 模型 - type: llm-model-selector + en_US: Model / API Chain + zh_Hans: 模型 / API 链 + type: model-or-api-chain-selector required: true - name: max-round label: diff --git a/web/eslint.config.mjs b/web/eslint.config.mjs index 18b74c95d..d9a1d0e10 100644 --- a/web/eslint.config.mjs +++ b/web/eslint.config.mjs @@ -11,6 +11,9 @@ const compat = new FlatCompat({ }); const eslintConfig = [ + { + ignores: ['.next/**', 'node_modules/**'], + }, ...compat.extends('next/core-web-vitals', 'next/typescript'), eslintPluginPrettierRecommended, ]; diff --git a/web/src/app/home/bots/components/bot-form/BotForm.tsx b/web/src/app/home/bots/components/bot-form/BotForm.tsx index d2ca22d79..1e2439575 100644 --- a/web/src/app/home/bots/components/bot-form/BotForm.tsx +++ b/web/src/app/home/bots/components/bot-form/BotForm.tsx @@ -124,12 +124,6 @@ export default function BotForm({ const currentAdapter = form.watch('adapter'); const currentAdapterConfig = form.watch('adapter_config'); - // Serialize adapter_config to a stable string so it can be used as a - // useEffect dependency without triggering on every render. form.watch() - // returns a new object reference each time, which would otherwise cause - // the filtering effect below to loop indefinitely. 
- const adapterConfigJson = JSON.stringify(currentAdapterConfig); - useEffect(() => { setBotFormValues(); }, []); @@ -153,7 +147,7 @@ export default function BotForm({ // For non-Lark adapters, show all fields setFilteredDynamicFormConfigList(dynamicFormConfigList); } - }, [currentAdapter, adapterConfigJson, dynamicFormConfigList]); + }, [currentAdapter, currentAdapterConfig, dynamicFormConfigList]); // 复制到剪贴板的辅助函数 - 使用页面上的真实input元素 const copyToClipboard = () => { diff --git a/web/src/app/home/components/api-chains-dialog/APIChainCard.tsx b/web/src/app/home/components/api-chains-dialog/APIChainCard.tsx new file mode 100644 index 000000000..9d7cb3e27 --- /dev/null +++ b/web/src/app/home/components/api-chains-dialog/APIChainCard.tsx @@ -0,0 +1,495 @@ +'use client'; + +import { + APIChain, + APIChainStatus, + LLMModel, + ModelProvider, +} from '@/app/infra/entities/api'; +import { Card, CardContent } from '@/components/ui/card'; +import { Button } from '@/components/ui/button'; +import { + Edit, + Trash2, + ChevronDown, + ChevronRight, + AlertCircle, + CheckCircle2, + AlertTriangle, +} from 'lucide-react'; +import { useState, useMemo } from 'react'; +import { useTranslation } from 'react-i18next'; +import { cn } from '@/lib/utils'; + +interface APIChainCardProps { + chain: APIChain; + providers: ModelProvider[]; + llmModels: LLMModel[]; + onEdit: () => void; + onDelete: () => void; +} + +function calculateHealthPercentage( + statuses: APIChainStatus[] | undefined, + chainConfig: APIChain['chain_config'], +): number { + if (!statuses || statuses.length === 0 || chainConfig.length === 0) + return 100; + // Collect UUIDs of aggregated providers so their statuses are excluded from + // the unhealthy calculation (they never become unhealthy by design). 
+ const aggregatedUuids = new Set( + chainConfig.filter((c) => c.is_aggregated).map((c) => c.provider_uuid), + ); + const trackable = statuses.filter( + (s) => !aggregatedUuids.has(s.provider_uuid), + ); + if (trackable.length === 0) return 100; + const healthyCount = trackable.filter((s) => s.is_healthy).length; + return Math.round((healthyCount / trackable.length) * 100); +} + +function getErrorStats(statuses: APIChainStatus[] | undefined): { + totalFailures: number; +} { + if (!statuses || statuses.length === 0) return { totalFailures: 0 }; + return { + totalFailures: statuses.reduce((sum, s) => sum + (s.failure_count || 0), 0), + }; +} + +function getHealthColorClass(healthPercentage: number): string { + if (healthPercentage === 0) return 'border-destructive bg-destructive/5'; + if (healthPercentage < 50) return 'border-yellow-500 bg-yellow-500/5'; + return ''; +} + +function getHealthIcon(healthPercentage: number) { + if (healthPercentage === 0) + return ; + if (healthPercentage < 50) + return ; + return ; +} + +export default function APIChainCard({ + chain, + providers, + llmModels: _llmModels, // eslint-disable-line @typescript-eslint/no-unused-vars + onEdit, + onDelete, +}: APIChainCardProps) { + const { t } = useTranslation(); + const [expanded, setExpanded] = useState(false); + + const getProviderName = (uuid: string) => + providers.find((p) => p.uuid === uuid)?.name ?? 
uuid; + + const sortedConfigs = [...chain.chain_config].sort( + (a, b) => a.priority - b.priority, + ); + + const healthPercentage = useMemo( + () => calculateHealthPercentage(chain.statuses, chain.chain_config), + [chain.statuses, chain.chain_config], + ); + + const { totalFailures } = useMemo( + () => getErrorStats(chain.statuses), + [chain.statuses], + ); + + /** Get all status records for a given (provider, model_name, api_key_index) combination */ + function getStatus( + providerUuid: string, + modelName: string | null, + apiKeyIndex: number | null, + ): APIChainStatus | undefined { + return chain.statuses?.find( + (s) => + s.provider_uuid === providerUuid && + (s.model_name ?? null) === modelName && + (s.api_key_index ?? null) === apiKeyIndex, + ); + } + + /** Get all status records for a provider (any granularity) */ + function getProviderStatuses(providerUuid: string): APIChainStatus[] { + return ( + chain.statuses?.filter((s) => s.provider_uuid === providerUuid) ?? [] + ); + } + + /** Compute provider-level health summary */ + function providerHealthSummary( + providerUuid: string, + isAggregated: boolean, + ): { healthy: number; total: number } { + // Aggregated providers never become unhealthy by design; always report full health. + if (isAggregated) return { healthy: 1, total: 1 }; + const ss = getProviderStatuses(providerUuid); + if (ss.length === 0) return { healthy: 1, total: 1 }; // assume healthy if no data + return { healthy: ss.filter((s) => s.is_healthy).length, total: ss.length }; + } + + return ( + + + {/* Header */} +
+
+
+ +

{chain.name}

+ {getHealthIcon(healthPercentage)} + + {healthPercentage}% + +
+ {chain.description && ( +

+ {chain.description} +

+ )} +
+ {t('apiChains.providerCount', { + count: chain.chain_config.length, + })} +
+
+
+ + +
+
+ + {/* Expanded: per-provider / per-model / per-key health */} + {expanded && ( +
+ {sortedConfigs.map((config, index) => { + const { healthy, total } = providerHealthSummary( + config.provider_uuid, + config.is_aggregated, + ); + const providerHealthy = healthy === total; + const modelConfigs = config.model_configs ?? []; + + return ( +
+ {/* Provider row */} +
+ + {index + 1}. {getProviderName(config.provider_uuid)} + + {config.is_aggregated && ( + + {t('apiChains.aggregation')} + + )} + + {providerHealthy + ? t('apiChains.healthy') + : `${healthy}/${total}`} + +
+ + {/* Per-model breakdown */} + {modelConfigs.length > 0 ? ( +
+ {[...modelConfigs] + .sort((a, b) => a.priority - b.priority) + .map((mc, mi) => { + // ── Aggregated mode ────────────────────────────────────────── + // Aggregated providers never become unhealthy and are not subject + // to health checks. After retries are exhausted the chain simply + // moves to the next model. Always render a green "healthy" badge + // and omit the per-key sub-list (not meaningful here). + if (config.is_aggregated) { + // Sum failure counts across all key variants for display. + const aggStatuses = [ + getStatus( + config.provider_uuid, + mc.model_name, + null, + ), + ...(mc.api_key_indices ?? []).map((k) => + getStatus( + config.provider_uuid, + mc.model_name, + k.index, + ), + ), + ].filter(Boolean) as APIChainStatus[]; + const aggFailures = aggStatuses.reduce( + (sum, s) => sum + (s.failure_count || 0), + 0, + ); + return ( +
+
+ + #{mi + 1} + + + {mc.model_name} + + + {t('apiChains.healthy')} + + {aggFailures > 0 && ( + + {t('apiChains.failureCount')}:{' '} + {aggFailures} + + )} +
+
+ ); + } + + // ── Non-aggregated mode ────────────────────────────────────── + // When api_key_indices are configured, look up the status for + // each specific key; otherwise fall back to the round-robin + // (api_key_index=null) record. + const apiKeyIndices = mc.api_key_indices ?? []; + const relevantStatuses: APIChainStatus[] = + apiKeyIndices.length > 0 + ? (apiKeyIndices + .map((k) => + getStatus( + config.provider_uuid, + mc.model_name, + k.index, + ), + ) + .filter(Boolean) as APIChainStatus[]) + : ([ + getStatus( + config.provider_uuid, + mc.model_name, + null, + ), + ].filter(Boolean) as APIChainStatus[]); + const modelHealthy = + relevantStatuses.length === 0 || + relevantStatuses.every((s) => s.is_healthy); + const totalFailures = relevantStatuses.reduce( + (sum, s) => sum + (s.failure_count || 0), + 0, + ); + const modelHcFailed = relevantStatuses.some( + (s) => + !s.is_healthy && !!s.health_check_last_failed, + ); + const modelLastError = relevantStatuses.find( + (s) => + s.last_error_message && + !s.health_check_last_failed, + )?.last_error_message; + return ( +
+
+ + #{mi + 1} + + + {mc.model_name} + + + {modelHealthy + ? t('apiChains.healthy') + : t('apiChains.unhealthy')} + + {/* health check failed badge */} + {!modelHealthy && modelHcFailed && ( + + {t('apiChains.healthCheckFailed')} + + )} + {totalFailures > 0 && ( + + {t('apiChains.failureCount')}:{' '} + {totalFailures} + + )} +
+ {modelLastError && ( +

+ {t('apiChains.lastError')}: {modelLastError} +

+ )} + {/* Per-key sub-list when api_key_indices are configured */} + {apiKeyIndices.length > 0 && ( +
+ {[...apiKeyIndices] + .sort((a, b) => a.priority - b.priority) + .map((k) => { + const kst = getStatus( + config.provider_uuid, + mc.model_name, + k.index, + ); + const keyHealthy = kst + ? kst.is_healthy + : true; + return ( +
+ + key[{k.index}] + + + {keyHealthy + ? t('apiChains.healthy') + : t('apiChains.unhealthy')} + + {kst && + !kst.is_healthy && + kst.health_check_last_failed && ( + + {t( + 'apiChains.healthCheckFailed', + )} + + )} + {kst && kst.failure_count > 0 && ( + + {kst.failure_count}× + + )} +
+ ); + })} +
+ )} +
+ ); + })} +
+ ) : ( + /* No model configs: show provider-level status detail */ +
+
+ {t('apiChains.maxRetries')}: {config.max_retries} +
+
+ {t('apiChains.timeout')}: {config.timeout_ms}ms +
+ {(() => { + const st = getStatus(config.provider_uuid, null, null); + if (!st) return null; + return ( + <> + {/* health check failed badge (only for non-aggregated unhealthy) */} + {!st.is_healthy && st.health_check_last_failed && ( +
+ ⚠ {t('apiChains.healthCheckFailed')} +
+ )} + {st.failure_count > 0 && ( +
+ {t('apiChains.failureCount')}:{' '} + {st.failure_count} +
+ )} + {st.last_error_message && + !st.health_check_last_failed && ( +
+ {t('apiChains.lastError')}:{' '} + {st.last_error_message} +
+ )} + + ); + })()} +
+ )} +
+ ); + })} +
+ )} + + {/* Bottom summary */} +
+ 0 && 'text-destructive')}> + {t('apiChains.errorCount')}: {totalFailures} + +
+
+
+ ); +} diff --git a/web/src/app/home/components/api-chains-dialog/APIChainForm.tsx b/web/src/app/home/components/api-chains-dialog/APIChainForm.tsx new file mode 100644 index 000000000..39568c956 --- /dev/null +++ b/web/src/app/home/components/api-chains-dialog/APIChainForm.tsx @@ -0,0 +1,665 @@ +'use client'; + +import { useState, useEffect } from 'react'; +import { httpClient } from '@/app/infra/http/HttpClient'; +import { + APIChainItem, + APIChainModelConfig, + LLMModel, + ModelProvider, +} from '@/app/infra/entities/api'; +import { Button } from '@/components/ui/button'; +import { Input } from '@/components/ui/input'; +import { Label } from '@/components/ui/label'; +import { Textarea } from '@/components/ui/textarea'; +import { Switch } from '@/components/ui/switch'; +import { + Select, + SelectContent, + SelectItem, + SelectTrigger, + SelectValue, +} from '@/components/ui/select'; +import { toast } from 'sonner'; +import { useTranslation } from 'react-i18next'; +import { + Plus, + Trash2, + GripVertical, + ChevronDown, + ChevronRight, +} from 'lucide-react'; + +interface APIChainFormProps { + chainId?: string; + providers: ModelProvider[]; + llmModels: LLMModel[]; + onFormSubmit: () => void; + onFormCancel: () => void; +} + +export default function APIChainForm({ + chainId, + providers, + llmModels, + onFormSubmit, + onFormCancel, +}: APIChainFormProps) { + const { t } = useTranslation(); + const [loading, setLoading] = useState(false); + const [name, setName] = useState(''); + const [description, setDescription] = useState(''); + const [chainConfig, setChainConfig] = useState([]); + const [healthCheckEnabled, setHealthCheckEnabled] = useState(true); + const [healthCheckInterval, setHealthCheckInterval] = useState(300); + /** Track which provider item has model_configs expanded */ + const [expandedModelConfigs, setExpandedModelConfigs] = useState>( + new Set(), + ); + /** Track which provider item has advanced config expanded */ + const [expandedAdvanced, 
setExpandedAdvanced] = useState>( + new Set(), + ); + + useEffect(() => { + if (chainId) { + loadChain(); + } else { + setChainConfig([ + { + provider_uuid: '', + priority: 1, + is_aggregated: false, + max_retries: 3, + timeout_ms: 30000, + model_configs: [], + }, + ]); + } + }, [chainId]); + + async function loadChain() { + try { + setLoading(true); + const resp = await httpClient.getAPIChain(chainId!); + setName(resp.chain.name); + setDescription(resp.chain.description || ''); + setChainConfig(resp.chain.chain_config); + setHealthCheckEnabled(resp.chain.health_check_enabled); + setHealthCheckInterval(resp.chain.health_check_interval); + } catch (err) { + toast.error(t('apiChains.loadError') + ': ' + (err as Error).message); + } finally { + setLoading(false); + } + } + + /** Return models belonging to the given provider */ + function modelsForProvider(providerUuid: string): LLMModel[] { + return llmModels.filter((m) => m.provider_uuid === providerUuid); + } + + // ---- Provider item CRUD ---- + + function addProvider() { + const maxPriority = Math.max(...chainConfig.map((c) => c.priority), 0); + setChainConfig([ + ...chainConfig, + { + provider_uuid: '', + priority: maxPriority + 1, + is_aggregated: false, + max_retries: 3, + timeout_ms: 30000, + model_configs: [], + }, + ]); + } + + function removeProvider(index: number) { + const newConfig = chainConfig.filter((_, i) => i !== index); + newConfig.forEach((c, i) => { + c.priority = i + 1; + }); + setChainConfig(newConfig); + setExpandedModelConfigs((prev) => { + const next = new Set(); + prev.forEach((v) => { + if (v < index) next.add(v); + else if (v > index) next.add(v - 1); + }); + return next; + }); + setExpandedAdvanced((prev) => { + const next = new Set(); + prev.forEach((v) => { + if (v < index) next.add(v); + else if (v > index) next.add(v - 1); + }); + return next; + }); + } + + function updateProvider( + index: number, + field: keyof APIChainItem, + value: string | number | boolean, + ) { + const 
newConfig = [...chainConfig]; + newConfig[index] = { ...newConfig[index], [field]: value }; + // If provider changes, reset model_configs + if (field === 'provider_uuid') { + newConfig[index].model_configs = []; + } + setChainConfig(newConfig); + } + + function moveProvider(index: number, direction: 'up' | 'down') { + if ( + (direction === 'up' && index === 0) || + (direction === 'down' && index === chainConfig.length - 1) + ) + return; + const newConfig = [...chainConfig]; + const target = direction === 'up' ? index - 1 : index + 1; + [newConfig[index], newConfig[target]] = [ + newConfig[target], + newConfig[index], + ]; + newConfig.forEach((c, i) => { + c.priority = i + 1; + }); + setChainConfig(newConfig); + } + + // ---- Model config CRUD ---- + + function addModelConfig(providerIndex: number) { + const newConfig = [...chainConfig]; + const existing = newConfig[providerIndex].model_configs ?? []; + const maxPriority = Math.max(...existing.map((m) => m.priority), 0); + newConfig[providerIndex] = { + ...newConfig[providerIndex], + model_configs: [ + ...existing, + { model_name: '', priority: maxPriority + 1 }, + ], + }; + setChainConfig(newConfig); + } + + function removeModelConfig(providerIndex: number, modelIndex: number) { + const newConfig = [...chainConfig]; + const existing = (newConfig[providerIndex].model_configs ?? []).filter( + (_, i) => i !== modelIndex, + ); + existing.forEach((m, i) => { + m.priority = i + 1; + }); + newConfig[providerIndex] = { + ...newConfig[providerIndex], + model_configs: existing, + }; + setChainConfig(newConfig); + } + + function updateModelConfig( + providerIndex: number, + modelIndex: number, + field: keyof APIChainModelConfig, + value: string | number | boolean, + ) { + const newConfig = [...chainConfig]; + const models = [...(newConfig[providerIndex].model_configs ?? 
[])]; + models[modelIndex] = { ...models[modelIndex], [field]: value }; + newConfig[providerIndex] = { + ...newConfig[providerIndex], + model_configs: models, + }; + setChainConfig(newConfig); + } + + function moveModelConfig( + providerIndex: number, + modelIndex: number, + direction: 'up' | 'down', + ) { + const models = [...(chainConfig[providerIndex].model_configs ?? [])]; + if ( + (direction === 'up' && modelIndex === 0) || + (direction === 'down' && modelIndex === models.length - 1) + ) + return; + const target = direction === 'up' ? modelIndex - 1 : modelIndex + 1; + [models[modelIndex], models[target]] = [models[target], models[modelIndex]]; + models.forEach((m, i) => { + m.priority = i + 1; + }); + const newConfig = [...chainConfig]; + newConfig[providerIndex] = { + ...newConfig[providerIndex], + model_configs: models, + }; + setChainConfig(newConfig); + } + + // ---- Submit ---- + + async function handleSubmit() { + if (!name.trim()) { + toast.error(t('apiChains.nameRequired')); + return; + } + if (chainConfig.length === 0) { + toast.error(t('apiChains.atLeastOneProvider')); + return; + } + for (const config of chainConfig) { + if (!config.provider_uuid) { + toast.error(t('apiChains.selectAllProviders')); + return; + } + for (const mc of config.model_configs ?? []) { + if (!mc.model_name) { + toast.error(t('apiChains.selectAllModels')); + return; + } + } + } + + setLoading(true); + try { + const data = { + name, + description: description || undefined, + chain_config: chainConfig, + health_check_enabled: healthCheckEnabled, + health_check_interval: healthCheckInterval, + }; + + if (chainId) { + await httpClient.updateAPIChain(chainId, data); + toast.success(t('apiChains.updateSuccess')); + } else { + await httpClient.createAPIChain(data); + toast.success(t('apiChains.createSuccess')); + } + onFormSubmit(); + } catch (err) { + toast.error( + t(chainId ? 
'apiChains.updateError' : 'apiChains.createError') + + ': ' + + (err as Error).message, + ); + } finally { + setLoading(false); + } + } + + return ( +
+ {/* Name */} +
+ + setName(e.target.value)} + placeholder={t('apiChains.namePlaceholder')} + /> +
+ + {/* Description */} +
+ +